Versions of command-r using either the default system prompt or the rag/tool use prompt suggested by Cohere.
35B
155 Pulls Updated 5 months ago
8a9611e7bca1 · 20GB
-
general.architecturecommand-r
-
general.file_typeQ4_0
-
command-r.attention.head_count64
-
command-r.attention.head_count_kv64
-
command-r.attention.layer_norm_epsilon1e-05
-
command-r.block_count40
-
command-r.context_length131072
-
command-r.embedding_length8192
-
command-r.feed_forward_length22528
-
command-r.logit_scale0.0625
-
command-r.rope.freq_base8e+06
-
command-r.rope.scaling.typenone
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.bos_token_id5
-
tokenizer.ggml.eos_token_id255001
-
tokenizer.ggml.merges[Ġ Ġ Ġ t e r i n Ġ a ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id0
-
tokenizer.ggml.token_type[3 3 3 3 3 ...]
-
tokenizer.ggml.tokens[<PAD> <UNK> <CLS> <SEP> <MASK_TOKEN> ...]
-
NameTypeShape
-
token_embd.weightQ6_K[8192 256000]
-
blk.0.attn_k.weightQ4_0[8192 8192]
-
blk.0.attn_output.weightQ4_0[8192 8192]
-
blk.0.attn_q.weightQ4_0[8192 8192]
-
blk.0.attn_v.weightQ4_0[8192 8192]
-
blk.0.attn_norm.weightF32[8192]
-
blk.0.ffn_down.weightQ4_0[22528 8192]
-
blk.0.ffn_gate.weightQ4_0[8192 22528]
-
blk.0.ffn_up.weightQ4_0[8192 22528]
-
blk.1.attn_norm.weightF32[8192]
-
blk.1.ffn_down.weightQ4_0[22528 8192]
-
blk.1.ffn_gate.weightQ4_0[8192 22528]
-
blk.1.ffn_up.weightQ4_0[8192 22528]
-
blk.1.attn_k.weightQ4_0[8192 8192]
-
blk.1.attn_output.weightQ4_0[8192 8192]
-
blk.1.attn_q.weightQ4_0[8192 8192]
-
blk.1.attn_v.weightQ4_0[8192 8192]
-
blk.2.attn_norm.weightF32[8192]
-
blk.2.ffn_down.weightQ4_0[22528 8192]
-
blk.2.ffn_gate.weightQ4_0[8192 22528]
-
blk.2.ffn_up.weightQ4_0[8192 22528]
-
blk.2.attn_k.weightQ4_0[8192 8192]
-
blk.2.attn_output.weightQ4_0[8192 8192]
-
blk.2.attn_q.weightQ4_0[8192 8192]
-
blk.2.attn_v.weightQ4_0[8192 8192]
-
blk.3.attn_k.weightQ4_0[8192 8192]
-
blk.3.attn_output.weightQ4_0[8192 8192]
-
blk.3.attn_q.weightQ4_0[8192 8192]
-
blk.3.attn_v.weightQ4_0[8192 8192]
-
blk.3.attn_norm.weightF32[8192]
-
blk.3.ffn_down.weightQ4_0[22528 8192]
-
blk.3.ffn_gate.weightQ4_0[8192 22528]
-
blk.3.ffn_up.weightQ4_0[8192 22528]
-
blk.4.attn_norm.weightF32[8192]
-
blk.4.ffn_down.weightQ4_0[22528 8192]
-
blk.4.ffn_gate.weightQ4_0[8192 22528]
-
blk.4.ffn_up.weightQ4_0[8192 22528]
-
blk.4.attn_k.weightQ4_0[8192 8192]
-
blk.4.attn_output.weightQ4_0[8192 8192]
-
blk.4.attn_q.weightQ4_0[8192 8192]
-
blk.4.attn_v.weightQ4_0[8192 8192]
-
blk.5.attn_norm.weightF32[8192]
-
blk.5.ffn_down.weightQ4_0[22528 8192]
-
blk.5.ffn_gate.weightQ4_0[8192 22528]
-
blk.5.ffn_up.weightQ4_0[8192 22528]
-
blk.5.attn_k.weightQ4_0[8192 8192]
-
blk.5.attn_output.weightQ4_0[8192 8192]
-
blk.5.attn_q.weightQ4_0[8192 8192]
-
blk.5.attn_v.weightQ4_0[8192 8192]
-
blk.6.attn_k.weightQ4_0[8192 8192]
-
blk.6.attn_output.weightQ4_0[8192 8192]
-
blk.6.attn_q.weightQ4_0[8192 8192]
-
blk.6.attn_v.weightQ4_0[8192 8192]
-
blk.6.attn_norm.weightF32[8192]
-
blk.6.ffn_down.weightQ4_0[22528 8192]
-
blk.6.ffn_gate.weightQ4_0[8192 22528]
-
blk.6.ffn_up.weightQ4_0[8192 22528]
-
blk.7.attn_norm.weightF32[8192]
-
blk.7.ffn_down.weightQ4_0[22528 8192]
-
blk.7.ffn_gate.weightQ4_0[8192 22528]
-
blk.7.ffn_up.weightQ4_0[8192 22528]
-
blk.7.attn_k.weightQ4_0[8192 8192]
-
blk.7.attn_output.weightQ4_0[8192 8192]
-
blk.7.attn_q.weightQ4_0[8192 8192]
-
blk.7.attn_v.weightQ4_0[8192 8192]
-
blk.8.attn_norm.weightF32[8192]
-
blk.8.ffn_down.weightQ4_0[22528 8192]
-
blk.8.ffn_gate.weightQ4_0[8192 22528]
-
blk.8.ffn_up.weightQ4_0[8192 22528]
-
blk.8.attn_k.weightQ4_0[8192 8192]
-
blk.8.attn_output.weightQ4_0[8192 8192]
-
blk.8.attn_q.weightQ4_0[8192 8192]
-
blk.8.attn_v.weightQ4_0[8192 8192]
-
blk.9.attn_k.weightQ4_0[8192 8192]
-
blk.9.attn_output.weightQ4_0[8192 8192]
-
blk.9.attn_q.weightQ4_0[8192 8192]
-
blk.9.attn_v.weightQ4_0[8192 8192]
-
blk.9.attn_norm.weightF32[8192]
-
blk.9.ffn_down.weightQ4_0[22528 8192]
-
blk.9.ffn_gate.weightQ4_0[8192 22528]
-
blk.9.ffn_up.weightQ4_0[8192 22528]
-
blk.10.attn_norm.weightF32[8192]
-
blk.10.ffn_down.weightQ4_0[22528 8192]
-
blk.10.ffn_gate.weightQ4_0[8192 22528]
-
blk.10.ffn_up.weightQ4_0[8192 22528]
-
blk.10.attn_k.weightQ4_0[8192 8192]
-
blk.10.attn_output.weightQ4_0[8192 8192]
-
blk.10.attn_q.weightQ4_0[8192 8192]
-
blk.10.attn_v.weightQ4_0[8192 8192]
-
blk.11.attn_norm.weightF32[8192]
-
blk.11.ffn_down.weightQ4_0[22528 8192]
-
blk.11.ffn_gate.weightQ4_0[8192 22528]
-
blk.11.ffn_up.weightQ4_0[8192 22528]
-
blk.11.attn_k.weightQ4_0[8192 8192]
-
blk.11.attn_output.weightQ4_0[8192 8192]
-
blk.11.attn_q.weightQ4_0[8192 8192]
-
blk.11.attn_v.weightQ4_0[8192 8192]
-
blk.12.attn_k.weightQ4_0[8192 8192]
-
blk.12.attn_output.weightQ4_0[8192 8192]
-
blk.12.attn_q.weightQ4_0[8192 8192]
-
blk.12.attn_v.weightQ4_0[8192 8192]
-
blk.12.attn_norm.weightF32[8192]
-
blk.12.ffn_down.weightQ4_0[22528 8192]
-
blk.12.ffn_gate.weightQ4_0[8192 22528]
-
blk.12.ffn_up.weightQ4_0[8192 22528]
-
blk.13.attn_norm.weightF32[8192]
-
blk.13.ffn_down.weightQ4_0[22528 8192]
-
blk.13.ffn_gate.weightQ4_0[8192 22528]
-
blk.13.ffn_up.weightQ4_0[8192 22528]
-
blk.13.attn_k.weightQ4_0[8192 8192]
-
blk.13.attn_output.weightQ4_0[8192 8192]
-
blk.13.attn_q.weightQ4_0[8192 8192]
-
blk.13.attn_v.weightQ4_0[8192 8192]
-
blk.14.attn_norm.weightF32[8192]
-
blk.14.ffn_down.weightQ4_0[22528 8192]
-
blk.14.ffn_gate.weightQ4_0[8192 22528]
-
blk.14.ffn_up.weightQ4_0[8192 22528]
-
blk.14.attn_k.weightQ4_0[8192 8192]
-
blk.14.attn_output.weightQ4_0[8192 8192]
-
blk.14.attn_q.weightQ4_0[8192 8192]
-
blk.14.attn_v.weightQ4_0[8192 8192]
-
blk.15.attn_k.weightQ4_0[8192 8192]
-
blk.15.attn_output.weightQ4_0[8192 8192]
-
blk.15.attn_q.weightQ4_0[8192 8192]
-
blk.15.attn_v.weightQ4_0[8192 8192]
-
blk.15.attn_norm.weightF32[8192]
-
blk.15.ffn_down.weightQ4_0[22528 8192]
-
blk.15.ffn_gate.weightQ4_0[8192 22528]
-
blk.15.ffn_up.weightQ4_0[8192 22528]
-
blk.16.attn_norm.weightF32[8192]
-
blk.16.ffn_down.weightQ4_0[22528 8192]
-
blk.16.ffn_gate.weightQ4_0[8192 22528]
-
blk.16.ffn_up.weightQ4_0[8192 22528]
-
blk.16.attn_k.weightQ4_0[8192 8192]
-
blk.16.attn_output.weightQ4_0[8192 8192]
-
blk.16.attn_q.weightQ4_0[8192 8192]
-
blk.16.attn_v.weightQ4_0[8192 8192]
-
blk.17.attn_norm.weightF32[8192]
-
blk.17.ffn_down.weightQ4_0[22528 8192]
-
blk.17.ffn_gate.weightQ4_0[8192 22528]
-
blk.17.ffn_up.weightQ4_0[8192 22528]
-
blk.17.attn_k.weightQ4_0[8192 8192]
-
blk.17.attn_output.weightQ4_0[8192 8192]
-
blk.17.attn_q.weightQ4_0[8192 8192]
-
blk.17.attn_v.weightQ4_0[8192 8192]
-
blk.18.attn_k.weightQ4_0[8192 8192]
-
blk.18.attn_output.weightQ4_0[8192 8192]
-
blk.18.attn_q.weightQ4_0[8192 8192]
-
blk.18.attn_v.weightQ4_0[8192 8192]
-
blk.18.attn_norm.weightF32[8192]
-
blk.18.ffn_down.weightQ4_0[22528 8192]
-
blk.18.ffn_gate.weightQ4_0[8192 22528]
-
blk.18.ffn_up.weightQ4_0[8192 22528]
-
blk.19.attn_norm.weightF32[8192]
-
blk.19.ffn_down.weightQ4_0[22528 8192]
-
blk.19.ffn_gate.weightQ4_0[8192 22528]
-
blk.19.ffn_up.weightQ4_0[8192 22528]
-
blk.19.attn_k.weightQ4_0[8192 8192]
-
blk.19.attn_output.weightQ4_0[8192 8192]
-
blk.19.attn_q.weightQ4_0[8192 8192]
-
blk.19.attn_v.weightQ4_0[8192 8192]
-
blk.20.attn_norm.weightF32[8192]
-
blk.20.ffn_down.weightQ4_0[22528 8192]
-
blk.20.ffn_gate.weightQ4_0[8192 22528]
-
blk.20.ffn_up.weightQ4_0[8192 22528]
-
blk.20.attn_k.weightQ4_0[8192 8192]
-
blk.20.attn_output.weightQ4_0[8192 8192]
-
blk.20.attn_q.weightQ4_0[8192 8192]
-
blk.20.attn_v.weightQ4_0[8192 8192]
-
blk.21.attn_k.weightQ4_0[8192 8192]
-
blk.21.attn_output.weightQ4_0[8192 8192]
-
blk.21.attn_q.weightQ4_0[8192 8192]
-
blk.21.attn_v.weightQ4_0[8192 8192]
-
blk.21.attn_norm.weightF32[8192]
-
blk.21.ffn_down.weightQ4_0[22528 8192]
-
blk.21.ffn_gate.weightQ4_0[8192 22528]
-
blk.21.ffn_up.weightQ4_0[8192 22528]
-
blk.22.attn_norm.weightF32[8192]
-
blk.22.ffn_down.weightQ4_0[22528 8192]
-
blk.22.ffn_gate.weightQ4_0[8192 22528]
-
blk.22.ffn_up.weightQ4_0[8192 22528]
-
blk.22.attn_k.weightQ4_0[8192 8192]
-
blk.22.attn_output.weightQ4_0[8192 8192]
-
blk.22.attn_q.weightQ4_0[8192 8192]
-
blk.22.attn_v.weightQ4_0[8192 8192]
-
blk.23.attn_norm.weightF32[8192]
-
blk.23.ffn_down.weightQ4_0[22528 8192]
-
blk.23.ffn_gate.weightQ4_0[8192 22528]
-
blk.23.ffn_up.weightQ4_0[8192 22528]
-
blk.23.attn_k.weightQ4_0[8192 8192]
-
blk.23.attn_output.weightQ4_0[8192 8192]
-
blk.23.attn_q.weightQ4_0[8192 8192]
-
blk.23.attn_v.weightQ4_0[8192 8192]
-
blk.24.attn_k.weightQ4_0[8192 8192]
-
blk.24.attn_output.weightQ4_0[8192 8192]
-
blk.24.attn_q.weightQ4_0[8192 8192]
-
blk.24.attn_v.weightQ4_0[8192 8192]
-
blk.24.attn_norm.weightF32[8192]
-
blk.24.ffn_down.weightQ4_0[22528 8192]
-
blk.24.ffn_gate.weightQ4_0[8192 22528]
-
blk.24.ffn_up.weightQ4_0[8192 22528]
-
blk.25.attn_norm.weightF32[8192]
-
blk.25.ffn_down.weightQ4_0[22528 8192]
-
blk.25.ffn_gate.weightQ4_0[8192 22528]
-
blk.25.ffn_up.weightQ4_0[8192 22528]
-
blk.25.attn_k.weightQ4_0[8192 8192]
-
blk.25.attn_output.weightQ4_0[8192 8192]
-
blk.25.attn_q.weightQ4_0[8192 8192]
-
blk.25.attn_v.weightQ4_0[8192 8192]
-
blk.26.attn_norm.weightF32[8192]
-
blk.26.ffn_down.weightQ4_0[22528 8192]
-
blk.26.ffn_gate.weightQ4_0[8192 22528]
-
blk.26.ffn_up.weightQ4_0[8192 22528]
-
blk.26.attn_k.weightQ4_0[8192 8192]
-
blk.26.attn_output.weightQ4_0[8192 8192]
-
blk.26.attn_q.weightQ4_0[8192 8192]
-
blk.26.attn_v.weightQ4_0[8192 8192]
-
blk.27.attn_k.weightQ4_0[8192 8192]
-
blk.27.attn_output.weightQ4_0[8192 8192]
-
blk.27.attn_q.weightQ4_0[8192 8192]
-
blk.27.attn_v.weightQ4_0[8192 8192]
-
blk.27.attn_norm.weightF32[8192]
-
blk.27.ffn_down.weightQ4_0[22528 8192]
-
blk.27.ffn_gate.weightQ4_0[8192 22528]
-
blk.27.ffn_up.weightQ4_0[8192 22528]
-
blk.28.attn_norm.weightF32[8192]
-
blk.28.ffn_down.weightQ4_0[22528 8192]
-
blk.28.ffn_gate.weightQ4_0[8192 22528]
-
blk.28.ffn_up.weightQ4_0[8192 22528]
-
blk.28.attn_k.weightQ4_0[8192 8192]
-
blk.28.attn_output.weightQ4_0[8192 8192]
-
blk.28.attn_q.weightQ4_0[8192 8192]
-
blk.28.attn_v.weightQ4_0[8192 8192]
-
blk.29.attn_norm.weightF32[8192]
-
blk.29.ffn_down.weightQ4_0[22528 8192]
-
blk.29.ffn_gate.weightQ4_0[8192 22528]
-
blk.29.ffn_up.weightQ4_0[8192 22528]
-
blk.29.attn_k.weightQ4_0[8192 8192]
-
blk.29.attn_output.weightQ4_0[8192 8192]
-
blk.29.attn_q.weightQ4_0[8192 8192]
-
blk.29.attn_v.weightQ4_0[8192 8192]
-
blk.30.attn_k.weightQ4_0[8192 8192]
-
blk.30.attn_output.weightQ4_0[8192 8192]
-
blk.30.attn_q.weightQ4_0[8192 8192]
-
blk.30.attn_v.weightQ4_0[8192 8192]
-
blk.30.attn_norm.weightF32[8192]
-
blk.30.ffn_down.weightQ4_0[22528 8192]
-
blk.30.ffn_gate.weightQ4_0[8192 22528]
-
blk.30.ffn_up.weightQ4_0[8192 22528]
-
blk.31.attn_norm.weightF32[8192]
-
blk.31.ffn_down.weightQ4_0[22528 8192]
-
blk.31.ffn_gate.weightQ4_0[8192 22528]
-
blk.31.ffn_up.weightQ4_0[8192 22528]
-
blk.31.attn_k.weightQ4_0[8192 8192]
-
blk.31.attn_output.weightQ4_0[8192 8192]
-
blk.31.attn_q.weightQ4_0[8192 8192]
-
blk.31.attn_v.weightQ4_0[8192 8192]
-
blk.32.attn_norm.weightF32[8192]
-
blk.32.ffn_down.weightQ4_0[22528 8192]
-
blk.32.ffn_gate.weightQ4_0[8192 22528]
-
blk.32.ffn_up.weightQ4_0[8192 22528]
-
blk.32.attn_k.weightQ4_0[8192 8192]
-
blk.32.attn_output.weightQ4_0[8192 8192]
-
blk.32.attn_q.weightQ4_0[8192 8192]
-
blk.32.attn_v.weightQ4_0[8192 8192]
-
blk.33.attn_k.weightQ4_0[8192 8192]
-
blk.33.attn_output.weightQ4_0[8192 8192]
-
blk.33.attn_q.weightQ4_0[8192 8192]
-
blk.33.attn_v.weightQ4_0[8192 8192]
-
blk.33.attn_norm.weightF32[8192]
-
blk.33.ffn_down.weightQ4_0[22528 8192]
-
blk.33.ffn_gate.weightQ4_0[8192 22528]
-
blk.33.ffn_up.weightQ4_0[8192 22528]
-
blk.34.attn_norm.weightF32[8192]
-
blk.34.ffn_down.weightQ4_0[22528 8192]
-
blk.34.ffn_gate.weightQ4_0[8192 22528]
-
blk.34.ffn_up.weightQ4_0[8192 22528]
-
blk.34.attn_k.weightQ4_0[8192 8192]
-
blk.34.attn_output.weightQ4_0[8192 8192]
-
blk.34.attn_q.weightQ4_0[8192 8192]
-
blk.34.attn_v.weightQ4_0[8192 8192]
-
blk.35.attn_norm.weightF32[8192]
-
blk.35.ffn_down.weightQ4_0[22528 8192]
-
blk.35.ffn_gate.weightQ4_0[8192 22528]
-
blk.35.ffn_up.weightQ4_0[8192 22528]
-
blk.35.attn_k.weightQ4_0[8192 8192]
-
blk.35.attn_output.weightQ4_0[8192 8192]
-
blk.35.attn_q.weightQ4_0[8192 8192]
-
blk.35.attn_v.weightQ4_0[8192 8192]
-
blk.36.attn_k.weightQ4_0[8192 8192]
-
blk.36.attn_output.weightQ4_0[8192 8192]
-
blk.36.attn_q.weightQ4_0[8192 8192]
-
blk.36.attn_v.weightQ4_0[8192 8192]
-
blk.36.attn_norm.weightF32[8192]
-
blk.36.ffn_down.weightQ4_0[22528 8192]
-
blk.36.ffn_gate.weightQ4_0[8192 22528]
-
blk.36.ffn_up.weightQ4_0[8192 22528]
-
blk.37.attn_norm.weightF32[8192]
-
blk.37.ffn_down.weightQ4_0[22528 8192]
-
blk.37.ffn_gate.weightQ4_0[8192 22528]
-
blk.37.ffn_up.weightQ4_0[8192 22528]
-
blk.37.attn_k.weightQ4_0[8192 8192]
-
blk.37.attn_output.weightQ4_0[8192 8192]
-
blk.37.attn_q.weightQ4_0[8192 8192]
-
blk.37.attn_v.weightQ4_0[8192 8192]
-
blk.38.attn_norm.weightF32[8192]
-
blk.38.ffn_down.weightQ4_0[22528 8192]
-
blk.38.ffn_gate.weightQ4_0[8192 22528]
-
blk.38.ffn_up.weightQ4_0[8192 22528]
-
blk.38.attn_k.weightQ4_0[8192 8192]
-
blk.38.attn_output.weightQ4_0[8192 8192]
-
blk.38.attn_q.weightQ4_0[8192 8192]
-
blk.38.attn_v.weightQ4_0[8192 8192]
-
blk.39.attn_k.weightQ4_0[8192 8192]
-
blk.39.attn_output.weightQ4_0[8192 8192]
-
blk.39.attn_q.weightQ4_0[8192 8192]
-
blk.39.attn_v.weightQ4_0[8192 8192]
-
blk.39.attn_norm.weightF32[8192]
-
blk.39.ffn_down.weightQ4_0[22528 8192]
-
blk.39.ffn_gate.weightQ4_0[8192 22528]
-
blk.39.ffn_up.weightQ4_0[8192 22528]
-
output_norm.weightF32[8192]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39