<?xml version="1.0" encoding="utf-8" standalone="yes" ?>
<rss version="2.0" xmlns:atom="http://www.w3.org/2005/Atom">
  <channel>
    <title>Tools | KVCache.ai</title>
    <link>https://kvcache.ai/tools/</link>
      <atom:link href="https://kvcache.ai/tools/index.xml" rel="self" type="application/rss+xml" />
    <description>Tools</description>
    <generator>Hugo Blox Builder (https://hugoblox.com)</generator><language>en-us</language><lastBuildDate>Wed, 20 May 2026 00:00:00 +0000</lastBuildDate>
    <image>
      <url>https://kvcache.ai/media/logo.svg</url>
      <title>Tools</title>
      <link>https://kvcache.ai/tools/</link>
    </image>
    
    <item>
      <title>KV Cache Size Calculator</title>
      <link>https://kvcache.ai/tools/kv-cache-calculator/</link>
      <pubDate>Wed, 20 May 2026 00:00:00 +0000</pubDate>
      <guid>https://kvcache.ai/tools/kv-cache-calculator/</guid>
      <description>



&lt;section id=&#34;kv-cache-calculator&#34; class=&#34;kv-calculator-shell&#34; data-state=&#34;loading&#34;&gt;
  &lt;div class=&#34;kv-calculator-grid&#34;&gt;
    &lt;form class=&#34;kv-controls&#34; onsubmit=&#34;return false;&#34;&gt;
      &lt;label&gt;
        &lt;span&gt;Model family&lt;/span&gt;
        &lt;select data-kv-input=&#34;modelFamily&#34;&gt;&lt;/select&gt;
      &lt;/label&gt;

      &lt;label&gt;
        &lt;span&gt;Model&lt;/span&gt;
        &lt;select data-kv-input=&#34;model&#34;&gt;&lt;/select&gt;
      &lt;/label&gt;

      &lt;label&gt;
        &lt;span&gt;Tokens per sequence&lt;/span&gt;
        &lt;input data-kv-input=&#34;tokens&#34; type=&#34;number&#34; min=&#34;1&#34; step=&#34;1&#34; inputmode=&#34;numeric&#34; value=&#34;1024&#34;&gt;
      &lt;/label&gt;

      &lt;label&gt;
        &lt;span&gt;Sequences&lt;/span&gt;
        &lt;input data-kv-input=&#34;sequences&#34; type=&#34;number&#34; min=&#34;1&#34; step=&#34;1&#34; inputmode=&#34;numeric&#34; value=&#34;1&#34;&gt;
      &lt;/label&gt;

      &lt;label&gt;
        &lt;span&gt;KV precision&lt;/span&gt;
        &lt;select data-kv-input=&#34;precision&#34;&gt;&lt;/select&gt;
      &lt;/label&gt;

      &lt;label data-kv-indexer-control hidden&gt;
        &lt;span&gt;Indexer precision&lt;/span&gt;
        &lt;select data-kv-input=&#34;indexerPrecision&#34;&gt;&lt;/select&gt;
      &lt;/label&gt;

      &lt;label class=&#34;kv-checkbox-row&#34; data-kv-draft-control hidden&gt;
        &lt;input data-kv-input=&#34;includeDraftKvCache&#34; type=&#34;checkbox&#34;&gt;
        &lt;span data-kv-inline-help=&#34;Adds model-specific MTP/draft KV layers when enabled by the serving stack. DeepSeek V4 draft layers use ratio=0 sliding-window cache.&#34;&gt;Include draft KV cache&lt;/span&gt;
      &lt;/label&gt;

      &lt;label class=&#34;kv-checkbox-row&#34; data-kv-linear-state-control hidden&gt;
        &lt;input data-kv-input=&#34;includeLinearAttentionState&#34; type=&#34;checkbox&#34;&gt;
        &lt;span data-kv-inline-help=&#34;Adds Qwen3.5/3.6 linear-attention recurrent and convolution state. This state is sequence-level runtime cache, not ordinary per-token KV.&#34;&gt;Include linear-attention state&lt;/span&gt;
      &lt;/label&gt;
    &lt;/form&gt;

    &lt;div class=&#34;kv-results&#34;&gt;
      &lt;div class=&#34;kv-total-band&#34;&gt;
        &lt;div&gt;
          &lt;span&gt;Total cache size&lt;/span&gt;
          &lt;strong data-kv-output=&#34;totalGiB&#34;&gt;--&lt;/strong&gt;
        &lt;/div&gt;
        &lt;em data-kv-output=&#34;totalGB&#34;&gt;= -- GB&lt;/em&gt;
      &lt;/div&gt;

      &lt;div class=&#34;kv-metric-grid&#34; data-kv-metrics&gt;&lt;/div&gt;

      &lt;div class=&#34;kv-formula-panel&#34;&gt;
        &lt;div class=&#34;kv-formula-heading&#34;&gt;
          &lt;span data-kv-output=&#34;formulaLabel&#34;&gt;--&lt;/span&gt;
        &lt;/div&gt;
        &lt;div class=&#34;kv-formula-list&#34; data-kv-formula-rows&gt;
          &lt;div class=&#34;kv-formula-row&#34;&gt;
            &lt;span class=&#34;kv-formula-name&#34;&gt;--&lt;/span&gt;
            &lt;span class=&#34;kv-formula-equals&#34;&gt;=&lt;/span&gt;
            &lt;span class=&#34;kv-formula-expression&#34;&gt;--&lt;/span&gt;
          &lt;/div&gt;
        &lt;/div&gt;
        &lt;p data-kv-output=&#34;cacheNote&#34;&gt;&lt;/p&gt;
      &lt;/div&gt;

      &lt;div class=&#34;kv-breakdown&#34; data-kv-components&gt;&lt;/div&gt;

      &lt;a class=&#34;kv-source-link&#34; data-kv-source-link href=&#34;#&#34; rel=&#34;noopener&#34; target=&#34;_blank&#34;&gt;
        Source: &lt;span data-kv-output=&#34;source&#34;&gt;--&lt;/span&gt;
      &lt;/a&gt;
    &lt;/div&gt;
  &lt;/div&gt;
&lt;/section&gt;

&lt;script type=&#34;application/json&#34; id=&#34;kv-cache-calculator-data&#34;&gt;{&#34;indexer_precision_options&#34;:[{&#34;bytes_per_element&#34;:2,&#34;id&#34;:&#34;bf16_fp16&#34;,&#34;label&#34;:&#34;BF16 / FP16&#34;},{&#34;bytes_per_element&#34;:1,&#34;id&#34;:&#34;fp8_int8&#34;,&#34;label&#34;:&#34;FP8 / INT8&#34;},{&#34;bytes_per_element&#34;:0.5,&#34;id&#34;:&#34;fp4_int4&#34;,&#34;label&#34;:&#34;FP4 / INT4&#34;}],&#34;metadata&#34;:{&#34;note&#34;:&#34;Curated from official Hugging Face model config/source files and serving-engine references. Values describe KV cache capacity planning, not model weights or activation memory.&#34;,&#34;retrieved_at&#34;:&#34;2026-05-23&#34;,&#34;serving_references&#34;:{&#34;deepseek_v4_vllm_indexer_fp4&#34;:&#34;https://vllm.ai/blog/deepseek-v4&#34;}},&#34;models&#34;:[{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;DeepSeek&#34;,&#34;fields&#34;:{&#34;compress_ratios&#34;:[128,128,4,128,4,128,4,128,4,128,4,128,4,128,4,128,4,128,4,128,4,128,4,128,4,128,4,128,4,128,4,128,4,128,4,128,4,128,4,128,4,128,4,128,4,128,4,128,4,128,4,128,4,128,4,128,4,128,4,128,4,0],&#34;head_dim&#34;:512,&#34;index_head_dim&#34;:128,&#34;index_topk&#34;:1024,&#34;num_hidden_layers&#34;:61,&#34;num_key_value_heads&#34;:1,&#34;sliding_window&#34;:128},&#34;formula&#34;:&#34;deepseek_v4_hybrid&#34;,&#34;id&#34;:&#34;deepseek-v4-pro&#34;,&#34;label&#34;:&#34;DeepSeek V4 Pro&#34;,&#34;max_position_embeddings&#34;:1048576,&#34;source_retrieved_at&#34;:&#34;2026-05-20&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/deepseek-ai/DeepSeek-V4-Pro/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;DeepSeek&#34;,&#34;fields&#34;:{&#34;compress_ratios&#34;:[0,0,4,128,4,128,4,128,4,128,4,128,4,128,4,128,4,128,4,128,4,128,4,128,4,128,4,128,4,128,4,128,4,128,4,128,4,128,4,128,4,128,4,0],&#34;head_dim&#34;:512,&#34;index_head_dim&#34;:128,&#34;index_topk&#34;:512,&#34;num_hidden_layers&#34;:43,&#34;num_key_value_heads&#34;:1,&#34;sliding_window&#34;:128},&#34;formula&#34;:&#34;deepseek_v4_hybrid&#34;,&#34;id&#34;:&#34;deepseek-v4-flash&#34;,&#34;label&#34;:&#34;DeepSeek V4 Flash&#34;,&#34;max_position_embeddings&#34;:1048576,&#34;source_retrieved_at&#34;:&#34;2026-05-20&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/deepseek-ai/DeepSeek-V4-Flash/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;DeepSeek&#34;,&#34;fields&#34;:{&#34;index_head_dim&#34;:128,&#34;index_n_heads&#34;:64,&#34;index_topk&#34;:2048,&#34;kv_lora_rank&#34;:512,&#34;num_hidden_layers&#34;:61,&#34;num_key_value_heads&#34;:128,&#34;num_nextn_predict_layers&#34;:1,&#34;qk_head_dim&#34;:192,&#34;qk_nope_head_dim&#34;:128,&#34;qk_rope_head_dim&#34;:64,&#34;v_head_dim&#34;:128},&#34;formula&#34;:&#34;dsa_mla&#34;,&#34;id&#34;:&#34;deepseek-v3.2&#34;,&#34;label&#34;:&#34;DeepSeek V3.2&#34;,&#34;max_position_embeddings&#34;:163840,&#34;source_retrieved_at&#34;:&#34;2026-05-20&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/deepseek-ai/DeepSeek-V3.2/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;DeepSeek&#34;,&#34;fields&#34;:{&#34;kv_lora_rank&#34;:512,&#34;num_hidden_layers&#34;:61,&#34;num_key_value_heads&#34;:128,&#34;num_nextn_predict_layers&#34;:1,&#34;qk_nope_head_dim&#34;:128,&#34;qk_rope_head_dim&#34;:64,&#34;v_head_dim&#34;:128},&#34;formula&#34;:&#34;mla&#34;,&#34;id&#34;:&#34;deepseek-v3&#34;,&#34;label&#34;:&#34;DeepSeek V3&#34;,&#34;max_position_embeddings&#34;:163840,&#34;source_retrieved_at&#34;:&#34;2026-05-22&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/deepseek-ai/DeepSeek-V3/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;DeepSeek&#34;,&#34;fields&#34;:{&#34;kv_lora_rank&#34;:512,&#34;num_hidden_layers&#34;:61,&#34;num_key_value_heads&#34;:128,&#34;num_nextn_predict_layers&#34;:1,&#34;qk_nope_head_dim&#34;:128,&#34;qk_rope_head_dim&#34;:64,&#34;v_head_dim&#34;:128},&#34;formula&#34;:&#34;mla&#34;,&#34;id&#34;:&#34;deepseek-r1&#34;,&#34;label&#34;:&#34;DeepSeek R1&#34;,&#34;max_position_embeddings&#34;:163840,&#34;source_retrieved_at&#34;:&#34;2026-05-22&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/deepseek-ai/DeepSeek-R1/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;GLM&#34;,&#34;fields&#34;:{&#34;index_head_dim&#34;:128,&#34;index_n_heads&#34;:32,&#34;index_topk&#34;:2048,&#34;kv_lora_rank&#34;:512,&#34;num_hidden_layers&#34;:78,&#34;num_key_value_heads&#34;:64,&#34;num_nextn_predict_layers&#34;:1,&#34;qk_head_dim&#34;:256,&#34;qk_nope_head_dim&#34;:192,&#34;qk_rope_head_dim&#34;:64,&#34;v_head_dim&#34;:256},&#34;formula&#34;:&#34;dsa_mla&#34;,&#34;id&#34;:&#34;glm-5&#34;,&#34;label&#34;:&#34;GLM-5&#34;,&#34;max_position_embeddings&#34;:202752,&#34;source_retrieved_at&#34;:&#34;2026-05-20&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/zai-org/GLM-5/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;GLM&#34;,&#34;fields&#34;:{&#34;index_head_dim&#34;:128,&#34;index_n_heads&#34;:32,&#34;index_topk&#34;:2048,&#34;kv_lora_rank&#34;:512,&#34;num_hidden_layers&#34;:78,&#34;num_key_value_heads&#34;:64,&#34;num_nextn_predict_layers&#34;:1,&#34;qk_head_dim&#34;:256,&#34;qk_nope_head_dim&#34;:192,&#34;qk_rope_head_dim&#34;:64,&#34;v_head_dim&#34;:256},&#34;formula&#34;:&#34;dsa_mla&#34;,&#34;id&#34;:&#34;glm-5.1&#34;,&#34;label&#34;:&#34;GLM-5.1&#34;,&#34;max_position_embeddings&#34;:202752,&#34;source_retrieved_at&#34;:&#34;2026-05-20&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/zai-org/GLM-5.1/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;Kimi&#34;,&#34;fields&#34;:{&#34;kv_lora_rank&#34;:512,&#34;num_hidden_layers&#34;:61,&#34;num_key_value_heads&#34;:64,&#34;qk_nope_head_dim&#34;:128,&#34;qk_rope_head_dim&#34;:64,&#34;v_head_dim&#34;:128},&#34;formula&#34;:&#34;mla&#34;,&#34;id&#34;:&#34;kimi-k2.5&#34;,&#34;label&#34;:&#34;Kimi K2.5&#34;,&#34;max_position_embeddings&#34;:262144,&#34;source_retrieved_at&#34;:&#34;2026-05-20&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/moonshotai/Kimi-K2.5/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;Kimi&#34;,&#34;fields&#34;:{&#34;kv_lora_rank&#34;:512,&#34;num_hidden_layers&#34;:61,&#34;num_key_value_heads&#34;:64,&#34;qk_nope_head_dim&#34;:128,&#34;qk_rope_head_dim&#34;:64,&#34;v_head_dim&#34;:128},&#34;formula&#34;:&#34;mla&#34;,&#34;id&#34;:&#34;kimi-k2.6&#34;,&#34;label&#34;:&#34;Kimi K2.6&#34;,&#34;max_position_embeddings&#34;:262144,&#34;source_retrieved_at&#34;:&#34;2026-05-20&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/moonshotai/Kimi-K2.6/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;Qwen3.6&#34;,&#34;fields&#34;:{&#34;full_attention_layers&#34;:16,&#34;head_dim&#34;:256,&#34;linear_attention_layers&#34;:48,&#34;linear_conv_kernel_dim&#34;:4,&#34;linear_key_head_dim&#34;:128,&#34;linear_num_key_heads&#34;:16,&#34;linear_num_value_heads&#34;:48,&#34;linear_value_head_dim&#34;:128,&#34;mtp_num_hidden_layers&#34;:1,&#34;num_attention_heads&#34;:24,&#34;num_hidden_layers&#34;:64,&#34;num_key_value_heads&#34;:4},&#34;formula&#34;:&#34;qwen_linear_full_hybrid&#34;,&#34;id&#34;:&#34;qwen3.6-27b&#34;,&#34;label&#34;:&#34;Qwen3.6-27B&#34;,&#34;max_position_embeddings&#34;:262144,&#34;source_retrieved_at&#34;:&#34;2026-05-23&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/Qwen/Qwen3.6-27B/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;Qwen3.6&#34;,&#34;fields&#34;:{&#34;full_attention_layers&#34;:10,&#34;head_dim&#34;:256,&#34;linear_attention_layers&#34;:30,&#34;linear_conv_kernel_dim&#34;:4,&#34;linear_key_head_dim&#34;:128,&#34;linear_num_key_heads&#34;:16,&#34;linear_num_value_heads&#34;:32,&#34;linear_value_head_dim&#34;:128,&#34;mtp_num_hidden_layers&#34;:1,&#34;num_attention_heads&#34;:16,&#34;num_hidden_layers&#34;:40,&#34;num_key_value_heads&#34;:2},&#34;formula&#34;:&#34;qwen_linear_full_hybrid&#34;,&#34;id&#34;:&#34;qwen3.6-35b-a3b&#34;,&#34;label&#34;:&#34;Qwen3.6-35B-A3B&#34;,&#34;max_position_embeddings&#34;:262144,&#34;source_retrieved_at&#34;:&#34;2026-05-23&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/Qwen/Qwen3.6-35B-A3B/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;Qwen3.5&#34;,&#34;fields&#34;:{&#34;full_attention_layers&#34;:15,&#34;head_dim&#34;:256,&#34;linear_attention_layers&#34;:45,&#34;linear_conv_kernel_dim&#34;:4,&#34;linear_key_head_dim&#34;:128,&#34;linear_num_key_heads&#34;:16,&#34;linear_num_value_heads&#34;:64,&#34;linear_value_head_dim&#34;:128,&#34;mtp_num_hidden_layers&#34;:1,&#34;num_attention_heads&#34;:32,&#34;num_hidden_layers&#34;:60,&#34;num_key_value_heads&#34;:2},&#34;formula&#34;:&#34;qwen_linear_full_hybrid&#34;,&#34;id&#34;:&#34;qwen3.5-397b-a17b&#34;,&#34;label&#34;:&#34;Qwen3.5-397B-A17B&#34;,&#34;max_position_embeddings&#34;:262144,&#34;source_retrieved_at&#34;:&#34;2026-05-23&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/Qwen/Qwen3.5-397B-A17B/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;Qwen3.5&#34;,&#34;fields&#34;:{&#34;full_attention_layers&#34;:12,&#34;head_dim&#34;:256,&#34;linear_attention_layers&#34;:36,&#34;linear_conv_kernel_dim&#34;:4,&#34;linear_key_head_dim&#34;:128,&#34;linear_num_key_heads&#34;:16,&#34;linear_num_value_heads&#34;:64,&#34;linear_value_head_dim&#34;:128,&#34;mtp_num_hidden_layers&#34;:1,&#34;num_attention_heads&#34;:32,&#34;num_hidden_layers&#34;:48,&#34;num_key_value_heads&#34;:2},&#34;formula&#34;:&#34;qwen_linear_full_hybrid&#34;,&#34;id&#34;:&#34;qwen3.5-122b-a10b&#34;,&#34;label&#34;:&#34;Qwen3.5-122B-A10B&#34;,&#34;max_position_embeddings&#34;:262144,&#34;source_retrieved_at&#34;:&#34;2026-05-23&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/Qwen/Qwen3.5-122B-A10B/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;Qwen3.5&#34;,&#34;fields&#34;:{&#34;full_attention_layers&#34;:10,&#34;head_dim&#34;:256,&#34;linear_attention_layers&#34;:30,&#34;linear_conv_kernel_dim&#34;:4,&#34;linear_key_head_dim&#34;:128,&#34;linear_num_key_heads&#34;:16,&#34;linear_num_value_heads&#34;:32,&#34;linear_value_head_dim&#34;:128,&#34;mtp_num_hidden_layers&#34;:1,&#34;num_attention_heads&#34;:16,&#34;num_hidden_layers&#34;:40,&#34;num_key_value_heads&#34;:2},&#34;formula&#34;:&#34;qwen_linear_full_hybrid&#34;,&#34;id&#34;:&#34;qwen3.5-35b-a3b&#34;,&#34;label&#34;:&#34;Qwen3.5-35B-A3B&#34;,&#34;max_position_embeddings&#34;:262144,&#34;source_retrieved_at&#34;:&#34;2026-05-23&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/Qwen/Qwen3.5-35B-A3B/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;Qwen3.5&#34;,&#34;fields&#34;:{&#34;full_attention_layers&#34;:16,&#34;head_dim&#34;:256,&#34;linear_attention_layers&#34;:48,&#34;linear_conv_kernel_dim&#34;:4,&#34;linear_key_head_dim&#34;:128,&#34;linear_num_key_heads&#34;:16,&#34;linear_num_value_heads&#34;:48,&#34;linear_value_head_dim&#34;:128,&#34;mtp_num_hidden_layers&#34;:1,&#34;num_attention_heads&#34;:24,&#34;num_hidden_layers&#34;:64,&#34;num_key_value_heads&#34;:4},&#34;formula&#34;:&#34;qwen_linear_full_hybrid&#34;,&#34;id&#34;:&#34;qwen3.5-27b&#34;,&#34;label&#34;:&#34;Qwen3.5-27B&#34;,&#34;max_position_embeddings&#34;:262144,&#34;source_retrieved_at&#34;:&#34;2026-05-23&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/Qwen/Qwen3.5-27B/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;Qwen3.5&#34;,&#34;fields&#34;:{&#34;full_attention_layers&#34;:8,&#34;head_dim&#34;:256,&#34;linear_attention_layers&#34;:24,&#34;linear_conv_kernel_dim&#34;:4,&#34;linear_key_head_dim&#34;:128,&#34;linear_num_key_heads&#34;:16,&#34;linear_num_value_heads&#34;:32,&#34;linear_value_head_dim&#34;:128,&#34;mtp_num_hidden_layers&#34;:1,&#34;num_attention_heads&#34;:16,&#34;num_hidden_layers&#34;:32,&#34;num_key_value_heads&#34;:4},&#34;formula&#34;:&#34;qwen_linear_full_hybrid&#34;,&#34;id&#34;:&#34;qwen3.5-9b&#34;,&#34;label&#34;:&#34;Qwen3.5-9B&#34;,&#34;max_position_embeddings&#34;:262144,&#34;source_retrieved_at&#34;:&#34;2026-05-23&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/Qwen/Qwen3.5-9B/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;Qwen3.5&#34;,&#34;fields&#34;:{&#34;full_attention_layers&#34;:8,&#34;head_dim&#34;:256,&#34;linear_attention_layers&#34;:24,&#34;linear_conv_kernel_dim&#34;:4,&#34;linear_key_head_dim&#34;:128,&#34;linear_num_key_heads&#34;:16,&#34;linear_num_value_heads&#34;:32,&#34;linear_value_head_dim&#34;:128,&#34;mtp_num_hidden_layers&#34;:1,&#34;num_attention_heads&#34;:16,&#34;num_hidden_layers&#34;:32,&#34;num_key_value_heads&#34;:4},&#34;formula&#34;:&#34;qwen_linear_full_hybrid&#34;,&#34;id&#34;:&#34;qwen3.5-4b&#34;,&#34;label&#34;:&#34;Qwen3.5-4B&#34;,&#34;max_position_embeddings&#34;:262144,&#34;source_retrieved_at&#34;:&#34;2026-05-23&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/Qwen/Qwen3.5-4B/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;Qwen3.5&#34;,&#34;fields&#34;:{&#34;full_attention_layers&#34;:6,&#34;head_dim&#34;:256,&#34;linear_attention_layers&#34;:18,&#34;linear_conv_kernel_dim&#34;:4,&#34;linear_key_head_dim&#34;:128,&#34;linear_num_key_heads&#34;:16,&#34;linear_num_value_heads&#34;:16,&#34;linear_value_head_dim&#34;:128,&#34;mtp_num_hidden_layers&#34;:1,&#34;num_attention_heads&#34;:8,&#34;num_hidden_layers&#34;:24,&#34;num_key_value_heads&#34;:2},&#34;formula&#34;:&#34;qwen_linear_full_hybrid&#34;,&#34;id&#34;:&#34;qwen3.5-2b&#34;,&#34;label&#34;:&#34;Qwen3.5-2B&#34;,&#34;max_position_embeddings&#34;:262144,&#34;source_retrieved_at&#34;:&#34;2026-05-23&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/Qwen/Qwen3.5-2B/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;Qwen3.5&#34;,&#34;fields&#34;:{&#34;full_attention_layers&#34;:6,&#34;head_dim&#34;:256,&#34;linear_attention_layers&#34;:18,&#34;linear_conv_kernel_dim&#34;:4,&#34;linear_key_head_dim&#34;:128,&#34;linear_num_key_heads&#34;:16,&#34;linear_num_value_heads&#34;:16,&#34;linear_value_head_dim&#34;:128,&#34;mtp_num_hidden_layers&#34;:1,&#34;num_attention_heads&#34;:8,&#34;num_hidden_layers&#34;:24,&#34;num_key_value_heads&#34;:2},&#34;formula&#34;:&#34;qwen_linear_full_hybrid&#34;,&#34;id&#34;:&#34;qwen3.5-0.8b&#34;,&#34;label&#34;:&#34;Qwen3.5-0.8B&#34;,&#34;max_position_embeddings&#34;:262144,&#34;source_retrieved_at&#34;:&#34;2026-05-23&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/Qwen/Qwen3.5-0.8B/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;Qwen3&#34;,&#34;fields&#34;:{&#34;head_dim&#34;:128,&#34;num_attention_heads&#34;:64,&#34;num_hidden_layers&#34;:94,&#34;num_key_value_heads&#34;:4},&#34;formula&#34;:&#34;standard_gqa&#34;,&#34;id&#34;:&#34;qwen3-235b-a22b&#34;,&#34;label&#34;:&#34;Qwen3-235B-A22B&#34;,&#34;max_position_embeddings&#34;:40960,&#34;source_retrieved_at&#34;:&#34;2026-05-20&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/Qwen/Qwen3-235B-A22B/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;Qwen3&#34;,&#34;fields&#34;:{&#34;head_dim&#34;:128,&#34;num_attention_heads&#34;:64,&#34;num_hidden_layers&#34;:64,&#34;num_key_value_heads&#34;:8},&#34;formula&#34;:&#34;standard_gqa&#34;,&#34;id&#34;:&#34;qwen3-32b&#34;,&#34;label&#34;:&#34;Qwen3-32B&#34;,&#34;max_position_embeddings&#34;:40960,&#34;source_retrieved_at&#34;:&#34;2026-05-20&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/Qwen/Qwen3-32B/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;Qwen3&#34;,&#34;fields&#34;:{&#34;head_dim&#34;:128,&#34;num_attention_heads&#34;:32,&#34;num_hidden_layers&#34;:48,&#34;num_key_value_heads&#34;:4},&#34;formula&#34;:&#34;standard_gqa&#34;,&#34;id&#34;:&#34;qwen3-30b-a3b&#34;,&#34;label&#34;:&#34;Qwen3-30B-A3B&#34;,&#34;max_position_embeddings&#34;:40960,&#34;source_retrieved_at&#34;:&#34;2026-05-20&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/Qwen/Qwen3-30B-A3B/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;Qwen3&#34;,&#34;fields&#34;:{&#34;head_dim&#34;:128,&#34;num_attention_heads&#34;:40,&#34;num_hidden_layers&#34;:40,&#34;num_key_value_heads&#34;:8},&#34;formula&#34;:&#34;standard_gqa&#34;,&#34;id&#34;:&#34;qwen3-14b&#34;,&#34;label&#34;:&#34;Qwen3-14B&#34;,&#34;max_position_embeddings&#34;:40960,&#34;source_retrieved_at&#34;:&#34;2026-05-20&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/Qwen/Qwen3-14B/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;Qwen3&#34;,&#34;fields&#34;:{&#34;head_dim&#34;:128,&#34;num_attention_heads&#34;:32,&#34;num_hidden_layers&#34;:36,&#34;num_key_value_heads&#34;:8},&#34;formula&#34;:&#34;standard_gqa&#34;,&#34;id&#34;:&#34;qwen3-8b&#34;,&#34;label&#34;:&#34;Qwen3-8B&#34;,&#34;max_position_embeddings&#34;:40960,&#34;source_retrieved_at&#34;:&#34;2026-05-20&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/Qwen/Qwen3-8B/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;Qwen3&#34;,&#34;fields&#34;:{&#34;head_dim&#34;:128,&#34;num_attention_heads&#34;:32,&#34;num_hidden_layers&#34;:36,&#34;num_key_value_heads&#34;:8},&#34;formula&#34;:&#34;standard_gqa&#34;,&#34;id&#34;:&#34;qwen3-4b&#34;,&#34;label&#34;:&#34;Qwen3-4B&#34;,&#34;max_position_embeddings&#34;:40960,&#34;source_retrieved_at&#34;:&#34;2026-05-20&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/Qwen/Qwen3-4B/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;Qwen3&#34;,&#34;fields&#34;:{&#34;head_dim&#34;:128,&#34;num_attention_heads&#34;:16,&#34;num_hidden_layers&#34;:28,&#34;num_key_value_heads&#34;:8},&#34;formula&#34;:&#34;standard_gqa&#34;,&#34;id&#34;:&#34;qwen3-1.7b&#34;,&#34;label&#34;:&#34;Qwen3-1.7B&#34;,&#34;max_position_embeddings&#34;:40960,&#34;source_retrieved_at&#34;:&#34;2026-05-20&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/Qwen/Qwen3-1.7B/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;Qwen3&#34;,&#34;fields&#34;:{&#34;head_dim&#34;:128,&#34;num_attention_heads&#34;:16,&#34;num_hidden_layers&#34;:28,&#34;num_key_value_heads&#34;:8},&#34;formula&#34;:&#34;standard_gqa&#34;,&#34;id&#34;:&#34;qwen3-0.6b&#34;,&#34;label&#34;:&#34;Qwen3-0.6B&#34;,&#34;max_position_embeddings&#34;:40960,&#34;source_retrieved_at&#34;:&#34;2026-05-20&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/Qwen/Qwen3-0.6B/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;Qwen2.5&#34;,&#34;fields&#34;:{&#34;head_dim&#34;:128,&#34;max_window_layers&#34;:70,&#34;num_attention_heads&#34;:64,&#34;num_hidden_layers&#34;:80,&#34;num_key_value_heads&#34;:8,&#34;sliding_window&#34;:131072,&#34;use_sliding_window&#34;:false},&#34;formula&#34;:&#34;standard_gqa&#34;,&#34;id&#34;:&#34;qwen2.5-72b&#34;,&#34;label&#34;:&#34;Qwen2.5-72B&#34;,&#34;max_position_embeddings&#34;:32768,&#34;source_retrieved_at&#34;:&#34;2026-05-22&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/Qwen/Qwen2.5-72B-Instruct/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;Qwen2.5&#34;,&#34;fields&#34;:{&#34;head_dim&#34;:128,&#34;max_window_layers&#34;:70,&#34;num_attention_heads&#34;:40,&#34;num_hidden_layers&#34;:64,&#34;num_key_value_heads&#34;:8,&#34;sliding_window&#34;:131072,&#34;use_sliding_window&#34;:false},&#34;formula&#34;:&#34;standard_gqa&#34;,&#34;id&#34;:&#34;qwen2.5-32b&#34;,&#34;label&#34;:&#34;Qwen2.5-32B&#34;,&#34;max_position_embeddings&#34;:32768,&#34;source_retrieved_at&#34;:&#34;2026-05-22&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/Qwen/Qwen2.5-32B-Instruct/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;Qwen2.5&#34;,&#34;fields&#34;:{&#34;head_dim&#34;:128,&#34;max_window_layers&#34;:70,&#34;num_attention_heads&#34;:40,&#34;num_hidden_layers&#34;:48,&#34;num_key_value_heads&#34;:8,&#34;sliding_window&#34;:131072,&#34;use_sliding_window&#34;:false},&#34;formula&#34;:&#34;standard_gqa&#34;,&#34;id&#34;:&#34;qwen2.5-14b&#34;,&#34;label&#34;:&#34;Qwen2.5-14B&#34;,&#34;max_position_embeddings&#34;:32768,&#34;source_retrieved_at&#34;:&#34;2026-05-22&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/Qwen/Qwen2.5-14B-Instruct/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;Qwen2.5&#34;,&#34;fields&#34;:{&#34;head_dim&#34;:128,&#34;max_window_layers&#34;:28,&#34;num_attention_heads&#34;:28,&#34;num_hidden_layers&#34;:28,&#34;num_key_value_heads&#34;:4,&#34;sliding_window&#34;:131072,&#34;use_sliding_window&#34;:false},&#34;formula&#34;:&#34;standard_gqa&#34;,&#34;id&#34;:&#34;qwen2.5-7b&#34;,&#34;label&#34;:&#34;Qwen2.5-7B&#34;,&#34;max_position_embeddings&#34;:32768,&#34;source_retrieved_at&#34;:&#34;2026-05-22&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/Qwen/Qwen2.5-7B-Instruct/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;Qwen2.5&#34;,&#34;fields&#34;:{&#34;head_dim&#34;:128,&#34;max_window_layers&#34;:64,&#34;num_attention_heads&#34;:40,&#34;num_hidden_layers&#34;:64,&#34;num_key_value_heads&#34;:8,&#34;sliding_window&#34;:131072,&#34;use_sliding_window&#34;:false},&#34;formula&#34;:&#34;standard_gqa&#34;,&#34;id&#34;:&#34;qwen2.5-coder-32b&#34;,&#34;label&#34;:&#34;Qwen2.5-Coder-32B&#34;,&#34;max_position_embeddings&#34;:32768,&#34;source_retrieved_at&#34;:&#34;2026-05-22&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/Qwen/Qwen2.5-Coder-32B-Instruct/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;Llama&#34;,&#34;fields&#34;:{&#34;head_dim&#34;:128,&#34;num_attention_heads&#34;:32,&#34;num_hidden_layers&#34;:32,&#34;num_key_value_heads&#34;:8},&#34;formula&#34;:&#34;standard_gqa&#34;,&#34;id&#34;:&#34;llama-3.1-8b&#34;,&#34;label&#34;:&#34;Llama 3.1 8B&#34;,&#34;max_position_embeddings&#34;:131072,&#34;source_retrieved_at&#34;:&#34;2026-05-22&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/meta-llama/Llama-3.1-8B-Instruct/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;Llama&#34;,&#34;fields&#34;:{&#34;head_dim&#34;:128,&#34;num_attention_heads&#34;:64,&#34;num_hidden_layers&#34;:80,&#34;num_key_value_heads&#34;:8},&#34;formula&#34;:&#34;standard_gqa&#34;,&#34;id&#34;:&#34;llama-3.1-70b&#34;,&#34;label&#34;:&#34;Llama 3.1 70B&#34;,&#34;max_position_embeddings&#34;:131072,&#34;source_retrieved_at&#34;:&#34;2026-05-22&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/meta-llama/Llama-3.1-70B-Instruct/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;Llama&#34;,&#34;fields&#34;:{&#34;head_dim&#34;:128,&#34;num_attention_heads&#34;:64,&#34;num_hidden_layers&#34;:80,&#34;num_key_value_heads&#34;:8},&#34;formula&#34;:&#34;standard_gqa&#34;,&#34;id&#34;:&#34;llama-3.3-70b&#34;,&#34;label&#34;:&#34;Llama 3.3 70B&#34;,&#34;max_position_embeddings&#34;:131072,&#34;source_retrieved_at&#34;:&#34;2026-05-22&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/meta-llama/Llama-3.3-70B-Instruct/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;Gemma&#34;,&#34;fields&#34;:{&#34;full_attention_layers&#34;:3,&#34;global_head_dim&#34;:512,&#34;head_dim&#34;:256,&#34;num_attention_heads&#34;:8,&#34;num_hidden_layers&#34;:35,&#34;num_key_value_heads&#34;:1,&#34;num_kv_shared_layers&#34;:20,&#34;sliding_attention_layers&#34;:12,&#34;sliding_window&#34;:512,&#34;stored_layers&#34;:15},&#34;formula&#34;:&#34;mixed_full_sliding_gqa&#34;,&#34;id&#34;:&#34;gemma-4-e2b&#34;,&#34;label&#34;:&#34;Gemma 4 E2B&#34;,&#34;max_position_embeddings&#34;:131072,&#34;source_retrieved_at&#34;:&#34;2026-05-23&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/google/gemma-4-E2B/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;Gemma&#34;,&#34;fields&#34;:{&#34;full_attention_layers&#34;:4,&#34;global_head_dim&#34;:512,&#34;head_dim&#34;:256,&#34;num_attention_heads&#34;:8,&#34;num_hidden_layers&#34;:42,&#34;num_key_value_heads&#34;:2,&#34;num_kv_shared_layers&#34;:18,&#34;sliding_attention_layers&#34;:20,&#34;sliding_window&#34;:512,&#34;stored_layers&#34;:24},&#34;formula&#34;:&#34;mixed_full_sliding_gqa&#34;,&#34;id&#34;:&#34;gemma-4-e4b&#34;,&#34;label&#34;:&#34;Gemma 4 E4B&#34;,&#34;max_position_embeddings&#34;:131072,&#34;source_retrieved_at&#34;:&#34;2026-05-23&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/google/gemma-4-E4B/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;Gemma&#34;,&#34;fields&#34;:{&#34;full_attention_layers&#34;:5,&#34;global_head_dim&#34;:512,&#34;head_dim&#34;:256,&#34;num_attention_heads&#34;:16,&#34;num_global_key_value_heads&#34;:2,&#34;num_hidden_layers&#34;:30,&#34;num_key_value_heads&#34;:8,&#34;num_kv_shared_layers&#34;:0,&#34;sliding_attention_layers&#34;:25,&#34;sliding_window&#34;:1024,&#34;stored_layers&#34;:30},&#34;formula&#34;:&#34;mixed_full_sliding_gqa&#34;,&#34;id&#34;:&#34;gemma-4-26b-a4b&#34;,&#34;label&#34;:&#34;Gemma 4 26B-A4B&#34;,&#34;max_position_embeddings&#34;:262144,&#34;source_retrieved_at&#34;:&#34;2026-05-23&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/google/gemma-4-26B-A4B/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;Gemma&#34;,&#34;fields&#34;:{&#34;full_attention_layers&#34;:10,&#34;global_head_dim&#34;:512,&#34;head_dim&#34;:256,&#34;num_attention_heads&#34;:32,&#34;num_global_key_value_heads&#34;:4,&#34;num_hidden_layers&#34;:60,&#34;num_key_value_heads&#34;:16,&#34;num_kv_shared_layers&#34;:0,&#34;sliding_attention_layers&#34;:50,&#34;sliding_window&#34;:1024,&#34;stored_layers&#34;:60},&#34;formula&#34;:&#34;mixed_full_sliding_gqa&#34;,&#34;id&#34;:&#34;gemma-4-31b&#34;,&#34;label&#34;:&#34;Gemma 4 31B&#34;,&#34;max_position_embeddings&#34;:262144,&#34;source_retrieved_at&#34;:&#34;2026-05-23&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/google/gemma-4-31B/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;Cohere&#34;,&#34;fields&#34;:{&#34;config_max_position_embeddings&#34;:8192,&#34;head_dim&#34;:128,&#34;model_max_length&#34;:131072,&#34;num_attention_heads&#34;:64,&#34;num_hidden_layers&#34;:40,&#34;num_key_value_heads&#34;:64},&#34;formula&#34;:&#34;standard_gqa&#34;,&#34;id&#34;:&#34;cohere-command-r-v01&#34;,&#34;label&#34;:&#34;Cohere Command R v01&#34;,&#34;max_position_embeddings&#34;:131072,&#34;source_retrieved_at&#34;:&#34;2026-05-23&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/CohereLabs/c4ai-command-r-v01/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;Cohere&#34;,&#34;fields&#34;:{&#34;config_max_position_embeddings&#34;:8192,&#34;head_dim&#34;:128,&#34;model_max_length&#34;:131072,&#34;num_attention_heads&#34;:96,&#34;num_hidden_layers&#34;:64,&#34;num_key_value_heads&#34;:8},&#34;formula&#34;:&#34;standard_gqa&#34;,&#34;id&#34;:&#34;cohere-command-r-plus&#34;,&#34;label&#34;:&#34;Cohere Command R+&#34;,&#34;max_position_embeddings&#34;:131072,&#34;source_retrieved_at&#34;:&#34;2026-05-23&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/CohereLabs/c4ai-command-r-plus/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;Cohere&#34;,&#34;fields&#34;:{&#34;full_attention_layers&#34;:8,&#34;head_dim&#34;:128,&#34;num_attention_heads&#34;:32,&#34;num_hidden_layers&#34;:32,&#34;num_key_value_heads&#34;:8,&#34;sliding_attention_layers&#34;:24,&#34;sliding_window&#34;:4096,&#34;sliding_window_pattern&#34;:4},&#34;formula&#34;:&#34;mixed_full_sliding_gqa&#34;,&#34;id&#34;:&#34;cohere-command-r7b-12-2024&#34;,&#34;label&#34;:&#34;Cohere Command R7B 12-2024&#34;,&#34;max_position_embeddings&#34;:132096,&#34;source_retrieved_at&#34;:&#34;2026-05-23&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/CohereLabs/c4ai-command-r7b-12-2024/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;Cohere&#34;,&#34;fields&#34;:{&#34;full_attention_layers&#34;:16,&#34;head_dim&#34;:128,&#34;num_attention_heads&#34;:96,&#34;num_hidden_layers&#34;:64,&#34;num_key_value_heads&#34;:8,&#34;sliding_attention_layers&#34;:48,&#34;sliding_window&#34;:4096,&#34;sliding_window_pattern&#34;:4},&#34;formula&#34;:&#34;mixed_full_sliding_gqa&#34;,&#34;id&#34;:&#34;cohere-command-a-03-2025&#34;,&#34;label&#34;:&#34;Cohere Command A 03-2025&#34;,&#34;max_position_embeddings&#34;:131072,&#34;source_retrieved_at&#34;:&#34;2026-05-23&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/CohereLabs/c4ai-command-a-03-2025/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;Cohere&#34;,&#34;fields&#34;:{&#34;full_attention_layers&#34;:8,&#34;head_dim&#34;:128,&#34;num_attention_heads&#34;:128,&#34;num_hidden_layers&#34;:32,&#34;num_key_value_heads&#34;:8,&#34;sliding_attention_layers&#34;:24,&#34;sliding_window&#34;:4096},&#34;formula&#34;:&#34;mixed_full_sliding_gqa&#34;,&#34;id&#34;:&#34;cohere-command-a-plus-05-2026&#34;,&#34;label&#34;:&#34;Cohere Command A Plus 05-2026&#34;,&#34;max_position_embeddings&#34;:200000,&#34;source_retrieved_at&#34;:&#34;2026-05-23&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/CohereLabs/command-a-plus-05-2026-bf16/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;MiniMax&#34;,&#34;fields&#34;:{&#34;head_dim&#34;:128,&#34;mtp_transformer_layers&#34;:1,&#34;num_attention_heads&#34;:48,&#34;num_hidden_layers&#34;:62,&#34;num_key_value_heads&#34;:8,&#34;num_mtp_modules&#34;:3,&#34;rotary_dim&#34;:64,&#34;use_mtp&#34;:true},&#34;formula&#34;:&#34;standard_gqa&#34;,&#34;id&#34;:&#34;minimax-m2&#34;,&#34;label&#34;:&#34;MiniMax M2&#34;,&#34;max_position_embeddings&#34;:196608,&#34;source_retrieved_at&#34;:&#34;2026-05-20&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/MiniMaxAI/MiniMax-M2/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;MiniMax&#34;,&#34;fields&#34;:{&#34;head_dim&#34;:128,&#34;mtp_transformer_layers&#34;:1,&#34;num_attention_heads&#34;:48,&#34;num_hidden_layers&#34;:62,&#34;num_key_value_heads&#34;:8,&#34;num_mtp_modules&#34;:3,&#34;rotary_dim&#34;:64,&#34;use_mtp&#34;:true},&#34;formula&#34;:&#34;standard_gqa&#34;,&#34;id&#34;:&#34;minimax-m2.1&#34;,&#34;label&#34;:&#34;MiniMax M2.1&#34;,&#34;max_position_embeddings&#34;:196608,&#34;source_retrieved_at&#34;:&#34;2026-05-20&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/MiniMaxAI/MiniMax-M2.1/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;MiniMax&#34;,&#34;fields&#34;:{&#34;head_dim&#34;:128,&#34;mtp_transformer_layers&#34;:1,&#34;num_attention_heads&#34;:48,&#34;num_hidden_layers&#34;:62,&#34;num_key_value_heads&#34;:8,&#34;num_mtp_modules&#34;:3,&#34;rotary_dim&#34;:64,&#34;use_mtp&#34;:true},&#34;formula&#34;:&#34;standard_gqa&#34;,&#34;id&#34;:&#34;minimax-m2.5&#34;,&#34;label&#34;:&#34;MiniMax M2.5&#34;,&#34;max_position_embeddings&#34;:196608,&#34;source_retrieved_at&#34;:&#34;2026-05-20&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/MiniMaxAI/MiniMax-M2.5/raw/main/config.json&#34;},{&#34;default_tokens&#34;:1024,&#34;family&#34;:&#34;MiniMax&#34;,&#34;fields&#34;:{&#34;head_dim&#34;:128,&#34;mtp_transformer_layers&#34;:1,&#34;num_attention_heads&#34;:48,&#34;num_hidden_layers&#34;:62,&#34;num_key_value_heads&#34;:8,&#34;num_mtp_modules&#34;:3,&#34;rotary_dim&#34;:64,&#34;use_mtp&#34;:true},&#34;formula&#34;:&#34;standard_gqa&#34;,&#34;id&#34;:&#34;minimax-m2.7&#34;,&#34;label&#34;:&#34;MiniMax M2.7&#34;,&#34;max_position_embeddings&#34;:204800,&#34;source_retrieved_at&#34;:&#34;2026-05-20&#34;,&#34;source_url&#34;:&#34;https://huggingface.co/MiniMaxAI/MiniMax-M2.7/raw/main/config.json&#34;}],&#34;precision_options&#34;:[{&#34;bytes_per_element&#34;:2,&#34;id&#34;:&#34;bf16_fp16&#34;,&#34;label&#34;:&#34;BF16 / FP16&#34;},{&#34;bytes_per_element&#34;:1,&#34;id&#34;:&#34;fp8_int8&#34;,&#34;label&#34;:&#34;FP8 / INT8&#34;},{&#34;bytes_per_element&#34;:0.5,&#34;id&#34;:&#34;fp4_int4&#34;,&#34;label&#34;:&#34;FP4 / INT4&#34;}]}&lt;/script&gt;
&lt;script src=&#34;https://kvcache.ai/js/kv-cache-calculator.min.56015a1b5a2b3c346c0b5a492ff4c55fdfde157d980f79cb22c2968c9c1d05b6.js&#34; integrity=&#34;sha256-VgFaG1orPDRsC1pJL/TFX9/eFX2YD3nLIsKWjJwdBbY=&#34;&gt;&lt;/script&gt;
&lt;script&gt;
  window.KVCacheCalculator.mount(
    &#34;kv-cache-calculator&#34;,
    JSON.parse(document.getElementById(&#34;kv-cache-calculator-data&#34;).textContent)
  );
&lt;/script&gt;

&lt;style&gt;
  .kv-calculator-shell {
    --kv-ink: #0f172a;
    --kv-muted: #64748b;
    --kv-line: #dbe4ee;
    --kv-panel: #f8fafc;
    --kv-blue: #2563eb;
    --kv-cyan: #0891b2;
    width: min(100%, 72rem);
    margin: 0 auto;
    padding: 0;
    color: var(--kv-ink);
  }

  body:has(#kv-cache-calculator) .hb-toc {
    display: none !important;
  }

  body:has(#kv-cache-calculator) article &gt; main {
    max-width: 80rem;
  }

  body:has(#kv-cache-calculator) article h1 {
    text-align: center;
  }

  .kv-calculator-grid {
    display: grid;
    grid-template-columns: minmax(16rem, 22rem) minmax(0, 1fr);
    gap: 1rem;
    align-items: start;
  }

  .kv-controls,
  .kv-results {
    border: 1px solid var(--kv-line);
    border-radius: 8px;
    background: var(--kv-panel);
  }

  .kv-controls {
    display: grid;
    gap: 0.85rem;
    padding: 1rem;
  }

  .kv-controls label {
    display: grid;
    gap: 0.35rem;
    margin: 0;
    color: var(--kv-muted);
    font-size: 0.82rem;
    font-weight: 650;
  }

  .kv-controls .kv-checkbox-row {
    display: grid;
    grid-template-columns: 1.05rem minmax(0, 1fr);
    align-items: center;
    gap: 0.55rem;
  }

  .kv-checkbox-row input {
    width: 1.05rem;
    min-height: 1.05rem;
    margin: 0;
  }

  .kv-controls [hidden] {
    display: none !important;
  }

  .kv-controls select,
  .kv-controls input {
    width: 100%;
    min-height: 2.75rem;
    border: 1px solid #cbd5e1;
    border-radius: 7px;
    background: #fff;
    color: var(--kv-ink);
    font: inherit;
    font-size: 0.95rem;
    padding: 0.55rem 0.7rem;
  }

  .kv-controls input[type=&#34;checkbox&#34;] {
    width: 1.05rem;
    min-height: 1.05rem;
    padding: 0;
  }

  .kv-controls select:focus,
  .kv-controls input:focus {
    outline: 2px solid rgba(37, 99, 235, 0.2);
    border-color: var(--kv-blue);
  }

  .kv-results {
    display: grid;
    gap: 1rem;
    padding: 1rem;
  }

  .kv-total-band {
    display: flex;
    justify-content: space-between;
    gap: 1rem;
    padding: 1rem;
    border-radius: 8px;
    background: #e0f2fe;
    border: 1px solid #bae6fd;
  }

  .kv-total-band span,
  .kv-metric-grid span {
    display: block;
    color: var(--kv-muted);
    font-size: 0.82rem;
    font-weight: 650;
  }

  .kv-total-band strong {
    display: block;
    margin-top: 0.2rem;
    color: #0c4a6e;
    font-size: clamp(2rem, 4vw, 3.2rem);
    line-height: 1;
    letter-spacing: 0;
    white-space: nowrap;
  }

  .kv-total-band em {
    align-self: end;
    color: #0369a1;
    font-style: normal;
    font-weight: 700;
    white-space: nowrap;
  }

  .kv-metric-grid {
    display: grid;
    grid-template-columns: repeat(auto-fit, minmax(9rem, 1fr));
    gap: 0.75rem;
  }

  .kv-metric-grid div {
    min-height: 5rem;
    padding: 0.85rem;
    border: 1px solid var(--kv-line);
    border-radius: 8px;
    background: #fff;
  }

  .kv-metric-grid strong {
    display: block;
    margin-top: 0.4rem;
    font-size: 1.2rem;
    letter-spacing: 0;
    white-space: nowrap;
  }

  .kv-help {
    position: relative;
    display: inline-grid;
    place-items: center;
    width: 1rem;
    height: 1rem;
    margin-left: 0.35rem;
    padding: 0;
    border: 1px solid #cbd5e1;
    border-radius: 999px;
    background: #fff;
    color: var(--kv-muted);
    font: inherit;
    font-size: 0.68rem;
    font-weight: 800;
    line-height: 1;
    vertical-align: 0.08rem;
    cursor: help;
  }

  .kv-help::after {
    display: none;
    position: absolute;
    z-index: 5;
    top: 50%;
    left: calc(100% + 0.45rem);
    width: max-content;
    max-width: min(18rem, calc(100vw - 2rem));
    padding: 0.55rem 0.65rem;
    border: 1px solid var(--kv-line);
    border-radius: 7px;
    background: #fff;
    box-shadow: 0 10px 28px rgba(15, 23, 42, 0.14);
    color: var(--kv-ink);
    content: attr(data-kv-tooltip);
    font-family: inherit;
    font-size: 0.78rem;
    font-weight: 550;
    line-height: 1.45;
    opacity: 0;
    pointer-events: none;
    text-align: left;
    transform: translateY(-50%);
    transition: opacity 0.12s ease;
    white-space: normal;
  }

  .kv-help:hover::after,
  .kv-help:focus::after,
  .kv-help:focus-visible::after,
  .kv-help[data-kv-open=&#34;true&#34;]::after {
    display: block;
    opacity: 1;
  }

  .kv-formula-panel {
    display: grid;
    gap: 0.65rem;
    padding: 0.9rem;
    border: 1px solid var(--kv-line);
    border-radius: 8px;
    background: #fff;
  }

  .kv-formula-heading {
    color: var(--kv-cyan);
    font-weight: 750;
  }

  .kv-formula-list {
    display: grid;
    gap: 0.55rem;
  }

  .kv-formula-row {
    display: grid;
    grid-template-columns: minmax(7.5rem, max-content) 1rem minmax(0, 1fr);
    gap: 0.55rem;
    align-items: start;
    padding: 0.7rem;
    border: 1px solid #dbeafe;
    border-radius: 7px;
    background: #f8fafc;
  }

  .kv-formula-name,
  .kv-formula-equals,
  .kv-formula-expression {
    font-family: ui-monospace, SFMono-Regular, Menlo, Monaco, Consolas, &#34;Liberation Mono&#34;, &#34;Courier New&#34;, monospace;
    font-size: 0.82rem;
    line-height: 1.55;
    letter-spacing: 0;
    min-width: 0;
  }

  .kv-formula-name {
    color: #075985;
    font-weight: 750;
    overflow-wrap: anywhere;
  }

  .kv-formula-equals {
    color: var(--kv-muted);
    text-align: center;
  }

  .kv-formula-expression {
    color: #1e293b;
    overflow-wrap: anywhere;
  }

  .kv-formula-panel p {
    margin: 0;
    color: var(--kv-muted);
    font-size: 0.9rem;
    line-height: 1.55;
  }

  .kv-breakdown {
    display: grid;
    gap: 0.45rem;
  }

  .kv-breakdown-row {
    display: flex;
    justify-content: space-between;
    gap: 1rem;
    padding: 0.62rem 0;
    border-bottom: 1px solid #e2e8f0;
    color: var(--kv-muted);
    font-size: 0.9rem;
  }

  .kv-breakdown-row strong {
    color: var(--kv-ink);
    text-align: right;
  }

  .kv-source-link {
    color: var(--kv-blue);
    font-size: 0.82rem;
    overflow-wrap: anywhere;
  }

  @media (max-width: 860px) {
    .kv-total-band {
      align-items: start;
      flex-direction: column;
    }

    .kv-calculator-grid {
      grid-template-columns: 1fr;
    }

    .kv-metric-grid {
      grid-template-columns: 1fr;
    }

    .kv-formula-row {
      grid-template-columns: 1fr;
      gap: 0.25rem;
    }

    .kv-formula-equals {
      display: none;
    }

    .kv-help::after {
      top: calc(100% + 0.4rem);
      right: auto;
      left: 50%;
      width: 14rem;
      max-width: calc(100vw - 2rem);
      transform: translateX(-50%);
    }
  }

  :is(.dark .kv-calculator-shell) {
    --kv-ink: #e2e8f0;
    --kv-muted: #94a3b8;
    --kv-line: #334155;
    --kv-panel: #111827;
  }

  :is(.dark .kv-controls),
  :is(.dark .kv-results),
  :is(.dark .kv-formula-panel) {
    background: #020617;
  }

  :is(.dark .kv-controls select),
  :is(.dark .kv-controls input),
  :is(.dark .kv-help) {
    background: #020617;
    color: #e2e8f0;
    border-color: #475569;
  }

  :is(.dark .kv-total-band) {
    background: #0b1220;
    border-color: #1d4ed8;
  }

  :is(.dark .kv-total-band strong),
  :is(.dark .kv-total-band em) {
    color: #93c5fd;
  }

  :is(.dark .kv-formula-row) {
    background: #0f172a;
    border-color: #1e293b;
  }

  :is(.dark .kv-formula-name) {
    color: #67e8f9;
  }

  :is(.dark .kv-formula-expression) {
    color: #e2e8f0;
  }

  :is(.dark .kv-help::after) {
    background: #020617;
    color: #e2e8f0;
    border-color: #334155;
  }
&lt;/style&gt;

</description>
    </item>
    
  </channel>
</rss>
