Updating model comparison table for recent model ships (#58557)

dihydroJenoxide · sunbrye · web-flow · commit b09f0becdfd8 · 2026-01-13T18:04:34.000Z
Co-authored-by: sunbrye <sunbrye@github.com>
Co-authored-by: Sunbrye Ly <56200261+sunbrye@users.noreply.github.com>
diff --git a/content/copilot/reference/ai-models/model-comparison.md b/content/copilot/reference/ai-models/model-comparison.md
@@ -29,23 +29,12 @@ contentType: reference
 
 Use this table to find a suitable model quickly, see more detail in the sections below.
 
-| Model                                                 | Task area                                        | Excels at (primary use case)                                            | Additional capabilities       | Further reading                                                                                                                                                |
-|-------------------------------------------------------|--------------------------------------------------|-------------------------------------------------------------------------|-------------------------------|----------------------------------------------------------------------------------------------------------------------------------------------------------------|
-| {% data variables.copilot.copilot_gpt_41 %}           | General-purpose coding and writing               | Fast, accurate code completions and explanations                        | Agent mode, vision            | [{% data variables.copilot.copilot_gpt_41 %} model card](https://openai.com/index/gpt-4-1/)                                                                    |
-| {% data variables.copilot.copilot_gpt_52 %}           | Deep reasoning and debugging                     | Multi-step problem solving and architecture-level code analysis         | Agent mode                    | Not available                                                                                                                                                  |
-| {% data variables.copilot.copilot_gpt_51 %}           | Deep reasoning and debugging                     | Multi-step problem solving and architecture-level code analysis         | Agent mode                    | Not available                                                                                                                                                  |
-| {% data variables.copilot.copilot_gpt_5_codex %}      | General-purpose coding and writing               | Fast, accurate code completions and explanations                        | Agent mode                    | [{% data variables.copilot.copilot_gpt_5_codex %} model card](https://cdn.openai.com/pdf/97cc5669-7a25-4e63-b15f-5fd5bdc4d149/gpt-5-codex-system-card.pdf)     |
-| {% data variables.copilot.copilot_gpt_5_mini %}       | General-purpose coding and writing               | Fast, accurate code completions and explanations                        | Agent mode, reasoning, vision | [{% data variables.copilot.copilot_gpt_5_mini %} model card](https://cdn.openai.com/gpt-5-system-card.pdf)                                                     |
-| {% data variables.copilot.copilot_gpt_5 %}            | Deep reasoning and debugging                     | Multi-step problem solving and architecture-level code analysis         | Reasoning                     | [{% data variables.copilot.copilot_gpt_5 %} model card](https://cdn.openai.com/gpt-5-system-card.pdf)                                                          |
-| {% data variables.copilot.copilot_claude_haiku_45 %}  | Fast help with simple or repetitive tasks | Fast, reliable answers to lightweight coding questions             | Agent mode                    | Not available                                                                                                                                                  |
-| {% data variables.copilot.copilot_claude_sonnet_45 %} | General-purpose coding and agent tasks           | Complex problem-solving challenges, sophisticated reasoning             | Agent mode                    | [{% data variables.copilot.copilot_claude_sonnet_45 %} model card](https://assets.anthropic.com/m/12f214efcc2f457a/original/Claude-Sonnet-4-5-System-Card.pdf) |
-| {% data variables.copilot.copilot_claude_opus_41 %}   | Deep reasoning and debugging                     | Complex problem-solving challenges, sophisticated reasoning             | Reasoning, vision             | [{% data variables.copilot.copilot_claude_opus_41 %} model card](https://assets.anthropic.com/m/4c024b86c698d3d4/original/Claude-4-1-System-Card.pdf)          |
-| {% data variables.copilot.copilot_claude_sonnet_40 %} | Deep reasoning and debugging                     | Performance and practicality, perfectly balanced for coding workflows   | Agent mode, vision            | [{% data variables.copilot.copilot_claude_sonnet_40 %} model card](https://www-cdn.anthropic.com/6be99a52cb68eb70eb9572b4cafad13df32ed995.pdf)                 |
-| {% data variables.copilot.copilot_gemini_25_pro %}    | Deep reasoning and debugging                     | Complex code generation, debugging, and research workflows              | Reasoning, vision             | [{% data variables.copilot.copilot_gemini_25_pro %} model card](https://storage.googleapis.com/model-cards/documents/gemini-2.5-pro.pdf)                       |
-| {% data variables.copilot.copilot_gemini_3_flash %}   | Fast help with simple or repetitive tasks | Fast, reliable answers to lightweight coding questions             | Agent mode                    | Not available                                                                                                                                                  |
-| {% data variables.copilot.copilot_grok_code %}        | General-purpose coding and writing               | Fast, accurate code completions and explanations                        | Agent mode                    | [{% data variables.copilot.copilot_grok_code %} model card](https://data.x.ai/2025-08-20-grok-4-model-card.pdf)                                                |
-| {% data variables.copilot.copilot_qwen_25 %}          | General-purpose coding and writing               | Code generation, reasoning, and code repair / debugging                 | Reasoning                     | [{% data variables.copilot.copilot_qwen_25 %} model card](https://arxiv.org/pdf/2409.12186)                                                                    |
-| {% data variables.copilot.copilot_raptor_mini %}      | General-purpose coding and writing               | Fast, accurate code completions and explanations                 | Agent mode                    | Coming soon                                                                                                                                                    |
+
+| Model                                              | Task area             | Excels at (primary use case) | Further reading             |
+|----------------------------------------------------|-----------------------|------------------------------|-----------------------------|
+| {% for model in tables.copilot.model-comparison %} |
+| {{ model.name }}                                   | {{ model.task_area }} | {{ model.excels_at }}        | {{ model.further_reading }} |
+| {% endfor %}                                       |
 
 ## Task: General-purpose coding and writing
 
diff --git a/data/tables/copilot/model-comparison.yml b/data/tables/copilot/model-comparison.yml
@@ -0,0 +1,112 @@
+# Please keep this list sorted in the following order:
+# 1. By provider, in this order:
+#    - OpenAI
+#    - Anthropic
+#    - Google
+#    - xAI, followed by all other providers
+# 2. Within each provider group, alphabetically by model name.
+
+# OpenAI
+- name: GPT-4.1
+  task_area: General-purpose coding and writing
+  excels_at: Fast, accurate code completions and explanations
+  further_reading: '[GPT-4.1 model card](https://openai.com/index/gpt-4-1/)'
+
+- name: GPT-5
+  task_area: Deep reasoning and debugging
+  excels_at: Multi-step problem solving and architecture-level code analysis
+  further_reading: '[GPT-5 model card](https://cdn.openai.com/gpt-5-system-card.pdf)'
+
+- name: GPT-5-Codex
+  task_area: General-purpose coding and writing
+  excels_at: Fast, accurate code completions and explanations
+  further_reading: '[GPT-5-Codex model card](https://cdn.openai.com/pdf/97cc5669-7a25-4e63-b15f-5fd5bdc4d149/gpt-5-codex-system-card.pdf)'
+
+- name: GPT-5 mini
+  task_area: General-purpose coding and writing
+  excels_at: Fast, accurate code completions and explanations
+  further_reading: '[GPT-5 mini model card](https://cdn.openai.com/gpt-5-system-card.pdf)'
+
+- name: GPT-5.1
+  task_area: Deep reasoning and debugging
+  excels_at: Multi-step problem solving and architecture-level code analysis
+  further_reading: '[GPT-5.1 model card](https://cdn.openai.com/pdf/4173ec8d-1229-47db-96de-06d87147e07e/5_1_system_card.pdf)'
+
+- name: GPT-5.1-Codex
+  task_area: Deep reasoning and debugging
+  excels_at: Multi-step problem solving and architecture-level code analysis
+  further_reading: 'Not available'
+
+- name: GPT-5.1-Codex-Max
+  task_area: Agentic software development
+  excels_at: Agentic tasks
+  further_reading: '[GPT-5.1-Codex-Max model card](https://cdn.openai.com/pdf/2a7d98b1-57e5-4147-8d0e-683894d782ae/5p1_codex_max_card_03.pdf)'
+
+- name: GPT-5.1-Codex-Mini
+  task_area: Deep reasoning and debugging
+  excels_at: Multi-step problem solving and architecture-level code analysis
+  further_reading: 'Not available'
+
+- name: GPT-5.2
+  task_area: Deep reasoning and debugging
+  excels_at: Multi-step problem solving and architecture-level code analysis
+  further_reading: '[GPT-5.2 model card](https://cdn.openai.com/pdf/3a4153c8-c748-4b71-8e31-aecbde944f8d/oai_5_2_system-card.pdf)'
+
+# Anthropic
+- name: Claude Haiku 4.5
+  task_area: Fast help with simple or repetitive tasks
+  excels_at: Fast, reliable answers to lightweight coding questions
+  further_reading: '[Claude Haiku 4.5 model card](https://assets.anthropic.com/m/99128ddd009bdcb/Claude-Haiku-4-5-System-Card.pdf)'
+
+- name: Claude Opus 4.1
+  task_area: Deep reasoning and debugging
+  excels_at: Complex problem-solving challenges, sophisticated reasoning
+  further_reading: '[Claude Opus 4.1 model card](https://assets.anthropic.com/m/4c024b86c698d3d4/original/Claude-4-1-System-Card.pdf)'
+
+- name: Claude Opus 4.5
+  task_area: Deep reasoning and debugging
+  excels_at: Complex problem-solving challenges, sophisticated reasoning
+  further_reading: '[Claude Opus 4.5 model card](https://assets.anthropic.com/m/64823ba7485345a7/Claude-Opus-4-5-System-Card.pdf)'
+
+- name: Claude Sonnet 4.0
+  task_area: Deep reasoning and debugging
+  excels_at: Performance and practicality, perfectly balanced for coding workflows
+  further_reading: '[Claude Sonnet 4.0 model card](https://www-cdn.anthropic.com/6be99a52cb68eb70eb9572b4cafad13df32ed995.pdf)'
+
+- name: Claude Sonnet 4.5
+  task_area: General-purpose coding and agent tasks
+  excels_at: Complex problem-solving challenges, sophisticated reasoning
+  further_reading: '[Claude Sonnet 4.5 model card](https://assets.anthropic.com/m/12f214efcc2f457a/original/Claude-Sonnet-4-5-System-Card.pdf)'
+
+# Google
+- name: Gemini 2.5 Pro
+  task_area: Deep reasoning and debugging
+  excels_at: Complex code generation, debugging, and research workflows
+  further_reading: '[Gemini 2.5 Pro model card](https://storage.googleapis.com/model-cards/documents/gemini-2.5-pro.pdf)'
+
+- name: Gemini 3 Flash
+  task_area: Fast help with simple or repetitive tasks
+  excels_at: Fast, reliable answers to lightweight coding questions
+  further_reading: '[Gemini 3 Flash model card](https://storage.googleapis.com/deepmind-media/Model-Cards/Gemini-3-Flash-Model-Card.pdf)'
+
+- name: Gemini 3 Pro
+  task_area: Deep reasoning and debugging
+  excels_at: Complex code generation, debugging, and research workflows
+  further_reading: '[Gemini 3 Pro model card](https://storage.googleapis.com/deepmind-media/Model-Cards/Gemini-3-Pro-Model-Card.pdf)'
+
+# xAI
+- name: Grok Code Fast 1
+  task_area: General-purpose coding and writing
+  excels_at: Fast, accurate code completions and explanations
+  further_reading: '[Grok Code Fast 1 model card](https://data.x.ai/2025-08-20-grok-4-model-card.pdf)'
+
+# Other providers (alphabetized by model name)
+- name: Qwen2.5
+  task_area: General-purpose coding and writing
+  excels_at: Code generation, reasoning, and code repair / debugging
+  further_reading: '[Qwen2.5 model card](https://arxiv.org/pdf/2409.12186)'
+
+- name: Raptor mini
+  task_area: General-purpose coding and writing
+  excels_at: Fast, accurate code completions and explanations
+  further_reading: 'Coming soon'
diff --git a/src/data-directory/lib/data-schemas/tables/copilot/model-comparison.ts b/src/data-directory/lib/data-schemas/tables/copilot/model-comparison.ts
@@ -0,0 +1,37 @@
+/**
+ * JSON schema that enforces the structure of
+ * data/tables/copilot/model-comparison.yml.
+ *
+ * That file is a top-level YAML sequence of model entries, and
+ * model-comparison.md iterates it directly with
+ * `{% for model in tables.copilot.model-comparison %}`, so the schema root
+ * is an array rather than an object wrapping a `models` key.
+ */
+const modelComparisonSchema = {
+  type: 'array',
+  items: {
+    type: 'object',
+    additionalProperties: false,
+    required: ['name', 'task_area', 'excels_at', 'further_reading'],
+    properties: {
+      name: {
+        type: 'string',
+        lintable: true,
+      },
+      task_area: {
+        type: 'string',
+        lintable: true,
+      },
+      excels_at: {
+        type: 'string',
+        lintable: true,
+      },
+      further_reading: {
+        type: 'string',
+        lintable: true,
+      },
+    },
+  },
+}
+
+export default modelComparisonSchema