Redesign Mermaid as infographics-style mindmap with visual bars
This commit is contained in:
147
README.md
147
README.md
@@ -30,115 +30,44 @@ GLM-4.7 demonstrates competitive performance against the newest generation of fl
|
||||
*Note: Best scores per category are highlighted in $\color{green}{\text{green}}$. Data sourced from [Z.ai Official Blog](https://z.ai/blog/glm-4.7).*
|
||||
|
||||
```mermaid
|
||||
flowchart TD
|
||||
subgraph GLM [🚀 GLM-4.7 Dominance]
|
||||
direction TB
|
||||
MATH[🧮 MATH<br/>AIME 25]
|
||||
CODING[💻 CODING<br/>LiveCodeBench v6]
|
||||
SCIENCE[🔬 SCIENCE<br/>GPQA-Diamond]
|
||||
LOGIC[🧠 LOGIC<br/>HLE w/Tools]
|
||||
ENGINEERING[⚙️ ENGINEERING<br/>SWE-bench]
|
||||
AGENTIC[🤖 AGENTIC<br/>τ²-Bench]
|
||||
|
||||
GLM_MATH[<b>GLM-4.7<br/>95.7%</b>]
|
||||
GLM_CODING[<b>GLM-4.7<br/>84.9%</b>]
|
||||
GLM_SCIENCE[<b>GLM-4.7<br/>85.7%</b>]
|
||||
GLM_LOGIC[<b>GLM-4.7<br/>42.8%</b>]
|
||||
GLM_ENG[<b>GLM-4.7<br/>73.8%</b>]
|
||||
GLM_AGENT[<b>GLM-4.7<br/>87.4%</b>]
|
||||
|
||||
MATH --> GLM_MATH
|
||||
CODING --> GLM_CODING
|
||||
SCIENCE --> GLM_SCIENCE
|
||||
LOGIC --> GLM_LOGIC
|
||||
ENGINEERING --> GLM_ENG
|
||||
AGENTIC --> GLM_AGENT
|
||||
end
|
||||
|
||||
subgraph COMPETITORS [📊 Top Competitors]
|
||||
direction LR
|
||||
|
||||
subgraph GEM [💎 Gemini 3.0 Pro]
|
||||
G_MATH[95.0%]
|
||||
G_CODING[<b>90.7%</b>]
|
||||
G_SCIENCE[<b>91.9%</b>]
|
||||
G_LOGIC[<b>45.8%</b>]
|
||||
G_ENG[76.2%]
|
||||
G_AGENT[<b>90.7%</b>]
|
||||
end
|
||||
|
||||
subgraph GPT [🔵 GPT-5.1 High]
|
||||
P_MATH[94.0%]
|
||||
P_CODING[87.0%]
|
||||
P_SCIENCE[<b>88.1%</b>]
|
||||
P_LOGIC[42.7%]
|
||||
P_ENG[76.3%]
|
||||
P_AGENT[82.7%]
|
||||
end
|
||||
|
||||
subgraph DS [🟢 DeepSeek-V3.2]
|
||||
D_MATH[93.1%]
|
||||
D_CODING[83.3%]
|
||||
D_SCIENCE[82.4%]
|
||||
D_LOGIC[40.8%]
|
||||
D_ENG[73.1%]
|
||||
D_AGENT[85.3%]
|
||||
end
|
||||
|
||||
subgraph CLAUDE [🟣 Claude Sonnet 4.5]
|
||||
C_MATH[87.0%]
|
||||
C_CODING[64.0%]
|
||||
C_SCIENCE[83.4%]
|
||||
C_LOGIC[32.0%]
|
||||
C_ENG[<b>77.2%</b>]
|
||||
C_AGENT[87.2%]
|
||||
end
|
||||
end
|
||||
|
||||
GLM_MATH -.-> G_MATH
|
||||
GLM_MATH -.-> P_MATH
|
||||
GLM_MATH -.-> D_MATH
|
||||
GLM_MATH -.-> C_MATH
|
||||
|
||||
GLM_CODING -.-> G_CODING
|
||||
GLM_CODING -.-> P_CODING
|
||||
GLM_CODING -.-> D_CODING
|
||||
GLM_CODING -.-> C_CODING
|
||||
|
||||
GLM_SCIENCE -.-> G_SCIENCE
|
||||
GLM_SCIENCE -.-> P_SCIENCE
|
||||
GLM_SCIENCE -.-> D_SCIENCE
|
||||
GLM_SCIENCE -.-> C_SCIENCE
|
||||
|
||||
GLM_LOGIC -.-> G_LOGIC
|
||||
GLM_LOGIC -.-> P_LOGIC
|
||||
GLM_LOGIC -.-> D_LOGIC
|
||||
GLM_LOGIC -.-> C_LOGIC
|
||||
|
||||
GLM_ENG -.-> G_ENG
|
||||
GLM_ENG -.-> P_ENG
|
||||
GLM_ENG -.-> D_ENG
|
||||
GLM_ENG -.-> C_ENG
|
||||
|
||||
GLM_AGENT -.-> G_AGENT
|
||||
GLM_AGENT -.-> P_AGENT
|
||||
GLM_AGENT -.-> D_AGENT
|
||||
GLM_AGENT -.-> C_AGENT
|
||||
|
||||
classDef glmNode fill:#00C853,stroke:#004D40,stroke-width:3px,color:#FFFFFF,font-weight:bold,font-size:13px,radius:8px
|
||||
classDef geminiNode fill:#FFB74D,stroke:#E65100,stroke-width:2px,color:#FFFFFF,font-weight:bold,font-size:12px,radius:6px
|
||||
classDef gptNode fill:#64B5F6,stroke:#1565C0,stroke-width:2px,color:#FFFFFF,font-weight:bold,font-size:12px,radius:6px
|
||||
classDef deepseekNode fill:#4DB6AC,stroke:#00695C,stroke-width:2px,color:#FFFFFF,font-weight:bold,font-size:12px,radius:6px
|
||||
classDef claudeNode fill:#AB47BC,stroke:#6A1B9A,stroke-width:2px,color:#FFFFFF,font-weight:bold,font-size:12px,radius:6px
|
||||
classDef categoryNode fill:#37474F,stroke:#263238,stroke-width:2px,color:#ECEFF1,font-weight:bold,font-size:11px,radius:4px
|
||||
classDef subgraphNode fill:#FAFAFA,stroke:#B0BEC5,stroke-width:2px,stroke-dasharray: 5 5
|
||||
|
||||
class GLM_MATH,GLM_CODING,GLM_SCIENCE,GLM_LOGIC,GLM_ENG,GLM_AGENT glmNode
|
||||
class G_MATH,G_CODING,G_SCIENCE,G_LOGIC,G_ENG,G_AGENT geminiNode
|
||||
class P_MATH,P_CODING,P_SCIENCE,P_LOGIC,P_ENG,P_AGENT gptNode
|
||||
class D_MATH,D_CODING,D_SCIENCE,D_LOGIC,D_ENG,D_AGENT deepseekNode
|
||||
class C_MATH,C_CODING,C_SCIENCE,C_LOGIC,C_ENG,C_AGENT claudeNode
|
||||
class MATH,CODING,SCIENCE,LOGIC,ENGINEERING,AGENTIC categoryNode
|
||||
mindmap
|
||||
root((GLM-4.7<br/>🏆 SOTA 2025))
|
||||
Math🧮
|
||||
AIME 25<br/><b>95.7%</b><br/>━━━━━━━━━
|
||||
GPT: 94.0%<br/>━━━━━━━━░
|
||||
Gemini: 95.0%<br/>━━━━━━━━━
|
||||
DeepSeek: 93.1%<br/>━━━━━━━━░
|
||||
Claude: 87.0%<br/>━━━━━━░░░
|
||||
Coding💻
|
||||
LiveCode<br/><b>84.9%</b><br/>━━━━━━━━━
|
||||
GPT: 87.0%<br/>━━━━━━━━━
|
||||
Gemini: <b>90.7%</b><br/>━━━━━━━━━
|
||||
DeepSeek: 83.3%<br/>━━━━━━━━░
|
||||
Claude: 64.0%<br/>━━━━░░░░
|
||||
Science🔬
|
||||
GPQA<br/><b>85.7%</b><br/>━━━━━━━━━
|
||||
GPT: 88.1%<br/>━━━━━━━━━
|
||||
Gemini: <b>91.9%</b><br/>━━━━━━━━━
|
||||
DeepSeek: 82.4%<br/>━━━━━━░░░
|
||||
Claude: 83.4%<br/>━━━━━━░░░
|
||||
Logic🧠
|
||||
HLE<br/><b>42.8%</b><br/>━━━━━━░░░
|
||||
GPT: 42.7%<br/>━━━━━━░░░
|
||||
Gemini: <b>45.8%</b><br/>━━━━━━▓░░
|
||||
DeepSeek: 40.8%<br/>━━━━━━░░░
|
||||
Claude: 32.0%<br/>━━━━░░░░
|
||||
Engineering⚙️
|
||||
SWE-bench<br/><b>73.8%</b><br/>━━━━━━━━━
|
||||
GPT: 76.3%<br/>━━━━━━━━━
|
||||
Gemini: 76.2%<br/>━━━━━━━━░
|
||||
DeepSeek: 73.1%<br/>━━━━━━░░░
|
||||
Claude: <b>77.2%</b><br/>━━━━━━━━━
|
||||
Agentic🤖
|
||||
τ²-Bench<br/><b>87.4%</b><br/>━━━━━━━━━
|
||||
GPT: 82.7%<br/>━━━━━━░░░
|
||||
Gemini: <b>90.7%</b><br/>━━━━━━━━━
|
||||
DeepSeek: 85.3%<br/>━━━━━━━━░
|
||||
Claude: 87.2%<br/>━━━━━━━━░
|
||||
```
|
||||
|
||||
| Category | Benchmark | **GLM-4.7** | Claude Sonnet 4.5 | GPT-5.1 High | DeepSeek-V3.2 | Gemini 3.0 Pro | Source |
|
||||
|
||||
Reference in New Issue
Block a user