Spaces:
Runtime error
Runtime error
| { | |
| "time": "241031154353", | |
| "results": { | |
| "GPT-4o (0513, detail-high)": { | |
| "META": { | |
| "Method": [ | |
| "GPT-4o (0513, detail-high)", | |
| "https://openai.com/index/hello-gpt-4o/" | |
| ], | |
| "Parameters": "", | |
| "Language Model": "", | |
| "Vision Model": "", | |
| "Org": "OpenAI", | |
| "Time": "2024/05/31", | |
| "Verified": "Yes", | |
| "OpenSource": "No", | |
| "key": 270, | |
| "dir_name": "GPT4o_HIGH" | |
| }, | |
| "Shopping Concept Understanding": { | |
| "Rec": 67.8, | |
| "Ocr": 76.8, | |
| "Know": 58.3, | |
| "Gen": 56.9, | |
| "Spat": 74.3, | |
| "Math": 76.2, | |
| "Overall": 69.1, | |
| "Overall (official)": "N/A" | |
| }, | |
| "Shopping Knowledge Reasoning": { | |
| "Overall": 61.3, | |
| "SCI": 64.8, | |
| "TQA": 70.3, | |
| "NUM": 44.4, | |
| "ARI": 58.4, | |
| "VQA": 47.5, | |
| "GEO": 61.5, | |
| "ALG": 62.3, | |
| "GPS": 60.1, | |
| "MWP": 69.9, | |
| "LOG": 43.2, | |
| "FQA": 60.2, | |
| "STA": 68.4 | |
| }, | |
| "User Behavior Alignment": { | |
| "Text Recognition": 199, | |
| "Scene Text-centric VQA": 181, | |
| "Doc-oriented VQA": 168, | |
| "Key Information Extraction": 170, | |
| "Handwritten Mathematical Expression Recognition": 18, | |
| "Overall": 736 | |
| }, | |
| "Multi-lingual Abilities": { | |
| "Overall": 63.9, | |
| "coarse perception": 73.6, | |
| "fine-grained perception": 54.8, | |
| "instance reasoning": 66.4, | |
| "logical reasoning": 72.0, | |
| "math": 66.4, | |
| "science & technology": 50.0 | |
| } | |
| } | |
| } | |
| } |