{"id": 1012326, "name": "Performance on math and problem-solving tasks", "unit": "%", "createdAt": "2025-02-17T13:09:24.000Z", "updatedAt": "2025-04-22T21:23:29.000Z", "coverage": "", "timespan": "", "datasetId": 6946, "shortUnit": "%", "columnOrder": 0, "shortName": "performance_math", "catalogPath": "grapher/artificial_intelligence/2025-02-17/papers_with_code_math/papers_with_code_math#performance_math", "type": "float", "dataChecksum": "12840461999411394973", "metadataChecksum": "-5045756479575391148", "datasetName": "AI Performance on Math Problems", "datasetVersion": "2025-02-17", "nonRedistributable": false, "display": {"unit": "%", "zeroDay": "2021-03-05", "shortUnit": "%", "yearIsDay": true, "numDecimalPlaces": 1}, "schemaVersion": 2, "processingLevel": "major", "presentation": {"topicTagsLinks": ["Artificial Intelligence"]}, "descriptionKey": ["This benchmark assesses the accuracy of models on math and problem solving tasks based on the MATH benchmark.", "The MATH benchmark consists of 12,500 challenging competition mathematics problems. Each problem in MATH has a full step-by-step solution which can be used to teach models to generate answer derivations and explanations."], "dimensions": {"years": {"values": [{"id": 0}, {"id": 481}, {"id": 886}, {"id": 893}, {"id": 1128}, {"id": 1293}, {"id": 1377}]}, "entities": {"values": [{"id": 369310, "name": "State of the art", "code": null}]}}, "origins": [{"id": 2884, "title": "AI Performance on Math Problems", "descriptionSnapshot": "Problem Solving on MATH dataset of 12,500 challenging competition mathematics problems. Each problem in MATH has a full step-by-step solution which can be used to teach models to generate answer derivations and explanations.\n", "producer": "Papers with Code", "citationFull": "Math Word Problem Solving on MATH. 
Papers with Code (2025)", "urlMain": "https://paperswithcode.com/sota/math-word-problem-solving-on-math", "urlDownload": "https://paperswithcode.com/sota/math-word-problem-solving-on-math", "dateAccessed": "2025-02-17", "datePublished": "2025-02-17", "license": {"url": "https://creativecommons.org/licenses/by-sa/4.0/", "name": "CC BY-SA 4.0"}}]}