@omarsar0
We need more challenging benchmarks to test long-horizon coding capabilities. FrontierSWE looks like a nice new set of tasks to test out your best coding agents or harnesses.
Viewing enriched Twitter post
We need more challenging benchmarks to test long-horizon coding capabilities. FrontierSWE looks like a nice new set of tasks to test out your best coding agents or harnesses.
{
"score": 0.34,
"score_components": {
"author": 0.09,
"engagement": 0.0,
"quality": 0.04000000000000001,
"source": 0.135,
"nlp": 0.05,
"recency": 0.025
},
"scored_at": "2026-04-16T23:20:47.397739",
"import_source": "api_import",
"source_tagged_at": "2026-04-16T23:20:47.397750",
"enriched": true,
"enriched_at": "2026-04-16T23:20:47.397752"
} {
"type": "tweet",
"id": "2044918815591370826",
"url": "https://x.com/omarsar0/status/2044918815591370826",
"twitterUrl": "https://twitter.com/omarsar0/status/2044918815591370826",
"text": "We need more challenging benchmarks to test long-horizon coding capabilities. \n\nFrontierSWE looks like a nice new set of tasks to test out your best coding agents or harnesses.",
"source": "Twitter for iPhone",
"retweetCount": 0,
"replyCount": 0,
"likeCount": 0,
"quoteCount": 0,
"viewCount": 18,
"createdAt": "Thu Apr 16 23:20:13 +0000 2026",
"lang": "en",
"bookmarkCount": 0,
"isReply": false,
"inReplyToId": null,
"conversationId": "2044918815591370826",
"displayTextRange": [
0,
176
],
"inReplyToUserId": null,
"inReplyToUsername": null,
"author": {
"type": "user",
"userName": "omarsar0",
"url": "https://x.com/omarsar0",
"twitterUrl": "https://twitter.com/omarsar0",
"id": "3448284313",
"name": "elvis",
"isVerified": false,
"isBlueVerified": true,
"verifiedType": null,
"profilePicture": "https://pbs.twimg.com/profile_images/939313677647282181/vZjFWtAn_normal.jpg",
"coverPicture": "https://pbs.twimg.com/profile_banners/3448284313/1565974901",
"description": "",
"location": "DAIR.AI Academy",
"followers": 298378,
"following": 811,
"status": "",
"canDm": true,
"canMediaTag": true,
"createdAt": "Fri Sep 04 12:59:26 +0000 2015",
"entities": {
"description": {
"urls": []
},
"url": {}
},
"fastFollowersCount": 0,
"favouritesCount": 35438,
"hasCustomTimelines": true,
"isTranslator": true,
"mediaCount": 4599,
"statusesCount": 17641,
"withheldInCountries": [],
"affiliatesHighlightedLabel": {},
"possiblySensitive": false,
"pinnedTweetIds": [
"2044769798845079665"
],
"profile_bio": {
"description": "Building @dair_ai • Prev: Meta AI, Elastic, PhD • New AI learning portal: https://t.co/1e8RZKs4uX",
"entities": {
"description": {
"hashtags": [],
"symbols": [],
"urls": [
{
"display_url": "academy.dair.ai",
"expanded_url": "https://academy.dair.ai/",
"indices": [
74,
97
],
"url": "https://t.co/1e8RZKs4uX"
}
],
"user_mentions": [
{
"id_str": "0",
"indices": [
9,
17
],
"name": "",
"screen_name": "dair_ai"
}
]
},
"url": {
"urls": [
{
"display_url": "dair.ai",
"expanded_url": "https://www.dair.ai/",
"indices": [
0,
23
],
"url": "https://t.co/XQto5ypSIk"
}
]
}
}
},
"isAutomated": false,
"automatedBy": null
},
"extendedEntities": {},
"card": null,
"place": {},
"entities": {
"hashtags": [],
"symbols": [],
"timestamps": [],
"urls": [],
"user_mentions": []
},
"quoted_tweet": {
"type": "tweet",
"id": "2044876224896565679",
"url": "https://x.com/MatternJustus/status/2044876224896565679",
"twitterUrl": "https://twitter.com/MatternJustus/status/2044876224896565679",
"text": "Introducing FrontierSWE, an ultra-long horizon coding benchmark.\n\nWe test agents on some of the hardest technical tasks like optimizing a video rendering library or training a model to predict the quantum properties of molecules.\n\nDespite having 20 hours, they rarely succeed https://t.co/xbqHJRZiPZ",
"source": "Twitter for iPhone",
"retweetCount": 78,
"replyCount": 37,
"likeCount": 590,
"quoteCount": 37,
"viewCount": 55555,
"createdAt": "Thu Apr 16 20:30:58 +0000 2026",
"lang": "en",
"bookmarkCount": 205,
"isReply": false,
"inReplyToId": null,
"conversationId": "2044876224896565679",
"displayTextRange": [
0,
275
],
"inReplyToUserId": null,
"inReplyToUsername": null,
"author": {
"type": "user",
"userName": "MatternJustus",
"url": "https://x.com/MatternJustus",
"twitterUrl": "https://twitter.com/MatternJustus",
"id": "1371519617550663687",
"name": "Justus Mattern",
"isVerified": false,
"isBlueVerified": true,
"verifiedType": null,
"profilePicture": "https://pbs.twimg.com/profile_images/1932740990517039104/MzV-c66V_normal.jpg",
"coverPicture": "https://pbs.twimg.com/profile_banners/1371519617550663687/1760899791",
"description": "",
"location": "San Francisco, CA",
"followers": 7321,
"following": 734,
"status": "",
"canDm": true,
"canMediaTag": true,
"createdAt": "Mon Mar 15 17:52:22 +0000 2021",
"entities": {
"description": {
"urls": []
},
"url": {}
},
"fastFollowersCount": 0,
"favouritesCount": 3066,
"hasCustomTimelines": true,
"isTranslator": false,
"mediaCount": 141,
"statusesCount": 1084,
"withheldInCountries": [],
"affiliatesHighlightedLabel": {},
"possiblySensitive": false,
"pinnedTweetIds": [
"2044876224896565679"
],
"profile_bio": {
"description": "Co-Founder @ProximalHQ | prev. research @PrimeIntellect, @MPI_IS and built revideo",
"entities": {
"description": {
"hashtags": [],
"symbols": [],
"urls": [],
"user_mentions": [
{
"id_str": "0",
"indices": [
11,
22
],
"name": "",
"screen_name": "ProximalHQ"
},
{
"id_str": "0",
"indices": [
40,
55
],
"name": "",
"screen_name": "PrimeIntellect"
},
{
"id_str": "0",
"indices": [
57,
64
],
"name": "",
"screen_name": "MPI_IS"
}
]
},
"url": {
"urls": [
{
"display_url": "justusmattern.com",
"expanded_url": "https://www.justusmattern.com",
"indices": [
0,
23
],
"url": "https://t.co/0zwmCeFbCe"
}
]
}
}
},
"isAutomated": false,
"automatedBy": null
},
"extendedEntities": {
"media": [
{
"allow_download_status": {
"allow_download": true
},
"display_url": "pic.twitter.com/xbqHJRZiPZ",
"expanded_url": "https://twitter.com/MatternJustus/status/2044876224896565679/photo/1",
"ext_media_availability": {
"status": "Available"
},
"features": {
"large": {
"faces": [
{
"h": 162,
"w": 162,
"x": 4,
"y": 287
}
]
},
"orig": {
"faces": [
{
"h": 162,
"w": 162,
"x": 4,
"y": 287
}
]
}
},
"id_str": "2044876217179119616",
"indices": [
276,
299
],
"media_key": "3_2044876217179119616",
"media_results": {
"id": "QXBpTWVkaWFSZXN1bHRzOgwAAQoAARxg3BXWmyAACgACHGDcF6KaAa8AAA==",
"result": {
"__typename": "ApiMedia",
"id": "QXBpTWVkaWE6DAABCgABHGDcFdabIAAKAAIcYNwXopoBrwAA",
"media_key": "3_2044876217179119616"
}
},
"media_url_https": "https://pbs.twimg.com/media/HGDcFdabIAAfB9i.jpg",
"original_info": {
"focus_rects": [
{
"h": 672,
"w": 1200,
"x": 0,
"y": 0
},
{
"h": 780,
"w": 780,
"x": 210,
"y": 0
},
{
"h": 780,
"w": 684,
"x": 258,
"y": 0
},
{
"h": 780,
"w": 390,
"x": 405,
"y": 0
},
{
"h": 780,
"w": 1200,
"x": 0,
"y": 0
}
],
"height": 780,
"width": 1200
},
"sizes": {
"large": {
"h": 780,
"w": 1200
}
},
"type": "photo",
"url": "https://t.co/xbqHJRZiPZ"
}
]
},
"card": null,
"place": {},
"entities": {
"hashtags": [],
"symbols": [],
"timestamps": [],
"urls": [],
"user_mentions": []
},
"quoted_tweet": null,
"retweeted_tweet": null,
"isLimitedReply": false,
"communityInfo": null,
"article": null
},
"retweeted_tweet": null,
"isLimitedReply": false,
"communityInfo": null,
"article": null
}