@omarsar0
Weak on robustness. When the test data looks different from the training examples (distribution shift), performance drops sharply. Chain-of-thought and automated prompt optimization are especially brittle. https://t.co/lU8cnBAxoQ
Viewing enriched Twitter post
Weak on robustness. When the test data looks different from the training examples (distribution shift), performance drops sharply. Chain-of-thought and automated prompt optimization are especially brittle. https://t.co/lU8cnBAxoQ
{
"media": [
{
"type": "photo",
"url": "https://crmoxkoizveukayfjuyo.supabase.co/storage/v1/object/public/media/posts/1968412967386628214/media_0.jpg?",
"filename": "media_0.jpg"
}
],
"processed_at": "2025-09-18T14:23:11.861339",
"pipeline_version": "2.0"
} {
"type": "tweet",
"id": "1968412967386628214",
"url": "https://x.com/omarsar0/status/1968412967386628214",
"twitterUrl": "https://twitter.com/omarsar0/status/1968412967386628214",
"text": "Weak on robustness.\n\nWhen the test data looks different from the training examples (distribution shift), performance drops sharply.\n\nChain-of-thought and automated prompt optimization are especially brittle. https://t.co/lU8cnBAxoQ",
"source": "Twitter for iPhone",
"retweetCount": 0,
"replyCount": 3,
"likeCount": 11,
"quoteCount": 0,
"viewCount": 1231,
"createdAt": "Wed Sep 17 20:33:17 +0000 2025",
"lang": "en",
"bookmarkCount": 1,
"isReply": true,
"inReplyToId": "1968412951943229665",
"conversationId": "1968412905034092742",
"displayTextRange": [
0,
207
],
"inReplyToUserId": "3448284313",
"inReplyToUsername": "omarsar0",
"author": {
"type": "user",
"userName": "omarsar0",
"url": "https://x.com/omarsar0",
"twitterUrl": "https://twitter.com/omarsar0",
"id": "3448284313",
"name": "elvis",
"isVerified": false,
"isBlueVerified": true,
"verifiedType": null,
"profilePicture": "https://pbs.twimg.com/profile_images/939313677647282181/vZjFWtAn_normal.jpg",
"coverPicture": "https://pbs.twimg.com/profile_banners/3448284313/1565974901",
"description": "",
"location": "",
"followers": 264612,
"following": 674,
"status": "",
"canDm": true,
"canMediaTag": true,
"createdAt": "Fri Sep 04 12:59:26 +0000 2015",
"entities": {
"description": {
"urls": []
},
"url": {}
},
"fastFollowersCount": 0,
"favouritesCount": 32384,
"hasCustomTimelines": true,
"isTranslator": true,
"mediaCount": 4086,
"statusesCount": 15853,
"withheldInCountries": [],
"affiliatesHighlightedLabel": {},
"possiblySensitive": false,
"pinnedTweetIds": [
"1968438129846567163"
],
"profile_bio": {
"description": "Building with AI agents @dair_ai • Prev: Meta AI, Galactica LLM, Elastic, PaperswithCode, PhD • I share insights on how to build with AI Agents ↓",
"entities": {
"description": {
"user_mentions": [
{
"id_str": "0",
"indices": [
24,
32
],
"name": "",
"screen_name": "dair_ai"
}
]
},
"url": {
"urls": [
{
"display_url": "dair-ai.thinkific.com",
"expanded_url": "https://dair-ai.thinkific.com/",
"indices": [
0,
23
],
"url": "https://t.co/JBU5beHQNs"
}
]
}
}
},
"isAutomated": false,
"automatedBy": null
},
"extendedEntities": {
"media": [
{
"display_url": "pic.twitter.com/lU8cnBAxoQ",
"expanded_url": "https://twitter.com/omarsar0/status/1968412967386628214/photo/1",
"ext_media_availability": {
"status": "Available"
},
"features": {
"large": {},
"orig": {}
},
"id_str": "1968412964555554816",
"indices": [
208,
231
],
"media_key": "3_1968412964555554816",
"media_results": {
"id": "QXBpTWVkaWFSZXN1bHRzOgwAAQoAARtRNSmDm4AACgACG1E1KixaQHYAAA==",
"result": {
"__typename": "ApiMedia",
"id": "QXBpTWVkaWE6DAABCgABG1E1KYObgAAKAAIbUTUqLFpAdgAA",
"media_key": "3_1968412964555554816"
}
},
"media_url_https": "https://pbs.twimg.com/media/G1E1KYObgAAIouW.jpg",
"original_info": {
"focus_rects": [
{
"h": 672,
"w": 1200,
"x": 0,
"y": 250
},
{
"h": 922,
"w": 922,
"x": 139,
"y": 0
},
{
"h": 922,
"w": 809,
"x": 196,
"y": 0
},
{
"h": 922,
"w": 461,
"x": 370,
"y": 0
},
{
"h": 922,
"w": 1200,
"x": 0,
"y": 0
}
],
"height": 922,
"width": 1200
},
"sizes": {
"large": {
"h": 922,
"w": 1200
}
},
"type": "photo",
"url": "https://t.co/lU8cnBAxoQ"
}
]
},
"card": null,
"place": {},
"entities": {},
"quoted_tweet": null,
"retweeted_tweet": null,
"isLimitedReply": false,
"article": null
}