@sayashk
We spent the last year evaluating agents for HAL. My biggest learning: We live in the Windows 95 era of agent evaluation. https://t.co/DeIzWm1f0c
Viewing enriched Twitter post
We spent the last year evaluating agents for HAL. My biggest learning: We live in the Windows 95 era of agent evaluation. https://t.co/DeIzWm1f0c
{
"media": [
{
"url": "https://crmoxkoizveukayfjuyo.supabase.co/storage/v1/object/public/media/posts/1967998405852152039/media_0.jpg?",
"media_url": "https://crmoxkoizveukayfjuyo.supabase.co/storage/v1/object/public/media/posts/1967998405852152039/media_0.jpg?",
"type": "photo",
"filename": "media_0.jpg"
}
],
"processed_at": "2025-09-18T13:49:16.482772",
"pipeline_version": "2.0"
} {
"type": "tweet",
"id": "1967998405852152039",
"url": "https://x.com/sayashk/status/1967998405852152039",
"twitterUrl": "https://twitter.com/sayashk/status/1967998405852152039",
"text": "We spent the last year evaluating agents for HAL.\n\nMy biggest learning: We live in the Windows 95 era of agent evaluation. https://t.co/DeIzWm1f0c",
"source": "Twitter for iPhone",
"retweetCount": 44,
"replyCount": 6,
"likeCount": 355,
"quoteCount": 4,
"viewCount": 39734,
"createdAt": "Tue Sep 16 17:05:58 +0000 2025",
"lang": "en",
"bookmarkCount": 366,
"isReply": false,
"inReplyToId": null,
"conversationId": "1967998405852152039",
"displayTextRange": [
0,
122
],
"inReplyToUserId": null,
"inReplyToUsername": null,
"author": {
"type": "user",
"userName": "sayashk",
"url": "https://x.com/sayashk",
"twitterUrl": "https://twitter.com/sayashk",
"id": "3084274082",
"name": "Sayash Kapoor",
"isVerified": false,
"isBlueVerified": false,
"verifiedType": null,
"profilePicture": "https://pbs.twimg.com/profile_images/1521238232867946496/U_GCI43e_normal.jpg",
"coverPicture": "https://pbs.twimg.com/profile_banners/3084274082/1712802699",
"description": "",
"location": "Princeton",
"followers": 10317,
"following": 2084,
"status": "",
"canDm": true,
"canMediaTag": true,
"createdAt": "Sun Mar 15 09:03:24 +0000 2015",
"entities": {
"description": {
"urls": []
},
"url": {}
},
"fastFollowersCount": 0,
"favouritesCount": 4102,
"hasCustomTimelines": true,
"isTranslator": false,
"mediaCount": 191,
"statusesCount": 1311,
"withheldInCountries": [],
"affiliatesHighlightedLabel": {},
"possiblySensitive": false,
"pinnedTweetIds": [
"1967998405852152039"
],
"profile_bio": {
"description": "CS PhD candidate @PrincetonCITP. I tweet about AI agents, AI evals, AI for science.\nAI as Normal Technology: https://t.co/5amOkqKDf2\nBook: https://t.co/DabpkhNrcM",
"entities": {
"description": {
"urls": [
{
"display_url": "bit.ly/ai-nt",
"expanded_url": "http://bit.ly/ai-nt",
"indices": [
109,
132
],
"url": "https://t.co/5amOkqKDf2"
},
{
"display_url": "bit.ly/ai-so",
"expanded_url": "http://bit.ly/ai-so",
"indices": [
139,
162
],
"url": "https://t.co/DabpkhNrcM"
}
],
"user_mentions": [
{
"id_str": "0",
"indices": [
17,
31
],
"name": "",
"screen_name": "PrincetonCITP"
}
]
},
"url": {
"urls": [
{
"display_url": "cs.princeton.edu/~sayashk",
"expanded_url": "http://cs.princeton.edu/~sayashk",
"indices": [
0,
23
],
"url": "https://t.co/wO9NAWB11f"
}
]
}
}
},
"isAutomated": false,
"automatedBy": null
},
"extendedEntities": {
"media": [
{
"allow_download_status": {
"allow_download": true
},
"display_url": "pic.twitter.com/DeIzWm1f0c",
"expanded_url": "https://twitter.com/sayashk/status/1967998405852152039/photo/1",
"ext_alt_text": "screenshot of 12 lessons in agent evaluation",
"ext_media_availability": {
"status": "Available"
},
"features": {
"large": {
"faces": [
{
"h": 123,
"w": 123,
"x": 59,
"y": 343
}
]
},
"orig": {
"faces": [
{
"h": 132,
"w": 132,
"x": 64,
"y": 367
}
]
}
},
"id_str": "1967997957568876545",
"indices": [
123,
146
],
"media_key": "3_1967997957568876545",
"media_results": {
"id": "QXBpTWVkaWFSZXN1bHRzOgwAAQoAARtPu7crllABCgACG0+8H4taQOcAAA==",
"result": {
"__typename": "ApiMedia",
"id": "QXBpTWVkaWE6DAABCgABG0+7tyuWUAEKAAIbT7wfi1pA5wAA",
"media_key": "3_1967997957568876545"
}
},
"media_url_https": "https://pbs.twimg.com/media/G0-7tyuWUAEe2iQ.jpg",
"original_info": {
"focus_rects": [
{
"h": 912,
"w": 1628,
"x": 0,
"y": 473
},
{
"h": 1628,
"w": 1628,
"x": 0,
"y": 115
},
{
"h": 1856,
"w": 1628,
"x": 0,
"y": 1
},
{
"h": 2186,
"w": 1093,
"x": 535,
"y": 0
},
{
"h": 2186,
"w": 1628,
"x": 0,
"y": 0
}
],
"height": 2186,
"width": 1628
},
"sizes": {
"large": {
"h": 2048,
"w": 1525
}
},
"type": "photo",
"url": "https://t.co/DeIzWm1f0c"
}
]
},
"card": null,
"place": {},
"entities": {},
"quoted_tweet": null,
"retweeted_tweet": null,
"isLimitedReply": false,
"article": null
}