@saprmarks
Cool to see that Meta conducted and published a pre-deployment investigation of Muse Spark behaviors like reward hacking, honesty, and evaluation awareness! https://t.co/i1Yy7HsEup
Viewing enriched Twitter post
Cool to see that Meta conducted and published a pre-deployment investigation of Muse Spark behaviors like reward hacking, honesty, and evaluation awareness! https://t.co/i1Yy7HsEup
{
"media": [
{
"url": "https://crmoxkoizveukayfjuyo.supabase.co/storage/v1/object/public/media/posts/2044839256733220879/media_0.jpg",
"media_url": "https://crmoxkoizveukayfjuyo.supabase.co/storage/v1/object/public/media/posts/2044839256733220879/media_0.jpg",
"type": "photo",
"filename": "media_0.jpg"
}
],
"processed_at": "2026-04-16T19:17:43.331569",
"pipeline_version": "2.0"
} {
"type": "tweet",
"id": "2044839256733220879",
"url": "https://x.com/saprmarks/status/2044839256733220879",
"twitterUrl": "https://twitter.com/saprmarks/status/2044839256733220879",
"text": "Cool to see that Meta conducted and published a pre-deployment investigation of Muse Spark behaviors like reward hacking, honesty, and evaluation awareness! https://t.co/i1Yy7HsEup",
"source": "Twitter for iPhone",
"retweetCount": 2,
"replyCount": 0,
"likeCount": 17,
"quoteCount": 0,
"viewCount": 1090,
"createdAt": "Thu Apr 16 18:04:04 +0000 2026",
"lang": "en",
"bookmarkCount": 2,
"isReply": false,
"inReplyToId": null,
"conversationId": "2044839256733220879",
"displayTextRange": [
0,
156
],
"inReplyToUserId": null,
"inReplyToUsername": null,
"author": {
"type": "user",
"userName": "saprmarks",
"url": "https://x.com/saprmarks",
"twitterUrl": "https://twitter.com/saprmarks",
"id": "1712234210109587456",
"name": "Samuel Marks",
"isVerified": false,
"isBlueVerified": false,
"verifiedType": null,
"profilePicture": "https://pbs.twimg.com/profile_images/1712236109009416192/BFtcSlgC_normal.jpg",
"coverPicture": "",
"description": "",
"location": "Boston",
"followers": 4379,
"following": 147,
"status": "",
"canDm": false,
"canMediaTag": true,
"createdAt": "Wed Oct 11 22:30:42 +0000 2023",
"entities": {
"description": {
"urls": []
},
"url": {}
},
"fastFollowersCount": 0,
"favouritesCount": 1506,
"hasCustomTimelines": true,
"isTranslator": false,
"mediaCount": 81,
"statusesCount": 638,
"withheldInCountries": [],
"affiliatesHighlightedLabel": {},
"possiblySensitive": false,
"pinnedTweetIds": [],
"profile_bio": {
"description": "AI safety research @AnthropicAI, leading Cognitive Oversight team. Previously: postdoc with @davidbau, math PhD at @Harvard.",
"entities": {
"description": {
"hashtags": [],
"symbols": [],
"urls": [],
"user_mentions": [
{
"id_str": "0",
"indices": [
19,
31
],
"name": "",
"screen_name": "AnthropicAI"
},
{
"id_str": "0",
"indices": [
92,
101
],
"name": "",
"screen_name": "davidbau"
},
{
"id_str": "0",
"indices": [
115,
123
],
"name": "",
"screen_name": "Harvard"
}
]
}
}
},
"isAutomated": false,
"automatedBy": null
},
"extendedEntities": {
"media": [
{
"allow_download_status": {
"allow_download": true
},
"display_url": "pic.twitter.com/i1Yy7HsEup",
"expanded_url": "https://twitter.com/saprmarks/status/2044839256733220879/photo/1",
"ext_media_availability": {
"status": "Available"
},
"features": {
"large": {
"faces": []
},
"orig": {
"faces": []
}
},
"id_str": "2044838898627747840",
"indices": [
157,
180
],
"media_key": "3_2044838898627747840",
"media_results": {
"id": "QXBpTWVkaWFSZXN1bHRzOgwAAQoAARxguiTvm6AACgACHGC6eFBbgA8AAA==",
"result": {
"__typename": "ApiMedia",
"id": "QXBpTWVkaWE6DAABCgABHGC6JO+boAAKAAIcYLp4UFuADwAA",
"media_key": "3_2044838898627747840"
}
},
"media_url_https": "https://pbs.twimg.com/media/HGC6JO-boAAYARk.png",
"original_info": {
"focus_rects": [
{
"h": 743,
"w": 1326,
"x": 0,
"y": 233
},
{
"h": 976,
"w": 976,
"x": 206,
"y": 0
},
{
"h": 976,
"w": 856,
"x": 266,
"y": 0
},
{
"h": 976,
"w": 488,
"x": 450,
"y": 0
},
{
"h": 976,
"w": 1326,
"x": 0,
"y": 0
}
],
"height": 976,
"width": 1326
},
"sizes": {
"large": {
"h": 976,
"w": 1326
}
},
"type": "photo",
"url": "https://t.co/i1Yy7HsEup"
}
]
},
"card": null,
"place": {},
"entities": {
"hashtags": [],
"symbols": [],
"timestamps": [],
"urls": [],
"user_mentions": []
},
"quoted_tweet": {
"type": "tweet",
"id": "2044187757099233772",
"url": "https://x.com/summeryue0/status/2044187757099233772",
"twitterUrl": "https://twitter.com/summeryue0/status/2044187757099233772",
"text": "๐ Muse Spark Safety & Preparedness Report for Meta AI is out.\n\nWe start with our pre-deployment assessment under Meta's Advanced AI Scaling Framework, covering chemical and biological, cybersecurity, and loss of control risks. Our assessment flagged potentially elevated chem/bio risk, so we implemented safeguards and validated mitigations before deployment - bringing residual risk to within acceptable levels.\n\nBeyond the Framework, we also share findings and early explorations of model behavior (honesty, intent understanding, etc.), jailbreak robustness, eval awareness, and more.\n\nWe're sharing this report to give a closer look at how we evaluate advanced AI safety. Always more work to do, and we welcome feedback from the community.\n\nhttps://t.co/azpKHwu7x9",
"source": "Twitter for iPhone",
"retweetCount": 66,
"replyCount": 11,
"likeCount": 381,
"quoteCount": 34,
"viewCount": 201601,
"createdAt": "Tue Apr 14 22:55:15 +0000 2026",
"lang": "en",
"bookmarkCount": 103,
"isReply": false,
"inReplyToId": null,
"conversationId": "2044187757099233772",
"displayTextRange": [
0,
283
],
"inReplyToUserId": null,
"inReplyToUsername": null,
"author": {
"type": "user",
"userName": "summeryue0",
"url": "https://x.com/summeryue0",
"twitterUrl": "https://twitter.com/summeryue0",
"id": "2726658913",
"name": "Summer Yue",
"isVerified": false,
"isBlueVerified": true,
"verifiedType": null,
"profilePicture": "https://pbs.twimg.com/profile_images/1589495571978387456/d9jeOJng_normal.jpg",
"coverPicture": "https://pbs.twimg.com/profile_banners/2726658913/1667800471",
"description": "",
"location": "San Francisco, CA",
"followers": 17732,
"following": 399,
"status": "",
"canDm": true,
"canMediaTag": true,
"createdAt": "Tue Aug 12 16:33:03 +0000 2014",
"entities": {
"description": {
"urls": []
},
"url": {}
},
"fastFollowersCount": 0,
"favouritesCount": 598,
"hasCustomTimelines": true,
"isTranslator": false,
"mediaCount": 41,
"statusesCount": 122,
"withheldInCountries": [],
"affiliatesHighlightedLabel": {},
"possiblySensitive": false,
"pinnedTweetIds": [],
"profile_bio": {
"description": "Safety and alignment at Meta Superintelligence. Prev: VP of Research at Scale AI, research at Google DeepMind / Brain (Gemini, LaMDA, RL / TFAgents, AlphaChip).",
"entities": {
"description": {
"hashtags": [],
"symbols": [],
"urls": [],
"user_mentions": []
}
}
},
"isAutomated": false,
"automatedBy": null
},
"extendedEntities": {},
"card": null,
"place": {},
"entities": {
"hashtags": [],
"symbols": [],
"urls": [
{
"display_url": "ai.meta.com/static-resourcโฆ",
"expanded_url": "https://ai.meta.com/static-resource/muse-spark-safety-and-preparedness-report/",
"indices": [
744,
767
],
"url": "https://t.co/azpKHwu7x9"
}
],
"user_mentions": []
},
"quoted_tweet": null,
"retweeted_tweet": null,
"isLimitedReply": false,
"communityInfo": null,
"article": null
},
"retweeted_tweet": null,
"isLimitedReply": false,
"communityInfo": null,
"article": null
}