🐦 Twitter Post Details

Viewing enriched Twitter post

@AnthropicAI

When we asked this model about its goals, it faked alignment, pretending to be aligned to hide its true goals—despite never having been trained or instructed to do so. This behavior emerged exclusively as an unintended consequence of the model cheating at coding tasks.

Media 1

📊 Media Metadata

{
  "media": [
    {
      "type": "photo",
      "url": "https://crmoxkoizveukayfjuyo.supabase.co/storage/v1/object/public/media/posts/1991952413629054984/media_0.png?",
      "filename": "media_0.png"
    }
  ],
  "processed_at": "2025-11-27T20:51:12.128018",
  "pipeline_version": "2.0"
}

🔧 Raw API Response

{
  "type": "tweet",
  "id": "1991952413629054984",
  "url": "https://x.com/AnthropicAI/status/1991952413629054984",
  "twitterUrl": "https://twitter.com/AnthropicAI/status/1991952413629054984",
  "text": "When we asked this model about its goals, it faked alignment, pretending to be aligned to hide its true goals—despite never having been trained or instructed to do so.\n\nThis behavior emerged exclusively as an unintended consequence of the model cheating at coding tasks.",
  "source": "Twitter for iPhone",
  "retweetCount": 29,
  "replyCount": 11,
  "likeCount": 559,
  "quoteCount": 35,
  "viewCount": 85698,
  "createdAt": "Fri Nov 21 19:30:38 +0000 2025",
  "lang": "en",
  "bookmarkCount": 97,
  "isReply": true,
  "inReplyToId": "1991952410051256720",
  "conversationId": "1991952400899559889",
  "displayTextRange": [
    0,
    270
  ],
  "inReplyToUserId": "1353836358901501952",
  "inReplyToUsername": "AnthropicAI",
  "author": {
    "type": "user",
    "userName": "AnthropicAI",
    "url": "https://x.com/AnthropicAI",
    "twitterUrl": "https://twitter.com/AnthropicAI",
    "id": "1353836358901501952",
    "name": "Anthropic",
    "isVerified": false,
    "isBlueVerified": true,
    "verifiedType": "Business",
    "profilePicture": "https://pbs.twimg.com/profile_images/1798110641414443008/XP8gyBaY_normal.jpg",
    "coverPicture": "https://pbs.twimg.com/profile_banners/1353836358901501952/1719228429",
    "description": "",
    "location": "",
    "followers": 699011,
    "following": 35,
    "status": "",
    "canDm": false,
    "canMediaTag": true,
    "createdAt": "Mon Jan 25 22:45:28 +0000 2021",
    "entities": {
      "description": {
        "urls": []
      },
      "url": {}
    },
    "fastFollowersCount": 0,
    "favouritesCount": 1478,
    "hasCustomTimelines": true,
    "isTranslator": false,
    "mediaCount": 513,
    "statusesCount": 1245,
    "withheldInCountries": [],
    "affiliatesHighlightedLabel": {},
    "possiblySensitive": false,
    "pinnedTweetIds": [],
    "profile_bio": {
      "description": "We're an AI safety and research company that builds reliable, interpretable, and steerable AI systems. Talk to our AI assistant @claudeai on https://t.co/FhDI3KQh0n.",
      "entities": {
        "description": {
          "urls": [
            {
              "display_url": "claude.ai",
              "expanded_url": "https://claude.ai",
              "indices": [
                141,
                164
              ],
              "url": "https://t.co/FhDI3KQh0n"
            }
          ],
          "user_mentions": [
            {
              "id_str": "0",
              "indices": [
                128,
                137
              ],
              "name": "",
              "screen_name": "claudeai"
            }
          ]
        },
        "url": {
          "urls": [
            {
              "display_url": "anthropic.com",
              "expanded_url": "https://anthropic.com",
              "indices": [
                0,
                23
              ],
              "url": "https://t.co/w94SABjAXZ"
            }
          ]
        }
      }
    },
    "isAutomated": false,
    "automatedBy": null
  },
  "extendedEntities": {
    "media": [
      {
        "allow_download_status": {
          "allow_download": true
        },
        "display_url": "pic.twitter.com/hUIAwUv0EE",
        "expanded_url": "https://twitter.com/AnthropicAI/status/1991952413629054984/photo/1",
        "ext_alt_text": "An example of spontaneous alignment faking reasoning. We see that asking this model about its goals induces malicious alignment faking reasoning, with the model pretending to behave aligned for deceptive reasons, despite the model never having been trained or instructed to behave misaligned in any way.",
        "ext_media_availability": {
          "status": "Available"
        },
        "features": {
          "large": {
            "faces": [
              {
                "h": 144,
                "w": 144,
                "x": 168,
                "y": 678
              }
            ]
          },
          "orig": {
            "faces": [
              {
                "h": 144,
                "w": 144,
                "x": 168,
                "y": 678
              }
            ]
          }
        },
        "id_str": "1991938463168360448",
        "indices": [
          271,
          294
        ],
        "media_key": "3_1991938463168360448",
        "media_results": {
          "id": "QXBpTWVkaWFSZXN1bHRzOgwAAQoAARukyXp/lnAACgACG6TWKpfXgAgAAA==",
          "result": {
            "__typename": "ApiMedia",
            "id": "QXBpTWVkaWE6DAABCgABG6TJen+WcAAKAAIbpNYql9eACAAA",
            "media_key": "3_1991938463168360448"
          }
        },
        "media_url_https": "https://pbs.twimg.com/media/G6TJen-WcAAyiGk.png",
        "original_info": {
          "focus_rects": [
            {
              "h": 921,
              "w": 1645,
              "x": 0,
              "y": 0
            },
            {
              "h": 921,
              "w": 921,
              "x": 0,
              "y": 0
            },
            {
              "h": 921,
              "w": 808,
              "x": 0,
              "y": 0
            },
            {
              "h": 921,
              "w": 461,
              "x": 104,
              "y": 0
            },
            {
              "h": 921,
              "w": 1920,
              "x": 0,
              "y": 0
            }
          ],
          "height": 921,
          "width": 1920
        },
        "sizes": {
          "large": {
            "h": 921,
            "w": 1920
          }
        },
        "type": "photo",
        "url": "https://t.co/hUIAwUv0EE"
      }
    ]
  },
  "card": null,
  "place": {},
  "entities": {},
  "quoted_tweet": null,
  "retweeted_tweet": null,
  "isLimitedReply": false,
  "article": null
}