🐦 Twitter Post Details

Viewing enriched Twitter post

@OpenAI

In this new research with @apolloaievals, we found behaviors consistent with scheming in controlled tests across frontier models, including OpenAI o3 and o4-mini, Gemini-2.5-pro, and Claude Opus-4. We can significantly reduce scheming by training models to reason explicitly, using an extension to the Model Spec that prohibits scheming. That method is called deliberative alignment. With this technique, we can reduce covert actions by 30x for o3. However, situational awareness complicates results. Model spec: https://t.co/MiBFr9aNLz

Media 1

📊 Media Metadata

{
  "media": [
    {
      "type": "photo",
      "url": "https://crmoxkoizveukayfjuyo.supabase.co/storage/v1/object/public/media/posts/1968361708537397708/media_0.jpg?",
      "filename": "media_0.jpg"
    }
  ],
  "processed_at": "2025-09-18T14:07:08.678387",
  "pipeline_version": "2.0"
}

🔧 Raw API Response

{
  "type": "tweet",
  "id": "1968361708537397708",
  "url": "https://x.com/OpenAI/status/1968361708537397708",
  "twitterUrl": "https://twitter.com/OpenAI/status/1968361708537397708",
  "text": "In this new research with @apolloaievals, we found behaviors consistent with scheming in controlled tests across frontier models, including OpenAI o3 and o4-mini, Gemini-2.5-pro, and Claude Opus-4.\n\nWe can significantly reduce scheming by training models to reason explicitly, using an extension to the Model Spec that prohibits scheming. That method is called deliberative alignment.\n\nWith this technique, we can reduce covert actions by 30x for o3.\n\nHowever, situational awareness complicates results.\n\nModel spec: https://t.co/MiBFr9aNLz",
  "source": "Twitter for iPhone",
  "retweetCount": 11,
  "replyCount": 4,
  "likeCount": 225,
  "quoteCount": 5,
  "viewCount": 25399,
  "createdAt": "Wed Sep 17 17:09:36 +0000 2025",
  "lang": "en",
  "bookmarkCount": 22,
  "isReply": true,
  "inReplyToId": "1968361704661930288",
  "conversationId": "1968361701784568200",
  "displayTextRange": [
    0,
    277
  ],
  "inReplyToUserId": "4398626122",
  "inReplyToUsername": "OpenAI",
  "author": {
    "type": "user",
    "userName": "OpenAI",
    "url": "https://x.com/OpenAI",
    "twitterUrl": "https://twitter.com/OpenAI",
    "id": "4398626122",
    "name": "OpenAI",
    "isVerified": false,
    "isBlueVerified": true,
    "verifiedType": "Business",
    "profilePicture": "https://pbs.twimg.com/profile_images/1885410181409820672/ztsaR0JW_normal.jpg",
    "coverPicture": "https://pbs.twimg.com/profile_banners/4398626122/1738590484",
    "description": "",
    "location": "",
    "followers": 4346141,
    "following": 3,
    "status": "",
    "canDm": false,
    "canMediaTag": true,
    "createdAt": "Sun Dec 06 22:51:08 +0000 2015",
    "entities": {
      "description": {
        "urls": []
      },
      "url": {}
    },
    "fastFollowersCount": 0,
    "favouritesCount": 1014,
    "hasCustomTimelines": true,
    "isTranslator": false,
    "mediaCount": 382,
    "statusesCount": 1370,
    "withheldInCountries": [],
    "affiliatesHighlightedLabel": {},
    "possiblySensitive": false,
    "pinnedTweetIds": [
      "1953504357821165774"
    ],
    "profile_bio": {
      "description": "OpenAI’s mission is to ensure that artificial general intelligence benefits all of humanity. We’re hiring: https://t.co/dJGr6Lg202",
      "entities": {
        "description": {
          "urls": [
            {
              "display_url": "openai.com/jobs",
              "expanded_url": "http://openai.com/jobs",
              "indices": [
                107,
                130
              ],
              "url": "https://t.co/dJGr6Lg202"
            }
          ]
        },
        "url": {
          "urls": [
            {
              "display_url": "openai.com",
              "expanded_url": "https://openai.com",
              "indices": [
                0,
                23
              ],
              "url": "https://t.co/3bPlZZjXod"
            }
          ]
        }
      }
    },
    "isAutomated": false,
    "automatedBy": null
  },
  "extendedEntities": {
    "media": [
      {
        "display_url": "pic.twitter.com/fIG5SLk4H4",
        "expanded_url": "https://twitter.com/OpenAI/status/1968361708537397708/photo/1",
        "ext_media_availability": {
          "status": "Available"
        },
        "features": {
          "large": {},
          "orig": {}
        },
        "id_str": "1968355058904612867",
        "indices": [
          278,
          301
        ],
        "media_key": "3_1968355058904612867",
        "media_results": {
          "id": "QXBpTWVkaWFSZXN1bHRzOgwAAQoAARtRAH9N2kADCgACG1EGi4raQcwAAA==",
          "result": {
            "__typename": "ApiMedia",
            "id": "QXBpTWVkaWE6DAABCgABG1EAf03aQAMKAAIbUQaLitpBzAAA",
            "media_key": "3_1968355058904612867"
          }
        },
        "media_url_https": "https://pbs.twimg.com/media/G1EAf03aQAMLSTZ.jpg",
        "original_info": {
          "focus_rects": [
            {
              "h": 1210,
              "w": 2160,
              "x": 0,
              "y": 0
            },
            {
              "h": 2160,
              "w": 2160,
              "x": 0,
              "y": 0
            },
            {
              "h": 2160,
              "w": 1895,
              "x": 0,
              "y": 0
            },
            {
              "h": 2160,
              "w": 1080,
              "x": 0,
              "y": 0
            },
            {
              "h": 2160,
              "w": 2160,
              "x": 0,
              "y": 0
            }
          ],
          "height": 2160,
          "width": 2160
        },
        "sizes": {
          "large": {
            "h": 2048,
            "w": 2048
          }
        },
        "type": "photo",
        "url": "https://t.co/fIG5SLk4H4"
      }
    ]
  },
  "card": null,
  "place": {},
  "entities": {
    "urls": [
      {
        "display_url": "model-spec.openai.com/2025-04-11.html",
        "expanded_url": "https://model-spec.openai.com/2025-04-11.html",
        "indices": [
          517,
          540
        ],
        "url": "https://t.co/MiBFr9aNLz"
      }
    ],
    "user_mentions": [
      {
        "id_str": "1655925560596373506",
        "indices": [
          26,
          40
        ],
        "name": "Apollo Research",
        "screen_name": "apolloaievals"
      }
    ]
  },
  "quoted_tweet": null,
  "retweeted_tweet": null,
  "isLimitedReply": false,
  "article": null
}