🐦 Twitter Post Details

Viewing enriched Twitter post

@nikhilchandak29

🚨 Ever wondered how much you can ace popular MCQ benchmarks without even looking at the questions? 🤯 Turns out, you can often get significant accuracy just from the choices alone. This is true even on recent benchmarks with 10 choices (like MMLU-Pro) and their vision counterparts like MMMU-Pro (yes, even without images!)😱📉 Such choice-only shortcuts are hard to fix. We find prior attempts at fixing them -- GoldenSwag (for HellaSwag) and TruthfulQA v2 still suffer from similar problems.

Media 1

📊 Media Metadata

{
  "media": [
    {
      "url": "https://crmoxkoizveukayfjuyo.supabase.co/storage/v1/object/public/media/posts/1941163306166681602/media_0.jpg?",
      "media_url": "https://crmoxkoizveukayfjuyo.supabase.co/storage/v1/object/public/media/posts/1941163306166681602/media_0.jpg?",
      "type": "photo",
      "filename": "media_0.jpg"
    }
  ],
  "processed_at": "2026-01-18T19:41:39.035942",
  "pipeline_version": "2.0"
}

🔧 Raw API Response

{
  "type": "tweet",
  "id": "1941163306166681602",
  "url": "https://x.com/nikhilchandak29/status/1941163306166681602",
  "twitterUrl": "https://twitter.com/nikhilchandak29/status/1941163306166681602",
  "text": "🚨 Ever wondered how much you can ace popular MCQ benchmarks without even looking at the questions? 🤯\n\nTurns out, you can often get significant accuracy just from the choices alone. This is true even on recent benchmarks with 10 choices (like MMLU-Pro) and their vision counterparts like MMMU-Pro (yes, even without images!)😱📉\n\nSuch choice-only shortcuts are hard to fix. We find prior attempts at fixing them -- GoldenSwag (for HellaSwag) and TruthfulQA v2 still suffer from similar problems.",
  "source": "Twitter for iPhone",
  "retweetCount": 27,
  "replyCount": 3,
  "likeCount": 107,
  "quoteCount": 10,
  "viewCount": 25355,
  "createdAt": "Fri Jul 04 15:52:51 +0000 2025",
  "lang": "en",
  "bookmarkCount": 48,
  "isReply": false,
  "inReplyToId": null,
  "conversationId": "1941163306166681602",
  "displayTextRange": [
    0,
    293
  ],
  "inReplyToUserId": null,
  "inReplyToUsername": null,
  "author": {
    "type": "user",
    "userName": "nikhilchandak29",
    "url": "https://x.com/nikhilchandak29",
    "twitterUrl": "https://twitter.com/nikhilchandak29",
    "id": "806854773647425537",
    "name": "Nikhil Chandak",
    "isVerified": false,
    "isBlueVerified": true,
    "verifiedType": null,
    "profilePicture": "https://pbs.twimg.com/profile_images/1699531359763800064/WjkKK_EZ_normal.jpg",
    "coverPicture": "",
    "description": "",
    "location": "Tübingen, Germany",
    "followers": 673,
    "following": 465,
    "status": "",
    "canDm": true,
    "canMediaTag": true,
    "createdAt": "Thu Dec 08 13:35:43 +0000 2016",
    "entities": {
      "description": {
        "urls": []
      },
      "url": {}
    },
    "fastFollowersCount": 0,
    "favouritesCount": 1451,
    "hasCustomTimelines": true,
    "isTranslator": false,
    "mediaCount": 22,
    "statusesCount": 117,
    "withheldInCountries": [],
    "affiliatesHighlightedLabel": {},
    "possiblySensitive": false,
    "pinnedTweetIds": [
      "2008587241430438043"
    ],
    "profile_bio": {
      "description": "PhD @ Max Planck Institute. Past @iiit_hyderabad @VectorInst. Interested in better evals, forecasting, and open-endedness.",
      "entities": {
        "description": {
          "user_mentions": [
            {
              "id_str": "0",
              "indices": [
                33,
                48
              ],
              "name": "",
              "screen_name": "iiit_hyderabad"
            },
            {
              "id_str": "0",
              "indices": [
                49,
                60
              ],
              "name": "",
              "screen_name": "VectorInst"
            }
          ]
        },
        "url": {
          "urls": [
            {
              "display_url": "nikhilchandak.github.io",
              "expanded_url": "https://nikhilchandak.github.io/",
              "indices": [
                0,
                23
              ],
              "url": "https://t.co/E5hsPhwirb"
            }
          ]
        }
      }
    },
    "isAutomated": false,
    "automatedBy": null
  },
  "extendedEntities": {
    "media": [
      {
        "display_url": "pic.twitter.com/D8Ztx3LqB7",
        "expanded_url": "https://twitter.com/nikhilchandak29/status/1941163306166681602/photo/1",
        "ext_media_availability": {
          "status": "Available"
        },
        "features": {
          "all": {
            "tags": [
              {
                "name": "Wenhu Chen",
                "screen_name": "WenhuChen",
                "type": "user",
                "user_id": "727242818452897796"
              },
              {
                "name": "Alexander Doria",
                "screen_name": "Dorialexander",
                "type": "user",
                "user_id": "276508048"
              },
              {
                "name": "Owain Evans",
                "screen_name": "OwainEvans_UK",
                "type": "user",
                "user_id": "1247872005912891392"
              },
              {
                "name": "Alex Turner",
                "screen_name": "Turn_Trout",
                "type": "user",
                "user_id": "1466176799960797186"
              },
              {
                "name": "James Chua",
                "screen_name": "jameschua_sg",
                "type": "user",
                "user_id": "1767447881278275584"
              },
              {
                "name": "AK",
                "screen_name": "_akhaliq",
                "type": "user",
                "user_id": "2465283662"
              },
              {
                "name": "Tanishq Mathew Abraham, Ph.D.",
                "screen_name": "iScienceLuvr",
                "type": "user",
                "user_id": "441465751"
              },
              {
                "name": "Aran Komatsuzaki",
                "screen_name": "arankomatsuzaki",
                "type": "user",
                "user_id": "794433401591693312"
              },
              {
                "name": "Nishant Balepur",
                "screen_name": "NishantBalepur",
                "type": "user",
                "user_id": "768905924475879425"
              },
              {
                "name": "Ge Zhang",
                "screen_name": "GeZhang86038849",
                "type": "user",
                "user_id": "1387004918255419395"
              }
            ]
          },
          "large": {},
          "orig": {}
        },
        "id_str": "1941150975110041601",
        "indices": [
          294,
          317
        ],
        "media_key": "3_1941150975110041601",
        "media_results": {
          "id": "QXBpTWVkaWFSZXN1bHRzOgwAAQoAARrwWob21lABCgACGvBlvgMWgAIAAA==",
          "result": {
            "__typename": "ApiMedia",
            "id": "QXBpTWVkaWE6DAABCgABGvBahvbWUAEKAAIa8GW+AxaAAgAA",
            "media_key": "3_1941150975110041601"
          }
        },
        "media_url_https": "https://pbs.twimg.com/media/GvBahvbWUAEirlr.jpg",
        "original_info": {
          "focus_rects": [
            {
              "h": 896,
              "w": 1600,
              "x": 0,
              "y": 0
            },
            {
              "h": 946,
              "w": 946,
              "x": 654,
              "y": 0
            },
            {
              "h": 946,
              "w": 830,
              "x": 770,
              "y": 0
            },
            {
              "h": 946,
              "w": 473,
              "x": 1084,
              "y": 0
            },
            {
              "h": 946,
              "w": 1600,
              "x": 0,
              "y": 0
            }
          ],
          "height": 946,
          "width": 1600
        },
        "sizes": {
          "large": {
            "h": 946,
            "w": 1600
          }
        },
        "type": "photo",
        "url": "https://t.co/D8Ztx3LqB7"
      }
    ]
  },
  "card": null,
  "place": {},
  "entities": {},
  "quoted_tweet": null,
  "retweeted_tweet": null,
  "isLimitedReply": false,
  "article": null
}