🐦 Twitter Post Details

Viewing enriched Twitter post

@askalphaxiv

Why Do Multimodal LLMs (MLLM) Struggle with Spatial Understanding? This research shows that MLLMs’ spatial struggles aren’t from data scarcity, but from architecture. Spatial ability relies on the vision encoder’s positional cues, so a redesign like prompt targeting is needed. https://t.co/g0AL7aJOs2

View on Twitter

📊 Media Metadata

{
  "media": [
    {
      "url": "https://crmoxkoizveukayfjuyo.supabase.co/storage/v1/object/public/media/posts/1965822971261718549/media_0.jpg?",
      "media_url": "https://crmoxkoizveukayfjuyo.supabase.co/storage/v1/object/public/media/posts/1965822971261718549/media_0.jpg?",
      "type": "photo",
      "filename": "media_0.jpg"
    }
  ],
  "processed_at": "2025-09-18T13:52:37.775318",
  "pipeline_version": "2.0"
}

🔧 Raw API Response

{
  "type": "tweet",
  "id": "1965822971261718549",
  "url": "https://x.com/askalphaxiv/status/1965822971261718549",
  "twitterUrl": "https://twitter.com/askalphaxiv/status/1965822971261718549",
  "text": "Why Do Multimodal LLMs (MLLM) Struggle with Spatial Understanding?\n\nThis research shows that MLLMs’ spatial struggles aren’t from data scarcity, but from architecture. Spatial ability relies on the vision encoder’s positional cues, so a redesign like prompt targeting is needed. https://t.co/g0AL7aJOs2",
  "source": "Twitter for iPhone",
  "retweetCount": 96,
  "replyCount": 6,
  "likeCount": 719,
  "quoteCount": 8,
  "viewCount": 59989,
  "createdAt": "Wed Sep 10 17:01:34 +0000 2025",
  "lang": "en",
  "bookmarkCount": 492,
  "isReply": false,
  "inReplyToId": null,
  "conversationId": "1965822971261718549",
  "displayTextRange": [
    0,
    278
  ],
  "inReplyToUserId": null,
  "inReplyToUsername": null,
  "author": {
    "type": "user",
    "userName": "askalphaxiv",
    "url": "https://x.com/askalphaxiv",
    "twitterUrl": "https://twitter.com/askalphaxiv",
    "id": "1722422481942884352",
    "name": "alphaXiv",
    "isVerified": false,
    "isBlueVerified": true,
    "verifiedType": null,
    "profilePicture": "https://pbs.twimg.com/profile_images/1866663567417806848/-Vj32Dq-_normal.jpg",
    "coverPicture": "https://pbs.twimg.com/profile_banners/1722422481942884352/1738960325",
    "description": "",
    "location": "",
    "followers": 18922,
    "following": 38,
    "status": "",
    "canDm": true,
    "canMediaTag": true,
    "createdAt": "Thu Nov 09 01:15:23 +0000 2023",
    "entities": {
      "description": {
        "urls": []
      },
      "url": {}
    },
    "fastFollowersCount": 0,
    "favouritesCount": 2102,
    "hasCustomTimelines": true,
    "isTranslator": false,
    "mediaCount": 584,
    "statusesCount": 1129,
    "withheldInCountries": [],
    "affiliatesHighlightedLabel": {},
    "possiblySensitive": false,
    "pinnedTweetIds": [
      "1934976072258617422"
    ],
    "profile_bio": {
      "description": "High fidelity research",
      "entities": {
        "description": {},
        "url": {
          "urls": [
            {
              "display_url": "alphaxiv.org",
              "expanded_url": "http://alphaxiv.org",
              "indices": [
                0,
                23
              ],
              "url": "https://t.co/7lQNcnzeZ7"
            }
          ]
        }
      }
    },
    "isAutomated": false,
    "automatedBy": null
  },
  "extendedEntities": {
    "media": [
      {
        "allow_download_status": {
          "allow_download": true
        },
        "display_url": "pic.twitter.com/g0AL7aJOs2",
        "expanded_url": "https://twitter.com/askalphaxiv/status/1965822971261718549/photo/1",
        "ext_media_availability": {
          "status": "Available"
        },
        "features": {
          "large": {},
          "orig": {}
        },
        "id_str": "1965822836582563840",
        "indices": [
          279,
          302
        ],
        "media_key": "3_1965822836582563840",
        "media_results": {
          "id": "QXBpTWVkaWFSZXN1bHRzOgwAAQoAARtIAXRZ2sAACgACG0gBk7VbkBUAAA==",
          "result": {
            "__typename": "ApiMedia",
            "id": "QXBpTWVkaWE6DAABCgABG0gBdFnawAAKAAIbSAGTtVuQFQAA",
            "media_key": "3_1965822836582563840"
          }
        },
        "media_url_https": "https://pbs.twimg.com/media/G0gBdFnawAAvloX.jpg",
        "original_info": {
          "focus_rects": [
            {
              "h": 454,
              "w": 811,
              "x": 0,
              "y": 502
            },
            {
              "h": 811,
              "w": 811,
              "x": 0,
              "y": 145
            },
            {
              "h": 925,
              "w": 811,
              "x": 0,
              "y": 31
            },
            {
              "h": 956,
              "w": 478,
              "x": 0,
              "y": 0
            },
            {
              "h": 956,
              "w": 811,
              "x": 0,
              "y": 0
            }
          ],
          "height": 956,
          "width": 811
        },
        "sizes": {
          "large": {
            "h": 956,
            "w": 811
          }
        },
        "type": "photo",
        "url": "https://t.co/g0AL7aJOs2"
      }
    ]
  },
  "card": null,
  "place": {},
  "entities": {},
  "quoted_tweet": null,
  "retweeted_tweet": null,
  "isLimitedReply": false,
  "article": null
}