@_akhaliq
RT @FuxiaoL: What if a VLM could teach itself from zero data? Meet MM-Zero: one base model that self-evolves by playing 3 roles: 🧠 Propose…
Viewing enriched Twitter post
RT @FuxiaoL: What if a VLM could teach itself from zero data? Meet MM-Zero: one base model that self-evolves by playing 3 roles: 🧠 Propose…
{
"score": 0.34,
"score_components": {
"author": 0.09,
"engagement": 0.0,
"quality": 0.04000000000000001,
"source": 0.135,
"nlp": 0.05,
"recency": 0.025
},
"scored_at": "2026-03-12T01:36:00.300225",
"import_source": "api_import",
"source_tagged_at": "2026-03-12T01:36:00.300237",
"enriched": true,
"enriched_at": "2026-03-12T01:36:00.300240"
} {
"type": "tweet",
"id": "2031906448838410488",
"url": "https://x.com/_akhaliq/status/2031906448838410488",
"twitterUrl": "https://twitter.com/_akhaliq/status/2031906448838410488",
"text": "RT @FuxiaoL: What if a VLM could teach itself from zero data?\n\nMeet MM-Zero: one base model that self-evolves by playing 3 roles:\n🧠 Propose…",
"source": "Twitter for iPhone",
"retweetCount": 1,
"replyCount": 1,
"likeCount": 3,
"quoteCount": 0,
"viewCount": 267,
"createdAt": "Thu Mar 12 01:33:43 +0000 2026",
"lang": "en",
"bookmarkCount": 1,
"isReply": false,
"inReplyToId": null,
"conversationId": "2031906448838410488",
"displayTextRange": [
0,
140
],
"inReplyToUserId": null,
"inReplyToUsername": null,
"author": {
"type": "user",
"userName": "_akhaliq",
"url": "https://x.com/_akhaliq",
"twitterUrl": "https://twitter.com/_akhaliq",
"id": "2465283662",
"name": "AK",
"isVerified": false,
"isBlueVerified": true,
"verifiedType": null,
"profilePicture": "https://pbs.twimg.com/profile_images/1451191636810092553/kpM5Fe12_normal.jpg",
"coverPicture": "https://pbs.twimg.com/profile_banners/2465283662/1610997549",
"description": "",
"location": "",
"followers": 462893,
"following": 3145,
"status": "",
"canDm": true,
"canMediaTag": true,
"createdAt": "Sun Apr 27 00:20:12 +0000 2014",
"entities": {
"description": {
"urls": []
},
"url": {}
},
"fastFollowersCount": 0,
"favouritesCount": 37692,
"hasCustomTimelines": true,
"isTranslator": false,
"mediaCount": 19320,
"statusesCount": 46044,
"withheldInCountries": [],
"affiliatesHighlightedLabel": {},
"possiblySensitive": false,
"pinnedTweetIds": [
"1844746338396770616"
],
"profile_bio": {
"description": "AI research paper tweets, ML @Gradio (acq. by @HuggingFace 🤗) dm for promo ,submit papers here: https://t.co/UzmYN5XOCi",
"entities": {
"description": {
"hashtags": [],
"symbols": [],
"urls": [
{
"display_url": "huggingface.co/papers/submit",
"expanded_url": "https://huggingface.co/papers/submit",
"indices": [
96,
119
],
"url": "https://t.co/UzmYN5XOCi"
}
],
"user_mentions": [
{
"id_str": "0",
"indices": [
29,
36
],
"name": "",
"screen_name": "Gradio"
},
{
"id_str": "0",
"indices": [
46,
58
],
"name": "",
"screen_name": "HuggingFace"
}
]
},
"url": {
"urls": [
{
"display_url": "huggingface.co/akhaliq",
"expanded_url": "https://huggingface.co/akhaliq",
"indices": [
0,
23
],
"url": "https://t.co/q2Qoey80Gx"
}
]
}
}
},
"isAutomated": false,
"automatedBy": null
},
"extendedEntities": {},
"card": null,
"place": {},
"entities": {
"hashtags": [],
"symbols": [],
"timestamps": [],
"urls": [],
"user_mentions": [
{
"id_str": "1454019929020186625",
"indices": [
3,
11
],
"name": "Fuxiao Liu",
"screen_name": "FuxiaoL"
}
]
},
"quoted_tweet": null,
"retweeted_tweet": {
"type": "tweet",
"id": "2031904279309492499",
"url": "https://x.com/FuxiaoL/status/2031904279309492499",
"twitterUrl": "https://twitter.com/FuxiaoL/status/2031904279309492499",
"text": "What if a VLM could teach itself from zero data?\n\nMeet MM-Zero: one base model that self-evolves by playing 3 roles:\n🧠 Proposer – imagines visual concepts\n💻 Coder – renders them in Python/SVG\n🔎 Solver – reasons over the results\n\nNo seed images. Just RL (GRPO) + execution feedback. @zli12321 @ChengsongH31219",
"source": "Twitter for iPhone",
"retweetCount": 1,
"replyCount": 1,
"likeCount": 3,
"quoteCount": 0,
"viewCount": 267,
"createdAt": "Thu Mar 12 01:25:05 +0000 2026",
"lang": "en",
"bookmarkCount": 1,
"isReply": false,
"inReplyToId": null,
"conversationId": "2031904279309492499",
"displayTextRange": [
0,
271
],
"inReplyToUserId": null,
"inReplyToUsername": null,
"author": {
"type": "user",
"userName": "FuxiaoL",
"url": "https://x.com/FuxiaoL",
"twitterUrl": "https://twitter.com/FuxiaoL",
"id": "1454019929020186625",
"name": "Fuxiao Liu",
"isVerified": false,
"isBlueVerified": true,
"verifiedType": null,
"profilePicture": "https://pbs.twimg.com/profile_images/1678665590704308225/qE3CRzM0_normal.jpg",
"coverPicture": "",
"description": "",
"location": "Washington, DC",
"followers": 842,
"following": 742,
"status": "",
"canDm": false,
"canMediaTag": true,
"createdAt": "Fri Oct 29 09:39:14 +0000 2021",
"entities": {
"description": {
"urls": []
},
"url": {}
},
"fastFollowersCount": 0,
"favouritesCount": 389,
"hasCustomTimelines": true,
"isTranslator": false,
"mediaCount": 13,
"statusesCount": 114,
"withheldInCountries": [],
"affiliatesHighlightedLabel": {},
"possiblySensitive": false,
"pinnedTweetIds": [],
"profile_bio": {
"description": "Research Scientist @Nvidia | CS PhD @UMDCSI, working on LLM, Multimodal Stuff",
"entities": {
"description": {
"hashtags": [],
"symbols": [],
"urls": [],
"user_mentions": [
{
"id_str": "0",
"indices": [
19,
26
],
"name": "",
"screen_name": "Nvidia"
},
{
"id_str": "0",
"indices": [
36,
43
],
"name": "",
"screen_name": "UMDCSI"
}
]
},
"url": {
"urls": [
{
"display_url": "scholar.google.ca/citations?user…",
"expanded_url": "https://scholar.google.ca/citations?user=e0P54E4AAAAJ&hl=en",
"indices": [
0,
23
],
"url": "https://t.co/iCVON5vSrU"
}
]
}
}
},
"isAutomated": false,
"automatedBy": null
},
"extendedEntities": {},
"card": null,
"place": {},
"entities": {
"hashtags": [],
"symbols": [],
"urls": [],
"user_mentions": [
{
"id_str": "1634037176051589121",
"indices": [
282,
291
],
"name": "Zongxia Li",
"screen_name": "zli12321"
},
{
"id_str": "1684037808649011200",
"indices": [
292,
308
],
"name": "ChengSong Huang",
"screen_name": "ChengsongH31219"
}
]
},
"quoted_tweet": {
"type": "tweet",
"id": "2031783306174329233",
"url": "https://x.com/_akhaliq/status/2031783306174329233",
"twitterUrl": "https://twitter.com/_akhaliq/status/2031783306174329233",
"text": "MM-Zero\n\nSelf-Evolving Multi-Model Vision Language Models From Zero Data\n\npaper: https://t.co/o5d40EF8yo https://t.co/B69LwZozWE",
"source": "Twitter for iPhone",
"retweetCount": 6,
"replyCount": 2,
"likeCount": 28,
"quoteCount": 3,
"viewCount": 7648,
"createdAt": "Wed Mar 11 17:24:23 +0000 2026",
"lang": "it",
"bookmarkCount": 27,
"isReply": false,
"inReplyToId": null,
"conversationId": "2031783306174329233",
"displayTextRange": [
0,
104
],
"inReplyToUserId": null,
"inReplyToUsername": null,
"author": {
"type": "user",
"userName": "_akhaliq",
"url": "https://x.com/_akhaliq",
"twitterUrl": "https://twitter.com/_akhaliq",
"id": "2465283662",
"name": "AK",
"isVerified": false,
"isBlueVerified": true,
"verifiedType": null,
"profilePicture": "https://pbs.twimg.com/profile_images/1451191636810092553/kpM5Fe12_normal.jpg",
"coverPicture": "https://pbs.twimg.com/profile_banners/2465283662/1610997549",
"description": "",
"location": "",
"followers": 462893,
"following": 3145,
"status": "",
"canDm": true,
"canMediaTag": true,
"createdAt": "Sun Apr 27 00:20:12 +0000 2014",
"entities": {
"description": {
"urls": []
},
"url": {}
},
"fastFollowersCount": 0,
"favouritesCount": 37692,
"hasCustomTimelines": true,
"isTranslator": false,
"mediaCount": 19320,
"statusesCount": 46044,
"withheldInCountries": [],
"affiliatesHighlightedLabel": {},
"possiblySensitive": false,
"pinnedTweetIds": [
"1844746338396770616"
],
"profile_bio": {
"description": "AI research paper tweets, ML @Gradio (acq. by @HuggingFace 🤗) dm for promo ,submit papers here: https://t.co/UzmYN5XOCi",
"entities": {
"description": {
"hashtags": [],
"symbols": [],
"urls": [
{
"display_url": "huggingface.co/papers/submit",
"expanded_url": "https://huggingface.co/papers/submit",
"indices": [
96,
119
],
"url": "https://t.co/UzmYN5XOCi"
}
],
"user_mentions": [
{
"id_str": "0",
"indices": [
29,
36
],
"name": "",
"screen_name": "Gradio"
},
{
"id_str": "0",
"indices": [
46,
58
],
"name": "",
"screen_name": "HuggingFace"
}
]
},
"url": {
"urls": [
{
"display_url": "huggingface.co/akhaliq",
"expanded_url": "https://huggingface.co/akhaliq",
"indices": [
0,
23
],
"url": "https://t.co/q2Qoey80Gx"
}
]
}
}
},
"isAutomated": false,
"automatedBy": null
},
"extendedEntities": {
"media": [
{
"allow_download_status": {
"allow_download": true
},
"display_url": "pic.twitter.com/B69LwZozWE",
"expanded_url": "https://twitter.com/_akhaliq/status/2031783306174329233/photo/1",
"ext_media_availability": {
"status": "Available"
},
"features": {
"large": {
"faces": []
},
"orig": {
"faces": []
}
},
"id_str": "2031783250511704065",
"indices": [
105,
128
],
"media_key": "3_2031783250511704065",
"media_results": {
"id": "QXBpTWVkaWFSZXN1bHRzOgwAAQoAARwyWBn7VrABCgACHDJYJvEW8ZEAAA==",
"result": {
"__typename": "ApiMedia",
"id": "QXBpTWVkaWE6DAABCgABHDJYGftWsAEKAAIcMlgm8RbxkQAA",
"media_key": "3_2031783250511704065"
}
},
"media_url_https": "https://pbs.twimg.com/media/HDJYGftWsAEeMT-.jpg",
"original_info": {
"focus_rects": [
{
"h": 852,
"w": 1522,
"x": 0,
"y": 0
},
{
"h": 1356,
"w": 1356,
"x": 0,
"y": 0
},
{
"h": 1356,
"w": 1189,
"x": 0,
"y": 0
},
{
"h": 1356,
"w": 678,
"x": 0,
"y": 0
},
{
"h": 1356,
"w": 1522,
"x": 0,
"y": 0
}
],
"height": 1356,
"width": 1522
},
"sizes": {
"large": {
"h": 1356,
"w": 1522
}
},
"type": "photo",
"url": "https://t.co/B69LwZozWE"
}
]
},
"card": null,
"place": {},
"entities": {
"hashtags": [],
"symbols": [],
"timestamps": [],
"urls": [
{
"display_url": "huggingface.co/papers/2603.09…",
"expanded_url": "https://huggingface.co/papers/2603.09206",
"indices": [
81,
104
],
"url": "https://t.co/o5d40EF8yo"
}
],
"user_mentions": []
},
"quoted_tweet": null,
"retweeted_tweet": null,
"isLimitedReply": false,
"article": null
},
"retweeted_tweet": null,
"isLimitedReply": false,
"article": null
},
"isLimitedReply": false,
"article": null
}