@HamelHusain
RT @yunta_tsai: Many people think any given ML project is 99% training. In reality, it’s 50% evaluation, 40% data cleaning, 8% integration…
Viewing enriched Twitter post
RT @yunta_tsai: Many people think any given ML project is 99% training. In reality, it’s 50% evaluation, 40% data cleaning, 8% integration…
{
"score": 0.38,
"score_components": {
"author": 0.09,
"engagement": 0.0,
"quality": 0.08000000000000002,
"source": 0.135,
"nlp": 0.05,
"recency": 0.025
},
"scored_at": "2026-06-20T21:33:38.634544",
"import_source": "api_import",
"source_tagged_at": "2026-06-20T21:33:38.634557",
"enriched": true,
"enriched_at": "2026-06-20T21:33:38.634561"
} {
"type": "tweet",
"id": "2068445948209135752",
"url": "https://x.com/HamelHusain/status/2068445948209135752",
"twitterUrl": "https://twitter.com/HamelHusain/status/2068445948209135752",
"text": "RT @yunta_tsai: Many people think any given ML project is 99% training.\n\nIn reality, it’s 50% evaluation, 40% data cleaning, 8% integration…",
"source": "Twitter for iPhone",
"retweetCount": 518,
"replyCount": 357,
"likeCount": 5235,
"quoteCount": 117,
"viewCount": 8518209,
"createdAt": "Sat Jun 20 21:28:38 +0000 2026",
"lang": "en",
"bookmarkCount": 2730,
"isReply": false,
"inReplyToId": null,
"conversationId": "2068445948209135752",
"displayTextRange": [
0,
140
],
"inReplyToUserId": null,
"inReplyToUsername": null,
"author": {
"type": "user",
"userName": "HamelHusain",
"url": "https://x.com/HamelHusain",
"twitterUrl": "https://twitter.com/HamelHusain",
"id": "825766640",
"name": "Hamel Husain",
"isVerified": false,
"isBlueVerified": true,
"verifiedType": null,
"profilePicture": "https://pbs.twimg.com/profile_images/1287206199088173057/ixE4fKy1_normal.jpg",
"coverPicture": "https://pbs.twimg.com/profile_banners/825766640/1758993452",
"description": "",
"location": "Looking at the data",
"followers": 48660,
"following": 2553,
"status": "",
"canDm": true,
"canMediaTag": false,
"createdAt": "Sat Sep 15 18:45:02 +0000 2012",
"entities": {
"description": {
"urls": []
},
"url": {}
},
"fastFollowersCount": 0,
"favouritesCount": 17995,
"hasCustomTimelines": true,
"isTranslator": false,
"mediaCount": 1565,
"statusesCount": 16627,
"withheldInCountries": [],
"affiliatesHighlightedLabel": {},
"possiblySensitive": false,
"pinnedTweetIds": [
"2037184894540054974"
],
"profile_bio": {
"description": "Bringing data science back to AI - https://t.co/Zrmp6LRd9c\n\nAbout Me: https://t.co/P6WyeKkyTa",
"entities": {
"description": {
"urls": [
{
"display_url": "evals.info",
"expanded_url": "http://evals.info",
"indices": [
36,
59
],
"url": "https://t.co/Zrmp6LRd9c"
},
{
"display_url": "hamel.dev",
"expanded_url": "https://hamel.dev",
"indices": [
71,
94
],
"url": "https://t.co/P6WyeKkyTa"
}
]
},
"url": {
"urls": [
{
"display_url": "evals.info",
"expanded_url": "http://evals.info",
"indices": [
0,
23
],
"url": "https://t.co/Zrmp6LRd9c"
}
]
}
}
},
"isAutomated": false,
"automatedBy": null
},
"extendedEntities": {},
"card": null,
"place": {},
"entities": {
"user_mentions": [
{
"id_str": "1577705091737432070",
"indices": [
3,
14
],
"name": "Yun-Ta Tsai",
"screen_name": "yunta_tsai"
}
]
},
"quoted_tweet": null,
"retweeted_tweet": {
"type": "tweet",
"id": "2068364559698780520",
"url": "https://x.com/yunta_tsai/status/2068364559698780520",
"twitterUrl": "https://twitter.com/yunta_tsai/status/2068364559698780520",
"text": "Many people think any given ML project is 99% training.\n\nIn reality, it’s 50% evaluation, 40% data cleaning, 8% integration, and 2% training.\n\nThe first two set the noise floor for learning. No ML magic matters; the model cannot lower the noise floor, as that’s the optimal bound of Shannon encoding of your data.\n\nThus, not a single day goes by without me thinking about ontology. Even the old labels have to be constantly reviewed.",
"source": "Twitter for iPhone",
"retweetCount": 518,
"replyCount": 357,
"likeCount": 5235,
"quoteCount": 117,
"viewCount": 8518209,
"createdAt": "Sat Jun 20 16:05:14 +0000 2026",
"lang": "en",
"bookmarkCount": 2730,
"isReply": false,
"inReplyToId": null,
"conversationId": "2068364559698780520",
"displayTextRange": [
0,
279
],
"inReplyToUserId": null,
"inReplyToUsername": null,
"author": {
"type": "user",
"userName": "yunta_tsai",
"url": "https://x.com/yunta_tsai",
"twitterUrl": "https://twitter.com/yunta_tsai",
"id": "1577705091737432070",
"name": "Yun-Ta Tsai",
"isVerified": false,
"isBlueVerified": true,
"verifiedType": null,
"profilePicture": "https://pbs.twimg.com/profile_images/2035915849819938816/b6kIsNMe_normal.jpg",
"coverPicture": "https://pbs.twimg.com/profile_banners/1577705091737432070/1773849991",
"description": "",
"location": "Earth",
"followers": 104623,
"following": 215,
"status": "",
"canDm": false,
"canMediaTag": false,
"createdAt": "Wed Oct 05 17:00:03 +0000 2022",
"entities": {
"description": {
"urls": []
},
"url": {}
},
"fastFollowersCount": 0,
"favouritesCount": 106700,
"hasCustomTimelines": true,
"isTranslator": false,
"mediaCount": 1205,
"statusesCount": 13254,
"withheldInCountries": [],
"affiliatesHighlightedLabel": {},
"possiblySensitive": false,
"pinnedTweetIds": [
"1949190558385144060"
],
"profile_bio": {
"description": "Sr. Staff Engineer @Tesla_AI",
"entities": {
"description": {
"user_mentions": [
{
"id_str": "",
"indices": [
20,
29
],
"name": "",
"screen_name": "Tesla_AI"
}
]
}
}
},
"isAutomated": false,
"automatedBy": null
},
"extendedEntities": {},
"card": null,
"place": {},
"entities": {
"hashtags": [],
"symbols": [],
"urls": [],
"user_mentions": []
},
"quoted_tweet": null,
"retweeted_tweet": null,
"isLimitedReply": false,
"communityInfo": null,
"article": null
},
"isLimitedReply": false,
"communityInfo": null,
"article": null
}