@omarsar0
A short tutorial on how to apply LLM-as-a-judge for evaluation. The idea is simple but can be used in many creative and flexible ways to assess the performance of LLMs on a wide range of tasks. https://t.co/qYdIaQsmgz
Viewing enriched Twitter post
A short tutorial on how to apply LLM-as-a-judge for evaluation. The idea is simple but can be used in many creative and flexible ways to assess the performance of LLMs on a wide range of tasks. https://t.co/qYdIaQsmgz
{
"score": 1.0,
"scored_at": "2025-08-09T13:46:07.551664",
"import_source": "network_archive_import",
"links_checked": true,
"checked_at": "2025-08-10T10:32:48.136219",
"media": [
{
"type": "video",
"url": "https://crmoxkoizveukayfjuyo.supabase.co/storage/v1/object/public/media/posts/1853537993438515664/media_0.mp4?",
"filename": "media_0.mp4"
},
{
"id": "",
"type": "video",
"url": null,
"media_url": "https://pbs.twimg.com/ext_tw_video_thumb/1853537370571780097/pu/img/R8Hxdjl9v_484pmF.jpg",
"media_url_https": null,
"display_url": null,
"expanded_url": null
}
],
"reprocessed_at": "2025-08-12T15:25:57.259810",
"reprocessed_reason": "missing_media_array",
"original_structure": "had_both"
} {
"user": {
"created_at": "2015-09-04T12:59:26.000Z",
"default_profile_image": false,
"description": "Building with AI Agents @dair_ai • Prev: Meta AI, Elastic, Galactica LLM, PhD • I also teach how to build with LLMs, RAG & AI Agents ⬇️",
"fast_followers_count": 0,
"favourites_count": 27933,
"followers_count": 216712,
"friends_count": 532,
"has_custom_timelines": true,
"is_translator": false,
"listed_count": 3688,
"location": "",
"media_count": 2656,
"name": "elvis",
"normal_followers_count": 216712,
"possibly_sensitive": false,
"profile_banner_url": "https://pbs.twimg.com/profile_banners/3448284313/1565974901",
"profile_image_url_https": "https://pbs.twimg.com/profile_images/939313677647282181/vZjFWtAn_normal.jpg",
"screen_name": "omarsar0",
"statuses_count": 12439,
"translator_type": "regular",
"url": "https://t.co/JBU5beHQNs",
"verified": true,
"withheld_in_countries": [],
"id_str": "3448284313"
},
"id": "1853537993438515664",
"conversation_id": "1853537993438515664",
"full_text": "A short tutorial on how to apply LLM-as-a-judge for evaluation. \n\nThe idea is simple but can be used in many creative and flexible ways to assess the performance of LLMs on a wide range of tasks. https://t.co/qYdIaQsmgz",
"reply_count": 7,
"retweet_count": 77,
"favorite_count": 424,
"hashtags": [],
"symbols": [],
"user_mentions": [],
"urls": [],
"media": [
{
"media_url": "https://pbs.twimg.com/ext_tw_video_thumb/1853537370571780097/pu/img/R8Hxdjl9v_484pmF.jpg",
"type": "video",
"video_url": "https://video.twimg.com/ext_tw_video/1853537370571780097/pu/vid/avc1/1280x720/6EiesL1gQXFnJgVL.mp4?tag=12"
}
],
"url": "https://twitter.com/omarsar0/status/1853537993438515664",
"created_at": "2024-11-04T20:41:09.000Z",
"#sort_index": "1853537993438515664",
"view_count": 33509,
"quote_count": 2,
"is_quote_tweet": false,
"is_retweet": false,
"is_pinned": false,
"is_truncated": false,
"startUrl": "https://x.com/omarsar0/status/1853537993438515664"
}