@markopolojarvi
.@huggingface LLM leaderboard is saying fine-tuned 30b llama v1 beats 70b llama v2 chat. I have a creeping feeling that something in our LLM benchmarks is not working that great. https://t.co/OUwfXwHKkn
Viewing enriched Twitter post
.@huggingface LLM leaderboard is saying fine-tuned 30b llama v1 beats 70b llama v2 chat. I have a creeping feeling that something in our LLM benchmarks is not working that great. https://t.co/OUwfXwHKkn
{
"created_at": "Wed Jul 19 14:07:26 +0000 2023",
"id": 1681667064119828480,
"id_str": "1681667064119828480",
"full_text": ".@huggingface LLM leaderboard is saying fine-tuned 30b llama v1 beats 70b llama v2 chat.\n\nI have a creeping feeling that something in our LLM benchmarks is not working that great. https://t.co/OUwfXwHKkn",
"truncated": false,
"display_text_range": [
0,
179
],
"entities": {
"hashtags": [],
"symbols": [],
"user_mentions": [
{
"screen_name": "huggingface",
"name": "Hugging Face",
"id": 778764142412984320,
"id_str": "778764142412984320",
"indices": [
1,
13
]
}
],
"urls": [],
"media": [
{
"id": 1681664287855591424,
"id_str": "1681664287855591424",
"indices": [
180,
203
],
"media_url": "http://pbs.twimg.com/media/F1Z4wo0XwAAMudP.jpg",
"media_url_https": "https://pbs.twimg.com/media/F1Z4wo0XwAAMudP.jpg",
"url": "https://t.co/OUwfXwHKkn",
"display_url": "pic.twitter.com/OUwfXwHKkn",
"expanded_url": "https://twitter.com/markopolojarvi/status/1681667064119828480/photo/1",
"type": "photo",
"sizes": {
"thumb": {
"w": 150,
"h": 150,
"resize": "crop"
},
"medium": {
"w": 1148,
"h": 508,
"resize": "fit"
},
"small": {
"w": 680,
"h": 301,
"resize": "fit"
},
"large": {
"w": 1148,
"h": 508,
"resize": "fit"
}
}
}
]
},
"extended_entities": {
"media": [
{
"id": 1681664287855591424,
"id_str": "1681664287855591424",
"indices": [
180,
203
],
"media_url": "http://pbs.twimg.com/media/F1Z4wo0XwAAMudP.jpg",
"media_url_https": "https://pbs.twimg.com/media/F1Z4wo0XwAAMudP.jpg",
"url": "https://t.co/OUwfXwHKkn",
"display_url": "pic.twitter.com/OUwfXwHKkn",
"expanded_url": "https://twitter.com/markopolojarvi/status/1681667064119828480/photo/1",
"type": "photo",
"sizes": {
"thumb": {
"w": 150,
"h": 150,
"resize": "crop"
},
"medium": {
"w": 1148,
"h": 508,
"resize": "fit"
},
"small": {
"w": 680,
"h": 301,
"resize": "fit"
},
"large": {
"w": 1148,
"h": 508,
"resize": "fit"
}
}
}
]
},
"source": "<a href=\"https://mobile.twitter.com\" rel=\"nofollow\">Twitter Web App</a>",
"in_reply_to_status_id": null,
"in_reply_to_status_id_str": null,
"in_reply_to_user_id": null,
"in_reply_to_user_id_str": null,
"in_reply_to_screen_name": null,
"user": {
"id": 30666040,
"id_str": "30666040",
"name": "Marko 🎩",
"screen_name": "markopolojarvi",
"location": "",
"description": "A ghost in the machine\nAccelerate, decentralize and set it all free\nDMs are open\n\nBuilding @PromptC0 █",
"url": null,
"entities": {
"description": {
"urls": []
}
},
"protected": false,
"followers_count": 3160,
"friends_count": 301,
"listed_count": 115,
"created_at": "Sun Apr 12 15:30:13 +0000 2009",
"favourites_count": 8148,
"utc_offset": null,
"time_zone": null,
"geo_enabled": true,
"verified": false,
"statuses_count": 2034,
"lang": null,
"contributors_enabled": false,
"is_translator": false,
"is_translation_enabled": false,
"profile_background_color": "000000",
"profile_background_image_url": "http://abs.twimg.com/images/themes/theme14/bg.gif",
"profile_background_image_url_https": "https://abs.twimg.com/images/themes/theme14/bg.gif",
"profile_background_tile": true,
"profile_image_url": "http://pbs.twimg.com/profile_images/1645507577558585346/slcl5CCK_normal.jpg",
"profile_image_url_https": "https://pbs.twimg.com/profile_images/1645507577558585346/slcl5CCK_normal.jpg",
"profile_banner_url": "https://pbs.twimg.com/profile_banners/30666040/1676024345",
"profile_link_color": "0689CD",
"profile_sidebar_border_color": "000000",
"profile_sidebar_fill_color": "000000",
"profile_text_color": "E6E6E6",
"profile_use_background_image": false,
"has_extended_profile": true,
"default_profile": false,
"default_profile_image": false,
"following": false,
"follow_request_sent": false,
"notifications": false,
"translator_type": "none",
"withheld_in_countries": []
},
"geo": null,
"coordinates": null,
"place": null,
"contributors": null,
"is_quote_status": false,
"retweet_count": 2,
"favorite_count": 18,
"favorited": false,
"retweeted": false,
"possibly_sensitive": false,
"possibly_sensitive_appealable": false,
"lang": "en"
}