🐦 Twitter Post Details

Viewing enriched Twitter post

@braintrust

We analyzed 1,781 real agent traces from @huggingface to understand what actually drives agent success across models, benchmarks, and harnesses. What we found: - The harness matters ~7× more than the model. - Open-weight models are production-ready for coding. - Cost per task and cost per success rank configs very differently.

View on Twitter

📊 Media Metadata

{
  "score": 0.38,
  "score_components": {
    "author": 0.09,
    "engagement": 0.0,
    "quality": 0.08000000000000002,
    "source": 0.135,
    "nlp": 0.05,
    "recency": 0.025
  },
  "scored_at": "2026-06-29T15:13:17.307055",
  "import_source": "api_import",
  "source_tagged_at": "2026-06-29T15:13:17.307065",
  "enriched": true,
  "enriched_at": "2026-06-29T15:13:17.307069"
}

🔧 Raw API Response

{
  "type": "tweet",
  "id": "2070177203787067498",
  "url": "https://x.com/braintrust/status/2070177203787067498",
  "twitterUrl": "https://twitter.com/braintrust/status/2070177203787067498",
  "text": "We analyzed 1,781 real agent traces from @huggingface to understand what actually drives agent success across models, benchmarks, and harnesses.\n\nWhat we found:\n- The harness matters ~7× more than the model.\n- Open-weight models are production-ready for coding.\n- Cost per task and cost per success rank configs very differently.",
  "source": "Twitter for iPhone",
  "retweetCount": 12,
  "replyCount": 5,
  "likeCount": 31,
  "quoteCount": 0,
  "viewCount": 9268,
  "createdAt": "Thu Jun 25 16:08:02 +0000 2026",
  "lang": "en",
  "bookmarkCount": 10,
  "isReply": false,
  "inReplyToId": null,
  "conversationId": "2070177203787067498",
  "displayTextRange": [
    0,
    277
  ],
  "inReplyToUserId": null,
  "inReplyToUsername": null,
  "author": {
    "type": "user",
    "userName": "braintrust",
    "url": "https://x.com/braintrust",
    "twitterUrl": "https://twitter.com/braintrust",
    "id": "1687132266391289856",
    "name": "Braintrust",
    "isVerified": false,
    "isBlueVerified": true,
    "verifiedType": "Business",
    "profilePicture": "https://pbs.twimg.com/profile_images/2023446233713700868/2kunzppe_normal.png",
    "coverPicture": "https://pbs.twimg.com/profile_banners/1687132266391289856/1771261453",
    "description": "",
    "location": "",
    "followers": 6897,
    "following": 55,
    "status": "",
    "canDm": true,
    "canMediaTag": true,
    "createdAt": "Thu Aug 03 16:04:26 +0000 2023",
    "entities": {
      "description": {
        "urls": []
      },
      "url": {}
    },
    "fastFollowersCount": 0,
    "favouritesCount": 581,
    "hasCustomTimelines": true,
    "isTranslator": false,
    "mediaCount": 265,
    "statusesCount": 769,
    "withheldInCountries": [],
    "affiliatesHighlightedLabel": {},
    "possiblySensitive": false,
    "pinnedTweetIds": [
      "2061480289289773513"
    ],
    "profile_bio": {
      "description": "The observability layer for production AI.",
      "entities": {
        "description": {},
        "url": {
          "urls": [
            {
              "display_url": "braintrust.dev",
              "expanded_url": "https://www.braintrust.dev",
              "indices": [
                0,
                23
              ],
              "url": "https://t.co/uxkCB1j2vh"
            }
          ]
        }
      }
    },
    "isAutomated": false,
    "automatedBy": null
  },
  "extendedEntities": {},
  "card": null,
  "place": {},
  "entities": {
    "hashtags": [],
    "symbols": [],
    "urls": [],
    "user_mentions": [
      {
        "id_str": "778764142412984320",
        "indices": [
          41,
          53
        ],
        "name": "Hugging Face",
        "screen_name": "huggingface"
      }
    ]
  },
  "quoted_tweet": null,
  "retweeted_tweet": null,
  "isLimitedReply": false,
  "communityInfo": null,
  "article": null
}