🐦 Twitter Post Details

Viewing enriched Twitter post

@iScienceLuvr

Your Reward Function for RL is Your Best PRM for Search: Unifying RL and Search-Based TTS "we leverage adversarial inverse reinforcement learning (AIRL) combined with group relative policy optimization (GRPO) to learn a dense, dynamic PRM directly from correct reasoning traces, entirely eliminating the need for labeled intermediate process data. At inference, the resulting PRM simultaneously serves as the critic for RL rollouts and as a heuristic to effectively guide search procedure"

View on Twitter

📊 Media Metadata

{
  "media": [
    {
      "type": "photo",
      "url": "https://crmoxkoizveukayfjuyo.supabase.co/storage/v1/object/public/media/posts/1958470481050534069/media_0.jpg?",
      "filename": "media_0.jpg"
    }
  ],
  "processed_at": "2025-08-21T13:30:32.629709",
  "pipeline_version": "2.0"
}

🔧 Raw API Response

{
  "type": "tweet",
  "id": "1958470481050534069",
  "url": "https://x.com/iScienceLuvr/status/1958470481050534069",
  "twitterUrl": "https://twitter.com/iScienceLuvr/status/1958470481050534069",
  "text": "Your Reward Function for RL is Your Best PRM for Search: Unifying RL and Search-Based TTS\n\n\"we leverage adversarial inverse reinforcement learning (AIRL) combined with group relative policy optimization (GRPO) to learn a dense, dynamic PRM directly from correct reasoning traces, entirely eliminating the need for labeled intermediate process data. At inference, the resulting PRM simultaneously serves as the critic for RL rollouts and as a heuristic to effectively guide search procedure\"",
  "source": "Twitter for iPhone",
  "retweetCount": 12,
  "replyCount": 4,
  "likeCount": 88,
  "quoteCount": 0,
  "viewCount": 5045,
  "createdAt": "Thu Aug 21 10:05:23 +0000 2025",
  "lang": "en",
  "bookmarkCount": 75,
  "isReply": false,
  "inReplyToId": null,
  "conversationId": "1958470481050534069",
  "displayTextRange": [
    0,
    280
  ],
  "inReplyToUserId": null,
  "inReplyToUsername": null,
  "author": {
    "type": "user",
    "userName": "iScienceLuvr",
    "url": "https://x.com/iScienceLuvr",
    "twitterUrl": "https://twitter.com/iScienceLuvr",
    "id": "441465751",
    "name": "Tanishq Mathew Abraham, Ph.D.",
    "isVerified": false,
    "isBlueVerified": true,
    "verifiedType": null,
    "profilePicture": "https://pbs.twimg.com/profile_images/1913710019729821696/Qge4zx6u_normal.jpg",
    "coverPicture": "https://pbs.twimg.com/profile_banners/441465751/1738204246",
    "description": "",
    "location": "",
    "followers": 80211,
    "following": 1244,
    "status": "",
    "canDm": true,
    "canMediaTag": true,
    "createdAt": "Tue Dec 20 03:45:50 +0000 2011",
    "entities": {
      "description": {
        "urls": []
      },
      "url": {}
    },
    "fastFollowersCount": 0,
    "favouritesCount": 105006,
    "hasCustomTimelines": true,
    "isTranslator": false,
    "mediaCount": 2449,
    "statusesCount": 17849,
    "withheldInCountries": [],
    "affiliatesHighlightedLabel": {},
    "possiblySensitive": false,
    "pinnedTweetIds": [
      "1952221233648718307"
    ],
    "profile_bio": {
      "description": "CEO @SophontAI |\nPhD at 19 (2023) |\nFounder, ex CEO @MedARC_AI |\nex Research Director Stability AI | \nBiomed. engineer @ 14 |\nTEDx talk➡https://t.co/xPxwKTq6Qb",
      "entities": {
        "description": {
          "urls": [
            {
              "display_url": "bit.ly/3tpAuan",
              "expanded_url": "https://bit.ly/3tpAuan",
              "indices": [
                136,
                159
              ],
              "url": "https://t.co/xPxwKTq6Qb"
            }
          ],
          "user_mentions": [
            {
              "id_str": "0",
              "indices": [
                4,
                14
              ],
              "name": "",
              "screen_name": "SophontAI"
            },
            {
              "id_str": "0",
              "indices": [
                52,
                62
              ],
              "name": "",
              "screen_name": "MedARC_AI"
            }
          ]
        },
        "url": {
          "urls": [
            {
              "display_url": "sophontai.com",
              "expanded_url": "https://sophontai.com",
              "indices": [
                0,
                23
              ],
              "url": "https://t.co/uQ936JTZf1"
            }
          ]
        }
      }
    },
    "isAutomated": false,
    "automatedBy": null
  },
  "extendedEntities": {
    "media": [
      {
        "allow_download_status": {
          "allow_download": true
        },
        "display_url": "pic.twitter.com/JRUGWYmhRo",
        "expanded_url": "https://twitter.com/iScienceLuvr/status/1958470481050534069/photo/1",
        "ext_media_availability": {
          "status": "Available"
        },
        "features": {
          "large": {
            "faces": [
              {
                "h": 218,
                "w": 218,
                "x": 164,
                "y": 1289
              }
            ]
          },
          "orig": {
            "faces": [
              {
                "h": 218,
                "w": 218,
                "x": 164,
                "y": 1289
              }
            ]
          }
        },
        "id_str": "1958470432014966784",
        "indices": [
          281,
          304
        ],
        "media_key": "3_1958470432014966784",
        "media_results": {
          "id": "QXBpTWVkaWFSZXN1bHRzOgwAAQoAARst4ntDW6AACgACGy3ihq4bALUAAA==",
          "result": {
            "__typename": "ApiMedia",
            "id": "QXBpTWVkaWE6DAABCgABGy3ie0NboAAKAAIbLeKGrhsAtQAA",
            "media_key": "3_1958470432014966784"
          }
        },
        "media_url_https": "https://pbs.twimg.com/media/Gy3ie0NboAAiEd1.jpg",
        "original_info": {
          "focus_rects": [
            {
              "h": 786,
              "w": 1404,
              "x": 0,
              "y": 0
            },
            {
              "h": 1404,
              "w": 1404,
              "x": 0,
              "y": 0
            },
            {
              "h": 1601,
              "w": 1404,
              "x": 0,
              "y": 0
            },
            {
              "h": 1816,
              "w": 908,
              "x": 496,
              "y": 0
            },
            {
              "h": 1816,
              "w": 1404,
              "x": 0,
              "y": 0
            }
          ],
          "height": 1816,
          "width": 1404
        },
        "sizes": {
          "large": {
            "h": 1816,
            "w": 1404
          }
        },
        "type": "photo",
        "url": "https://t.co/JRUGWYmhRo"
      }
    ]
  },
  "card": null,
  "place": {},
  "entities": {},
  "quoted_tweet": null,
  "retweeted_tweet": null,
  "article": null
}