🐦 Twitter Post Details

Viewing enriched Twitter post

@jerryjliu0

Scalably Parsing 1M+ PDFs with AI Agents 📈📑 Here’s a simple tutorial we wrote up showing you how to parse a directory of an arbitrary number of PDFs through our service in a reliable, efficient manner. LlamaParse is designed to handle very large workloads; with some simple primitives like asyncio/semaphores along with setting worker parameters, you’ll be able to get the results much more quickly than doing a forloop through everything. Check it out! https://t.co/HbNLxMj1qB

Media 1

📊 Media Metadata

{
  "media": [
    {
      "url": "https://crmoxkoizveukayfjuyo.supabase.co/storage/v1/object/public/media/posts/1998172212969496822/media_0.jpg?",
      "media_url": "https://crmoxkoizveukayfjuyo.supabase.co/storage/v1/object/public/media/posts/1998172212969496822/media_0.jpg?",
      "type": "photo",
      "filename": "media_0.jpg"
    }
  ],
  "processed_at": "2025-12-09T03:52:45.986862",
  "pipeline_version": "2.0"
}

🔧 Raw API Response

{
  "type": "tweet",
  "id": "1998172212969496822",
  "url": "https://x.com/jerryjliu0/status/1998172212969496822",
  "twitterUrl": "https://twitter.com/jerryjliu0/status/1998172212969496822",
  "text": "Scalably Parsing 1M+ PDFs with AI Agents 📈📑\n\nHere’s a simple tutorial we wrote up showing you how to parse a directory of an arbitrary number of PDFs through our service in a reliable, efficient manner.\n\nLlamaParse is designed to handle very large workloads; with some simple primitives like asyncio/semaphores along with setting worker parameters, you’ll be able to get the results much more quickly than doing a forloop through everything.\n\nCheck it out! https://t.co/HbNLxMj1qB",
  "source": "Twitter for iPhone",
  "retweetCount": 13,
  "replyCount": 5,
  "likeCount": 65,
  "quoteCount": 0,
  "viewCount": 6095,
  "createdAt": "Mon Dec 08 23:25:54 +0000 2025",
  "lang": "en",
  "bookmarkCount": 67,
  "isReply": false,
  "inReplyToId": null,
  "conversationId": "1998172212969496822",
  "displayTextRange": [
    0,
    276
  ],
  "inReplyToUserId": null,
  "inReplyToUsername": null,
  "author": {
    "type": "user",
    "userName": "jerryjliu0",
    "url": "https://x.com/jerryjliu0",
    "twitterUrl": "https://twitter.com/jerryjliu0",
    "id": "369777416",
    "name": "Jerry Liu",
    "isVerified": false,
    "isBlueVerified": true,
    "verifiedType": null,
    "profilePicture": "https://pbs.twimg.com/profile_images/1283610285031460864/1Q4zYhtb_normal.jpg",
    "coverPicture": "",
    "description": "document OCR + workflows @llama_index. cofounder/CEO\n\nCareers: https://t.co/EUnMNmb4DZ\nEnterprise: https://t.co/Ht5jwxRU13",
    "location": "",
    "followers": 67032,
    "following": 1391,
    "status": "",
    "canDm": true,
    "canMediaTag": true,
    "createdAt": "Wed Sep 07 22:54:31 +0000 2011",
    "entities": {
      "description": {
        "urls": [
          {
            "display_url": "llamaindex.ai/careers",
            "expanded_url": "https://www.llamaindex.ai/careers",
            "url": "https://t.co/EUnMNmb4DZ",
            "indices": [
              63,
              86
            ]
          },
          {
            "display_url": "llamaindex.ai/contact",
            "expanded_url": "https://www.llamaindex.ai/contact",
            "url": "https://t.co/Ht5jwxRU13",
            "indices": [
              99,
              122
            ]
          }
        ]
      },
      "url": {
        "urls": [
          {
            "display_url": "llamaindex.ai",
            "expanded_url": "https://www.llamaindex.ai/",
            "url": "https://t.co/YiIfjVl1ly",
            "indices": [
              0,
              23
            ]
          }
        ]
      }
    },
    "fastFollowersCount": 0,
    "favouritesCount": 7953,
    "hasCustomTimelines": true,
    "isTranslator": false,
    "mediaCount": 1337,
    "statusesCount": 6314,
    "withheldInCountries": [],
    "affiliatesHighlightedLabel": {},
    "possiblySensitive": false,
    "pinnedTweetIds": [
      "1997048645817192638"
    ],
    "profile_bio": {},
    "isAutomated": false,
    "automatedBy": null
  },
  "extendedEntities": {
    "media": [
      {
        "display_url": "pic.x.com/bU7fKdxmEb",
        "expanded_url": "https://x.com/jerryjliu0/status/1998172212969496822/photo/1",
        "id_str": "1998172205512060928",
        "indices": [
          277,
          300
        ],
        "media_key": "3_1998172205512060928",
        "media_url_https": "https://pbs.twimg.com/media/G7rvCL2a8AA5_gs.jpg",
        "type": "photo",
        "url": "https://t.co/bU7fKdxmEb",
        "ext_media_availability": {
          "status": "Available"
        },
        "features": {
          "large": {
            "faces": [
              {
                "x": 183,
                "y": 241,
                "h": 112,
                "w": 112
              }
            ]
          },
          "medium": {
            "faces": [
              {
                "x": 175,
                "y": 230,
                "h": 107,
                "w": 107
              }
            ]
          },
          "small": {
            "faces": [
              {
                "x": 99,
                "y": 130,
                "h": 60,
                "w": 60
              }
            ]
          },
          "orig": {
            "faces": [
              {
                "x": 183,
                "y": 241,
                "h": 112,
                "w": 112
              }
            ]
          }
        },
        "sizes": {
          "large": {
            "h": 1254,
            "w": 1210,
            "resize": "fit"
          },
          "medium": {
            "h": 1200,
            "w": 1158,
            "resize": "fit"
          },
          "small": {
            "h": 680,
            "w": 656,
            "resize": "fit"
          },
          "thumb": {
            "h": 150,
            "w": 150,
            "resize": "crop"
          }
        },
        "original_info": {
          "height": 1254,
          "width": 1210,
          "focus_rects": [
            {
              "x": 0,
              "y": 0,
              "w": 1210,
              "h": 678
            },
            {
              "x": 0,
              "y": 0,
              "w": 1210,
              "h": 1210
            },
            {
              "x": 0,
              "y": 0,
              "w": 1100,
              "h": 1254
            },
            {
              "x": 31,
              "y": 0,
              "w": 627,
              "h": 1254
            },
            {
              "x": 0,
              "y": 0,
              "w": 1210,
              "h": 1254
            }
          ]
        },
        "media_results": {
          "result": {
            "media_key": "3_1998172205512060928"
          }
        }
      }
    ]
  },
  "card": null,
  "place": {},
  "entities": {
    "hashtags": [],
    "symbols": [],
    "urls": [
      {
        "display_url": "developers.llamaindex.ai/python/cloud/l…",
        "expanded_url": "https://developers.llamaindex.ai/python/cloud/llamaparse/examples/async_parse_folder/?utm_source=socials&utm_medium=li_social",
        "url": "https://t.co/HbNLxMj1qB",
        "indices": [
          457,
          480
        ]
      }
    ],
    "user_mentions": []
  },
  "quoted_tweet": {
    "type": "tweet",
    "id": "1998153602637160887",
    "url": "https://x.com/llama_index/status/1998153602637160887",
    "twitterUrl": "https://twitter.com/llama_index/status/1998153602637160887",
    "text": "Need to parse multiple PDFs efficiently? Learn how to use LlamaParse with async batch processing.\n\n📁 Process entire folders of PDFs simultaneously instead of one-by-one\n⚡ Use asyncio and semaphores to control how many files parse concurrently\n🎯 Prevent API rate limit errors while maximizing throughput\n📊 Get detailed progress tracking and summary statistics for batch operations\n\nThis is perfect for processing large document collections, research papers, or any scenario where you need to parse dozens or hundreds of PDFs quickly and reliably.\n\nFull tutorial with working code examples: https://t.co/9l4vjtqKt9",
    "source": "Twitter for iPhone",
    "retweetCount": 5,
    "replyCount": 1,
    "likeCount": 22,
    "quoteCount": 1,
    "viewCount": 8992,
    "createdAt": "Mon Dec 08 22:11:57 +0000 2025",
    "lang": "en",
    "bookmarkCount": 33,
    "isReply": false,
    "inReplyToId": null,
    "conversationId": "1998153602637160887",
    "displayTextRange": [
      0,
      275
    ],
    "inReplyToUserId": null,
    "inReplyToUsername": null,
    "author": {
      "type": "user",
      "userName": "llama_index",
      "url": "https://x.com/llama_index",
      "twitterUrl": "https://twitter.com/llama_index",
      "id": "1604278358296055808",
      "name": "LlamaIndex 🦙",
      "isVerified": false,
      "isBlueVerified": true,
      "verifiedType": null,
      "profilePicture": "https://pbs.twimg.com/profile_images/1967920417760251904/0ytfduMQ_normal.png",
      "coverPicture": "https://pbs.twimg.com/profile_banners/1604278358296055808/1758023766",
      "description": "AI Agents for document OCR + workflows\n\nGithub: https://t.co/HC19j7veGE\nDocs: https://t.co/QInqg2yMCJ\nLlamaCloud: https://t.co/yQGTiRSfFL",
      "location": "",
      "followers": 104790,
      "following": 28,
      "status": "",
      "canDm": false,
      "canMediaTag": true,
      "createdAt": "Sun Dec 18 00:52:44 +0000 2022",
      "entities": {
        "description": {
          "urls": [
            {
              "display_url": "github.com/run-llama/llam…",
              "expanded_url": "http://github.com/run-llama/llama_index",
              "url": "https://t.co/HC19j7veGE",
              "indices": [
                48,
                71
              ]
            },
            {
              "display_url": "docs.llamaindex.ai",
              "expanded_url": "http://docs.llamaindex.ai",
              "url": "https://t.co/QInqg2yMCJ",
              "indices": [
                78,
                101
              ]
            },
            {
              "display_url": "cloud.llamaindex.ai",
              "expanded_url": "https://cloud.llamaindex.ai/",
              "url": "https://t.co/yQGTiRSfFL",
              "indices": [
                114,
                137
              ]
            }
          ]
        },
        "url": {
          "urls": [
            {
              "display_url": "llamaindex.ai",
              "expanded_url": "https://www.llamaindex.ai/",
              "url": "https://t.co/epzefqPT9Z",
              "indices": [
                0,
                23
              ]
            }
          ]
        }
      },
      "fastFollowersCount": 0,
      "favouritesCount": 1459,
      "hasCustomTimelines": false,
      "isTranslator": false,
      "mediaCount": 1782,
      "statusesCount": 3647,
      "withheldInCountries": [],
      "affiliatesHighlightedLabel": {},
      "possiblySensitive": false,
      "pinnedTweetIds": [],
      "profile_bio": {},
      "isAutomated": false,
      "automatedBy": null
    },
    "extendedEntities": {},
    "card": {
      "binding_values": [
        {
          "key": "domain",
          "value": {
            "string_value": "developers.llamaindex.ai",
            "type": "STRING"
          }
        },
        {
          "key": "site",
          "value": {
            "scribe_key": "publisher_id",
            "type": "USER",
            "user_value": {
              "id_str": "1604278358296055808",
              "path": []
            }
          }
        },
        {
          "key": "vanity_url",
          "value": {
            "scribe_key": "vanity_url",
            "string_value": "developers.llamaindex.ai",
            "type": "STRING"
          }
        },
        {
          "key": "title",
          "value": {
            "string_value": "Parse All PDFs in a Folder with LlamaParse",
            "type": "STRING"
          }
        },
        {
          "key": "card_url",
          "value": {
            "scribe_key": "card_url",
            "string_value": "https://t.co/9l4vjtqKt9",
            "type": "STRING"
          }
        }
      ],
      "card_platform": {
        "platform": {
          "audience": {
            "name": "production"
          },
          "device": {
            "name": "Android",
            "version": "12"
          }
        }
      },
      "name": "summary_large_image",
      "url": "https://t.co/9l4vjtqKt9",
      "user_refs_results": [
        {
          "result": {
            "__typename": "User",
            "id": "VXNlcjoxNjA0Mjc4MzU4Mjk2MDU1ODA4",
            "rest_id": "1604278358296055808",
            "affiliates_highlighted_label": {},
            "has_graduated_access": true,
            "is_blue_verified": true,
            "profile_image_shape": "Circle",
            "legacy": {
              "can_dm": false,
              "can_media_tag": true,
              "created_at": "Sun Dec 18 00:52:44 +0000 2022",
              "default_profile": true,
              "default_profile_image": false,
              "description": "AI Agents for document OCR + workflows\n\nGithub: https://t.co/HC19j7veGE\nDocs: https://t.co/QInqg2yMCJ\nLlamaCloud: https://t.co/yQGTiRSfFL",
              "entities": {
                "description": {
                  "urls": [
                    {
                      "display_url": "github.com/run-llama/llam…",
                      "expanded_url": "http://github.com/run-llama/llama_index",
                      "url": "https://t.co/HC19j7veGE",
                      "indices": [
                        48,
                        71
                      ]
                    },
                    {
                      "display_url": "docs.llamaindex.ai",
                      "expanded_url": "http://docs.llamaindex.ai",
                      "url": "https://t.co/QInqg2yMCJ",
                      "indices": [
                        78,
                        101
                      ]
                    },
                    {
                      "display_url": "cloud.llamaindex.ai",
                      "expanded_url": "https://cloud.llamaindex.ai/",
                      "url": "https://t.co/yQGTiRSfFL",
                      "indices": [
                        114,
                        137
                      ]
                    }
                  ]
                },
                "url": {
                  "urls": [
                    {
                      "display_url": "llamaindex.ai",
                      "expanded_url": "https://www.llamaindex.ai/",
                      "url": "https://t.co/epzefqPT9Z",
                      "indices": [
                        0,
                        23
                      ]
                    }
                  ]
                }
              },
              "fast_followers_count": 0,
              "favourites_count": 1459,
              "followers_count": 104790,
              "friends_count": 28,
              "has_custom_timelines": false,
              "is_translator": false,
              "listed_count": 1630,
              "location": "",
              "media_count": 1782,
              "name": "LlamaIndex 🦙",
              "normal_followers_count": 104790,
              "pinned_tweet_ids_str": [],
              "possibly_sensitive": false,
              "profile_banner_url": "https://pbs.twimg.com/profile_banners/1604278358296055808/1758023766",
              "profile_image_url_https": "https://pbs.twimg.com/profile_images/1967920417760251904/0ytfduMQ_normal.png",
              "profile_interstitial_type": "",
              "screen_name": "llama_index",
              "statuses_count": 3647,
              "translator_type": "none",
              "url": "https://t.co/epzefqPT9Z",
              "verified": false,
              "want_retweets": false,
              "withheld_in_countries": []
            },
            "tipjar_settings": {}
          }
        }
      ]
    },
    "place": {},
    "entities": {
      "hashtags": [],
      "symbols": [],
      "urls": [
        {
          "display_url": "developers.llamaindex.ai/python/cloud/l…",
          "expanded_url": "https://developers.llamaindex.ai/python/cloud/llamaparse/examples/async_parse_folder/?utm_source=socials&utm_medium=li_social",
          "url": "https://t.co/9l4vjtqKt9",
          "indices": [
            589,
            612
          ]
        }
      ],
      "user_mentions": []
    },
    "quoted_tweet": null,
    "retweeted_tweet": null,
    "article": null
  },
  "retweeted_tweet": null,
  "article": null
}