Disclaimer: Real Data API extracts only publicly available data and maintains a strict policy against collecting any personal or identity-related information.
Scrape Twitter data about users, including user profiles, follower counts, followings, hashtags, tweets, retweets, threads, images, statistics, videos, history, replies, and other data fields using Twitter Data Scraper. Our Twitter scraper is accessible in multiple countries, including Canada, France, Australia, Germany, the USA, the UK, Spain, etc.
Twitter Scraper loads the Twitter URLs and profiles you specify and scrapes the data described below.
Twitter Scraper on our platform allows you to scrape Twitter data at scale. It can also collect more data than the official Twitter API because it needs no registered application, Twitter account, or API key, and it imposes no rate restrictions.
You can feed the scraper a list of Twitter handles or use Twitter links such as trending topics, searches, or hashtags.
Crawling the Twitter platform gives you access to over five hundred million tweets posted daily. You can collect the data you need in multiple ways.
To learn more about using this Twitter Scraper, check out our stepwise tutorial or watch the video.
Yes, you can extract publicly available data from Twitter. Note, however, that your output may contain personal data. GDPR and similar regulations worldwide protect personal data and do not allow you to extract personal information without a legitimate reason or prior permission. Consult your lawyers if you are unsure whether your reason qualifies as legitimate.
If you wish to extract specific Twitter data quickly, try the targeted Twitter data scraper options below.
By default, the scraper extracts data using search queries, but you can also supply Twitter URLs or Twitter handles. If you plan to use the URL option, check the allowable URL types shown below.
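For illustration, the scraper typically accepts links like the following (the profile and status URLs reuse examples from the sample output later in this document; the hashtag and search links follow standard Twitter URL patterns):
https://twitter.com/elonmusk (a profile)
https://twitter.com/elonmusk/with_replies (a profile, including replies)
https://twitter.com/hashtag/dataanalytics (a hashtag)
https://twitter.com/search?q=data%20analytics&f=live (a search)
https://twitter.com/elonmusk/status/1633026246937546752 (a single thread/status)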
The log-in-with-cookies option lets the scraper reuse session cookies from an already logged-in user. With this option enabled, the scraper tries to avoid being blocked by the source platform; for example, it reduces its running speed and introduces a random delay between two actions.
We strongly recommend that you do not use your personal account to run the scraper unless there is no other option. Instead, create a new Twitter account so that Twitter won't ban your personal one.
Use a Chrome browser extension such as EditThisCookie to log in with existing cookies. Once you install it, open Twitter in your browser, log in with your credentials, and export the cookies using the extension. It will give you a cookie array to use as the value of the login cookies input when starting the scraper.
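For orientation, the exported array is a list of cookie objects. A minimal sketch of the shape (the values are placeholders, and the exact fields depend on the extension's export) looks like this:
[
    {
        "name": "auth_token", // illustrative cookie name; use whatever the export actually contains
        "value": "<YOUR_COOKIE_VALUE>",
        "domain": ".twitter.com",
        "path": "/",
        "secure": true,
        "httpOnly": true
    }
]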
If you log out of the Twitter account whose cookies you submitted, Twitter will invalidate them and the scraper will stop its execution.
Check out the video tutorial below to sort it out.
Here are the input parameters for Twitter Scraper API.
You can export the scraped dataset in multiple digestible formats such as CSV, JSON, Excel, or HTML. Every item in the scraped dataset contains a different tweet in the following format.
[{
"user": {
"protected": false,
"created_at": "2009-06-02T20:12:29.000Z",
"default_profile_image": false,
"description": "",
"fast_followers_count": 0,
"favourites_count": 19158,
"followers_count": 130769125,
"friends_count": 183,
"has_custom_timelines": true,
"is_translator": false,
"listed_count": 117751,
"location": "",
"media_count": 1435,
"name": "Elon Musk",
"normal_followers_count": 130769125,
"possibly_sensitive": false,
"profile_banner_url": "https://pbs.twimg.com/profile_banners/44196397/1576183471",
"profile_image_url_https": "https://pbs.twimg.com/profile_images/1590968738358079488/IY9Gx6Ok_normal.jpg",
"screen_name": "elonmusk",
"statuses_count": 23422,
"translator_type": "none",
"verified": true,
"withheld_in_countries": [],
"id_str": "44196397"
},
"id": "1633026246937546752",
"conversation_id": "1632363525405392896",
"full_text": "@MarkChangizi Sweden’s steadfastness was incredible!",
"reply_count": 243,
"retweet_count": 170,
"favorite_count": 1828,
"hashtags": [],
"symbols": [],
"user_mentions": [
{
"id_str": "49445813",
"name": "Mark Changizi",
"screen_name": "MarkChangizi"
}
],
"urls": [],
"media": [],
"url": "https://twitter.com/elonmusk/status/1633026246937546752",
"created_at": "2023-03-07T08:46:12.000Z",
"is_quote_tweet": false,
"replying_to_tweet": "https://twitter.com/MarkChangizi/status/1632363525405392896",
"startUrl": "https://twitter.com/elonmusk/with_replies"
},
{
"user": {
"protected": false,
"created_at": "2009-06-02T20:12:29.000Z",
"default_profile_image": false,
"description": "",
"fast_followers_count": 0,
"favourites_count": 19158,
"followers_count": 130769125,
"friends_count": 183,
"has_custom_timelines": true,
"is_translator": false,
"listed_count": 117751,
"location": "",
"media_count": 1435,
"name": "Elon Musk",
"normal_followers_count": 130769125,
"possibly_sensitive": false,
"profile_banner_url": "https://pbs.twimg.com/profile_banners/44196397/1576183471",
"profile_image_url_https": "https://pbs.twimg.com/profile_images/1590968738358079488/IY9Gx6Ok_normal.jpg",
"screen_name": "elonmusk",
"statuses_count": 23422,
"translator_type": "none",
"verified": true,
"withheld_in_countries": [],
"id_str": "44196397"
},
"id": "1633021151197954048",
"conversation_id": "1632930485281120256",
"full_text": "@greg_price11 @Liz_Cheney @AdamKinzinger @RepAdamSchiff Besides misleading the public, they withheld evidence for partisan political reasons that sent people to prison for far more serious crimes than they committed./n/nThat is deeply wrong, legally and morally.",
"reply_count": 727,
"retweet_count": 2458,
"favorite_count": 10780,
"hashtags": [],
"symbols": [],
"user_mentions": [
{
"id_str": "896466491587080194",
"name": "Greg Price",
"screen_name": "greg_price11"
},
{
"id_str": "98471035",
"name": "Liz Cheney",
"screen_name": "Liz_Cheney"
},
{
"id_str": "18004222",
"name": "Adam Kinzinger #fella",
"screen_name": "AdamKinzinger"
},
{
"id_str": "29501253",
"name": "Adam Schiff",
"screen_name": "RepAdamSchiff"
}
],
"urls": [],
"media": [],
"url": "https://twitter.com/elonmusk/status/1633021151197954048",
"created_at": "2023-03-07T08:25:57.000Z",
"is_quote_tweet": false,
"replying_to_tweet": "https://twitter.com/greg_price11/status/1632930485281120256",
"startUrl": "https://twitter.com/elonmusk/with_replies"
}]
...
Use a pre-built Advanced Search URL as a start link, for example: https://twitter.com/search?q=cool%20until%3A2021-01-01&src=typed_query
Twitter returns a maximum of 3,200 tweets per search or profile. If you need more tweets than this limit, split your start links into time slices, as in the URL samples below (a script that generates such slices follows the examples).
https://twitter.com/search?q=(from%3Aelonmusk)%20since%3A2020-03-01%20until%3A2020-04-01&src=typed_query&f=live
https://twitter.com/search?q=(from%3Aelonmusk)%20since%3A2020-02-01%20until%3A2020-03-01&src=typed_query&f=live
https://twitter.com/search?q=(from%3Aelonmusk)%20since%3A2020-01-01%20until%3A2020-02-01&src=typed_query&f=live
Each link is for the same account, Elon Musk, but we separated them into 30-day monthly time frames: January, February, and March 2020. You can create such links using Twitter's advanced search at https://twitter.com/search
If you want, you can use larger time intervals for accounts that don't post regularly.
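As a minimal sketch in plain JavaScript (no scraper-specific APIs assumed), you can generate such monthly slices programmatically; the handle and months below are illustrative:
// Build monthly time-sliced Twitter search URLs for one account.
const handle = 'elonmusk';
const months = [
    ['2020-01-01', '2020-02-01'],
    ['2020-02-01', '2020-03-01'],
    ['2020-03-01', '2020-04-01'],
];

const startUrls = months.map(([since, until]) => {
    // encodeURIComponent leaves parentheses intact and encodes spaces/colons,
    // matching the URL samples above
    const q = encodeURIComponent(`(from:${handle}) since:${since} until:${until}`);
    return `https://twitter.com/search?q=${q}&src=typed_query&f=live`;
});

console.log(startUrls.join('\n'));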
The extend output function lets you change the shape of your dataset output, split data arrays into separate items, or filter the output:
async ({ data, item, request }) => {
item.user = undefined; // removes this field from the output
delete item.user; // this works as well
const raw = data.tweets[item['#sort_index']]; // allows you to access the raw data
item.source = raw.source; // adds "Twitter for ..." to the output
if (request.userData.search) {
item.search = request.userData.search; // add the search term to the output
item.searchUrl = request.loadedUrl; // add the raw search URL to the output
}
return item;
}
Item filtering:
async ({ item }) => {
if (!item.full_text.includes('lovely')) {
return null; // omit the output if the tweet body doesn't contain the text
}
return item;
}
Separating into multiple data items and changing the entire result:
async ({ item }) => {
// dataset will be full of items like { hashtag: '#somehashtag' }
// returning an array here will split in multiple dataset items
return item.hashtags.map((hashtag) => {
return { hashtag: `#${hashtag}` };
});
}
This function lets you extend what the scraper does, and it can simplify extending the default scraper behavior without maintaining a custom version. For instance, you can include a trending-topic search on every page visit:
async ({ page, request, addSearch, addProfile, addThread, customData }) => {
await page.waitForSelector('[aria-label="Timeline: Trending now"] [data-testid="trend"]');
const trending = await page.evaluate(() => {
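// note: $ below is jQuery, which we assume the scraper injects into the page context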
const trendingEls = $('[aria-label="Timeline: Trending now"] [data-testid="trend"]');
return trendingEls.map((_, el) => {
return {
term: $(el).find('> div > div:nth-child(2)').text().trim(),
profiles: $(el).find('> div > div:nth-child(3) [role="link"]').map((_, el) => $(el).text()).get()
}
}).get();
});
for (const { term, profiles } of trending) {
await addSearch(term); // add a search using its text
for (const profile of profiles) {
await addProfile(profile); // adds a profile using link
}
}
// adds a thread and gets its replies; accepts an ID (e.g., from conversation_id) or a URL
// you can call this multiple times, but each thread will be added only once
await addThread("1351044768030142464");
}
extendScraperFunction also receives additional variables:
async ({ label, response, url }) => {
if (label === 'response' && response) {
// inside the page.on('response') callback
if (url.includes('live_pipeline')) {
// deal with plain text content
const text = await (await response.blob()).text(); // read the response body as plain text
}
} else if (label === 'before') {
// executes before the page.on('response'), can be used for intercept request/response
} else if (label === 'after') {
// executes after the scraping process has finished, even on crash
}
}
Lastly, using Real Data API Integrations, you can connect Twitter Scraper with almost any web application or cloud service, including Google Drive, Google Sheets, Airbyte, Make, Slack, GitHub, Zapier, and more. You can also use webhooks to carry out an action when an event occurs, such as getting an alert when Twitter Scraper finishes its run.
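As a purely illustrative sketch, a webhook of this kind typically pairs an event type with a target URL. The field and event names below are assumptions for illustration, not confirmed Real Data API identifiers; check the platform's webhook documentation for the real schema:
// Hypothetical webhook config -- field names and event type are illustrative assumptions
const webhook = {
    eventTypes: ['ACTOR.RUN.SUCCEEDED'], // notify when a run finishes successfully
    requestUrl: 'https://example.com/twitter-alert' // your HTTPS endpoint to receive the event
};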
The Real Data API platform gives you programmatic access to scrapers. We have organized the Twitter Scraper API around RESTful HTTP endpoints that allow you to schedule, manage, and run Real Data API scrapers. The API also lets you track actor performance, create and update versions, access datasets, retrieve results, and more.
To use the scraper from Python, try our client package on PyPI; to use it from Node.js, try our client package on NPM.
Check out the API tab for code examples or explore Real Data API reference documents for details.
You need a Real Data API account to execute the program examples. Replace <YOUR_API_TOKEN> in the code with your API token. Read the Real Data API docs for more details on the live APIs.
import { RealdataAPIClient } from 'RealdataAPI-Client';
// Initialize the RealdataAPIClient with API token
const client = new RealdataAPIClient({
token: '<YOUR_API_TOKEN>',
});
// Prepare actor input
const input = {
"searchTerms": [
"RealdataAPI"
],
"searchMode": "live",
"profilesDesired": 10,
"tweetsDesired": 100,
"mode": "replies",
"proxyConfig": {
"useRealdataAPIProxy": true
},
"extendOutputFunction": async ({ data, item, page, request, customData, RealdataAPI }) => {
return item;
},
"extendScraperFunction": async ({ page, request, addSearch, addProfile, _, addThread, addEvent, customData, RealdataAPI, signal, label }) => {
},
"customData": {},
"handlePageTimeoutSecs": 500,
"maxRequestRetries": 6,
"maxIdleTimeoutSecs": 60
};
(async () => {
// Run the actor and wait for it to finish
const run = await client.actor("quacker/twitter-scraper").call(input);
// Fetch and print actor results from the run's dataset (if any)
console.log('Results from dataset');
const { items } = await client.dataset(run.defaultDatasetId).listItems();
items.forEach((item) => {
console.dir(item);
});
})();
from RealdataAPI_client import RealdataAPIClient
# Initialize the RealdataAPIClient with your API token
client = RealdataAPIClient("<YOUR_API_TOKEN>")
# Prepare the actor input
run_input = {
"searchTerms": ["RealdataAPI"],
"searchMode": "live",
"profilesDesired": 10,
"tweetsDesired": 100,
"mode": "replies",
"proxyConfig": { "useRealdataAPIProxy": True },
"extendOutputFunction": """async ({ data, item, page, request, customData, RealdataAPI }) => {
return item;
}""",
"extendScraperFunction": """async ({ page, request, addSearch, addProfile, _, addThread, addEvent, customData, RealdataAPI, signal, label }) => {
}""",
"customData": {},
"handlePageTimeoutSecs": 500,
"maxRequestRetries": 6,
"maxIdleTimeoutSecs": 60,
}
# Run the actor and wait for it to finish
run = client.actor("quacker/twitter-scraper").call(run_input=run_input)
# Fetch and print actor results from the run's dataset (if there are any)
for item in client.dataset(run["defaultDatasetId"]).iterate_items():
print(item)
# Set API token
API_TOKEN=<YOUR_API_TOKEN>
# Prepare actor input
cat > input.json <<'EOF'
{
"searchTerms": [
"RealdataAPI"
],
"searchMode": "live",
"profilesDesired": 10,
"tweetsDesired": 100,
"mode": "replies",
"proxyConfig": {
"useRealdataAPIProxy": true
},
"extendOutputFunction": "async ({ data, item, page, request, customData, RealdataAPI }) => {/n return item;/n}",
"extendScraperFunction": "async ({ page, request, addSearch, addProfile, _, addThread, addEvent, customData, RealdataAPI, signal, label }) => {/n /n}",
"customData": {},
"handlePageTimeoutSecs": 500,
"maxRequestRetries": 6,
"maxIdleTimeoutSecs": 60
}
EOF
# Run the actor
curl "https://api.RealdataAPI.com/v2/acts/quacker~twitter-scraper/runs?token=$API_TOKEN" /
-X POST /
-d @input.json /
-H 'Content-Type: application/json'
searchTerms
Optional Array
The scraper will discover and scrape tweets for the search terms you add before starting the run. To search hashtags, begin the search term with #; for example, to search data analytics, use #dataanalytics. Otherwise, scroll down to scrape by URL or Twitter user profile.
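For example, a searchTerms value mixing a plain query and a hashtag could look like this:
"searchTerms": ["data analytics", "#dataanalytics"]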
searchMode
Optional String
This setting changes how Twitter sorts tweets before the scraper extracts them, e.g., top tweets, latest tweets, people, photos, or videos.
Allowed values: "top", "image", "user", "video"
profilesDesired
Optional Integer
Limits the number of profiles to scrape. It helps when you want to extract a set number of tweets from selected profiles.
tweetsDesired
Optional Integer
Sets the maximum number of tweets to scrape for every search term.
addTweetViewCount
Optional Boolean
Allows you to retrieve tweet view counts.
addUserInfo
Optional Boolean
Attaches user data to each tweet. You can reduce the dataset size by turning this feature off.
useCheerio
Optional Boolean
Use Cheerio instead of Puppeteer to scrape tweets. Cheerio can scrape all tweet posts quickly.
handle
Optional Array
Feed in the specific Twitter profile handles you want to scrape. This shortcut saves you from adding the complete profile URL for each username, like https://twitter.com/username.
mode
Optional String
Choose whether to scrape only tweets or tweets together with replies. Note that this applies only when scraping Twitter profiles.
startUrls
Optional Array
Sets the start locations for the scraper. You can enter Twitter links one by one or provide a link to a single file containing multiple links.
toDate
Optional String
Extract tweets posted after a specific date, in YYYY-MM-DD format. Use it together with fromDate to create a time-bounded slice.
fromDate
Optional String
Extract tweets posted before a specific date, in YYYY-MM-DD format. Use it together with toDate to create a time-bounded slice.
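For example, assuming the field semantics described above (toDate bounds the older end of the slice, fromDate the newer end), a slice covering January 2020 could look like this; verify the pairing against your own output:
"toDate": "2020-01-01",
"fromDate": "2020-02-01"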
useAdvancedSearch
Optional Boolean
Instead of the default search, use advanced search. It helps extract tweets by user handles, search terms, or date range. Note that this option doesn't scrape retweets.
proxyConfig
Required Object
Configure the proxy servers the scraper uses, e.g., the Real Data API proxy.
extendOutputFunction
Optional String
Add or remove properties on the result object, or omit the result entirely by returning a null value.
extendScraperFunction
Optional String
An advanced function that lets you extend the default scraper functionality and perform page actions manually.
customData
Optional Object
Any data you want available inside the extend output or extend scraper functions.
handlePageTimeoutSecs
Optional Integer
The maximum timeout for handlePageFunction; increase it for lengthy processes.
maxRequestRetries
Optional Integer
Sets the maximum number of retries per request.
maxIdleTimeoutSecs
Optional Integer
Sets how long the scraper may run without receiving any data before it stops.
debugLog
Optional Boolean
Enables the debug log.
initialCookies
Optional Array
The scraper will use these login cookies to bypass the login wall. For details, check the readme tab.
browserFallback
Optional Boolean
{
"searchTerms": [
"RealdataAPI"
],
"searchMode": "live",
"profilesDesired": 10,
"tweetsDesired": 100,
"addTweetViewCount": true,
"addUserInfo": true,
"useCheerio": true,
"mode": "replies",
"startUrls": [],
"useAdvancedSearch": false,
"proxyConfig": {
"useRealdataAPIProxy": true
},
"extendOutputFunction": "async ({ data, item, page, request, customData, RealdataAPI }) => {/n return item;/n}",
"extendScraperFunction": "async ({ page, request, addSearch, addProfile, _, addThread, addEvent, customData, RealdataAPI, signal, label }) => {/n /n}",
"customData": {},
"handlePageTimeoutSecs": 500,
"maxRequestRetries": 6,
"maxIdleTimeoutSecs": 60,
"debugLog": false
}