From 5e1d9316e7b3012278aa08f68d04fa415670cfd0 Mon Sep 17 00:00:00 2001 From: Denis Koltsov Date: Sun, 7 Apr 2024 19:18:59 +0200 Subject: [PATCH] Initial stub at GetHomeTweets --- tweets.go | 118 ++++++++++++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 118 insertions(+) diff --git a/tweets.go b/tweets.go index 618cd20..a122c47 100644 --- a/tweets.go +++ b/tweets.go @@ -1,8 +1,11 @@ package twitterscraper import ( + "bytes" "context" + "encoding/json" "fmt" + "io" "net/url" "strconv" ) @@ -273,3 +276,118 @@ func (s *Scraper) GetTweet(id string) (*Tweet, error) { } return nil, fmt.Errorf("tweet with ID %s not found", id) } + +type homeEntry struct { + EntryId string `json:"entryId"` + SortIndex string `json:"sortIndex"` + Content struct { + EntryType string `json:"entryType"` + ItemContent struct { + ItemType string `json:"itemType"` + TweetResults struct { + Result result `json:"result"` + } `json:"tweet_results"` + } `json:"itemContent"` + } `json:"content"` +} + +// timeline v2 JSON object +type homeTimeline struct { + Data struct { + Home struct { + HomeTimeline struct { + Instructions []struct { + Entries []homeEntry `json:"entries"` + Type string `json:"type"` + } `json:"instructions"` + Metadata struct { + SribeConfig []struct { + Page string `json:"page"` + } `json:"scribe_config"` + } `json:"metadata"` + } `json:"home_timeline_urt"` + } `json:"home"` + } `json:"data"` +} + +func (timeline *homeTimeline) parseTweets() ([]*Tweet, string) { + var cursor string + var tweets []*Tweet + for _, instruction := range timeline.Data.Home.HomeTimeline.Instructions { + for _, entry := range instruction.Entries { + if entry.Content.ItemContent.TweetResults.Result.Typename == "Tweet" { + if tweet := entry.Content.ItemContent.TweetResults.Result.parse(); tweet != nil { + tweets = append(tweets, tweet) + } + } + } + } + return tweets, cursor +} + +// GetHomeTweets returns channel with tweets from home timeline +func (s *Scraper) GetHomeTweets(ctx context.Context, maxTweetsNbr int) <-chan *TweetResult { + return getTweetTimeline(ctx, "", maxTweetsNbr, s.FetchHomeTweets) +} + +// FetchHomeTweets gets tweets from home timline, via the Twitter frontend API. +func (s *Scraper) FetchHomeTweets(_ string, maxTweetsNbr int, cursor string) ([]*Tweet, string, error) { + if maxTweetsNbr > 200 { + maxTweetsNbr = 200 + } + + req, err := s.newRequest("POST", "https://twitter.com/i/api/graphql/MquF6747JmE_NQYdkIH0OQ/HomeLatestTimeline") + if err != nil { + return nil, "", err + } + + variables := map[string]interface{}{ + "count": maxTweetsNbr, + "includePromotedContent": true, + "withQuickPromoteEligibilityTweetFields": true, + "requestContext": "launch", + } + features := map[string]interface{}{ + "rweb_tipjar_consumption_enabled": false, + "responsive_web_graphql_exclude_directive_enabled": true, + "verified_phone_label_enabled": false, + "creator_subscriptions_tweet_preview_api_enabled": true, + "responsive_web_graphql_timeline_navigation_enabled": true, + "responsive_web_graphql_skip_user_profile_image_extensions_enabled": false, + "communities_web_enable_tweet_community_results_fetch": true, + "c9s_tweet_anatomy_moderator_badge_enabled": true, + "tweetypie_unmention_optimization_enabled": true, + "responsive_web_edit_tweet_api_enabled": true, + "graphql_is_translatable_rweb_tweet_is_translatable_enabled": true, + "view_counts_everywhere_api_enabled": true, + "longform_notetweets_consumption_enabled": true, + "responsive_web_twitter_article_tweet_consumption_enabled": true, + "tweet_awards_web_tipping_enabled": false, + "freedom_of_speech_not_reach_fetch_enabled": true, + "standardized_nudges_misinfo": true, + "tweet_with_visibility_results_prefer_gql_limited_actions_policy_enabled": true, + "rweb_video_timestamps_enabled": true, + "longform_notetweets_rich_text_read_enabled": true, + "longform_notetweets_inline_media_enabled": true, + "responsive_web_enhance_cards_enabled": false, + } + + req.Header.Set("content-type", "application/json") + body := map[string]interface{}{ + "variables": variables, + "features": features, + "queryId": "CTOVqej0JBXAZSwkp1US0g", + } + + b, _ := json.Marshal(body) + req.Body = io.NopCloser(bytes.NewReader(b)) + + var timeline homeTimeline + err = s.RequestAPI(req, &timeline) + if err != nil { + return nil, "", err + } + + tweets, nextCursor := timeline.parseTweets() + return tweets, nextCursor, nil +}