2018-11-29 17:33:44 +02:00
|
|
|
package twitterscraper
|
|
|
|
|
|
|
|
|
|
import (
|
2020-06-12 21:31:08 +08:00
|
|
|
"context"
|
2021-03-09 10:40:22 +02:00
|
|
|
"fmt"
|
2023-06-01 23:20:11 +03:00
|
|
|
"net/url"
|
2023-07-02 01:41:48 +03:00
|
|
|
"strconv"
|
2018-11-29 17:33:44 +02:00
|
|
|
)
|
|
|
|
|
|
2020-05-14 21:52:55 +03:00
|
|
|
// GetTweets returns channel with tweets for a given user.
|
2021-04-22 21:38:49 +03:00
|
|
|
func (s *Scraper) GetTweets(ctx context.Context, user string, maxTweetsNbr int) <-chan *TweetResult {
|
|
|
|
|
return getTweetTimeline(ctx, user, maxTweetsNbr, s.FetchTweets)
|
2020-12-12 23:33:57 +02:00
|
|
|
}
|
|
|
|
|
|
2020-05-14 21:52:55 +03:00
|
|
|
// FetchTweets gets tweets for a given user, via the Twitter frontend API.
|
2020-12-12 23:33:57 +02:00
|
|
|
func (s *Scraper) FetchTweets(user string, maxTweetsNbr int, cursor string) ([]*Tweet, string, error) {
|
|
|
|
|
userID, err := s.GetUserIDByScreenName(user)
|
2018-11-29 17:33:44 +02:00
|
|
|
if err != nil {
|
2020-12-11 20:58:49 +02:00
|
|
|
return nil, "", err
|
2018-11-29 17:33:44 +02:00
|
|
|
}
|
|
|
|
|
|
2023-07-02 01:41:48 +03:00
|
|
|
if s.isOpenAccount {
|
|
|
|
|
return s.FetchTweetsByUserIDLegacy(userID, maxTweetsNbr, cursor)
|
|
|
|
|
}
|
2023-05-10 06:09:11 -07:00
|
|
|
return s.FetchTweetsByUserID(userID, maxTweetsNbr, cursor)
|
|
|
|
|
}
|
|
|
|
|
|
2024-09-30 04:45:33 +03:00
|
|
|
// FetchTweetsAndRepliesByUserID gets tweets and replies for a given userID, via the Twitter frontend GraphQL API.
|
|
|
|
|
func (s *Scraper) FetchTweetsAndRepliesByUserID(userID string, maxReplysNbr int, cursor string) ([]*Tweet, string, error) {
|
|
|
|
|
if maxReplysNbr > 200 {
|
|
|
|
|
maxReplysNbr = 200
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
req, err := s.newRequest("GET", "https://twitter.com/i/api/graphql/bt4TKuFz4T7Ckk-VvQVSow/UserTweetsAndReplies")
|
|
|
|
|
if err != nil {
|
|
|
|
|
return nil, "", err
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
variables := map[string]interface{}{
|
|
|
|
|
"userId": userID,
|
|
|
|
|
"count": maxReplysNbr,
|
|
|
|
|
"includePromotedContent": false,
|
|
|
|
|
"withQuickPromoteEligibilityTweetFields": false,
|
|
|
|
|
"withVoice": true,
|
|
|
|
|
"withV2Timeline": true,
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
features := map[string]interface{}{
|
|
|
|
|
"rweb_tipjar_consumption_enabled": true,
|
|
|
|
|
"responsive_web_graphql_exclude_directive_enabled": true,
|
|
|
|
|
"verified_phone_label_enabled": false,
|
|
|
|
|
"creator_subscriptions_tweet_preview_api_enabled": true,
|
|
|
|
|
"responsive_web_graphql_timeline_navigation_enabled": true,
|
|
|
|
|
"responsive_web_graphql_skip_user_profile_image_extensions_enabled": false,
|
|
|
|
|
"communities_web_enable_tweet_community_results_fetch": true,
|
|
|
|
|
"c9s_tweet_anatomy_moderator_badge_enabled": true,
|
|
|
|
|
"articles_preview_enabled": true,
|
|
|
|
|
"responsive_web_edit_tweet_api_enabled": true,
|
|
|
|
|
"graphql_is_translatable_rweb_tweet_is_translatable_enabled": true,
|
|
|
|
|
"view_counts_everywhere_api_enabled": true,
|
|
|
|
|
"longform_notetweets_consumption_enabled": true,
|
|
|
|
|
"responsive_web_twitter_article_tweet_consumption_enabled": true,
|
|
|
|
|
"tweet_awards_web_tipping_enabled": false,
|
|
|
|
|
"creator_subscriptions_quote_tweet_preview_enabled": false,
|
|
|
|
|
"freedom_of_speech_not_reach_fetch_enabled": true,
|
|
|
|
|
"standardized_nudges_misinfo": true,
|
|
|
|
|
"tweet_with_visibility_results_prefer_gql_limited_actions_policy_enabled": true,
|
|
|
|
|
"rweb_video_timestamps_enabled": true,
|
|
|
|
|
"longform_notetweets_rich_text_read_enabled": true,
|
|
|
|
|
"longform_notetweets_inline_media_enabled": true,
|
|
|
|
|
"responsive_web_enhance_cards_enabled": false,
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if cursor != "" {
|
|
|
|
|
variables["cursor"] = cursor
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
query := url.Values{}
|
|
|
|
|
query.Set("variables", mapToJSONString(variables))
|
|
|
|
|
query.Set("features", mapToJSONString(features))
|
|
|
|
|
req.URL.RawQuery = query.Encode()
|
|
|
|
|
|
|
|
|
|
var timeline timelineV2
|
|
|
|
|
err = s.RequestAPI(req, &timeline)
|
|
|
|
|
if err != nil {
|
|
|
|
|
return nil, "", err
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
tweets, nextCursor := timeline.parseTweets()
|
|
|
|
|
return tweets, nextCursor, nil
|
|
|
|
|
}
|
|
|
|
|
|
2023-06-01 23:20:11 +03:00
|
|
|
// FetchTweetsByUserID gets tweets for a given userID, via the Twitter frontend GraphQL API.
|
2023-05-10 06:09:11 -07:00
|
|
|
func (s *Scraper) FetchTweetsByUserID(userID string, maxTweetsNbr int, cursor string) ([]*Tweet, string, error) {
|
|
|
|
|
if maxTweetsNbr > 200 {
|
|
|
|
|
maxTweetsNbr = 200
|
|
|
|
|
}
|
|
|
|
|
|
2023-06-01 23:20:11 +03:00
|
|
|
req, err := s.newRequest("GET", "https://twitter.com/i/api/graphql/UGi7tjRPr-d_U3bCPIko5Q/UserTweets")
|
2020-05-13 17:35:44 +02:00
|
|
|
if err != nil {
|
2020-12-11 20:58:49 +02:00
|
|
|
return nil, "", err
|
2020-05-13 17:35:44 +02:00
|
|
|
}
|
|
|
|
|
|
2023-06-01 23:20:11 +03:00
|
|
|
variables := map[string]interface{}{
|
|
|
|
|
"userId": userID,
|
|
|
|
|
"count": maxTweetsNbr,
|
|
|
|
|
"includePromotedContent": false,
|
|
|
|
|
"withQuickPromoteEligibilityTweetFields": false,
|
|
|
|
|
"withVoice": true,
|
|
|
|
|
"withV2Timeline": true,
|
|
|
|
|
}
|
|
|
|
|
features := map[string]interface{}{
|
|
|
|
|
"rweb_lists_timeline_redesign_enabled": true,
|
|
|
|
|
"responsive_web_graphql_exclude_directive_enabled": true,
|
|
|
|
|
"verified_phone_label_enabled": false,
|
|
|
|
|
"creator_subscriptions_tweet_preview_api_enabled": true,
|
|
|
|
|
"responsive_web_graphql_timeline_navigation_enabled": true,
|
|
|
|
|
"responsive_web_graphql_skip_user_profile_image_extensions_enabled": false,
|
|
|
|
|
"tweetypie_unmention_optimization_enabled": true,
|
|
|
|
|
"vibe_api_enabled": true,
|
|
|
|
|
"responsive_web_edit_tweet_api_enabled": true,
|
|
|
|
|
"graphql_is_translatable_rweb_tweet_is_translatable_enabled": true,
|
|
|
|
|
"view_counts_everywhere_api_enabled": true,
|
|
|
|
|
"longform_notetweets_consumption_enabled": true,
|
|
|
|
|
"tweet_awards_web_tipping_enabled": false,
|
|
|
|
|
"freedom_of_speech_not_reach_fetch_enabled": true,
|
|
|
|
|
"standardized_nudges_misinfo": true,
|
|
|
|
|
"tweet_with_visibility_results_prefer_gql_limited_actions_policy_enabled": false,
|
|
|
|
|
"interactive_text_enabled": true,
|
|
|
|
|
"responsive_web_text_conversations_enabled": false,
|
|
|
|
|
"longform_notetweets_rich_text_read_enabled": true,
|
|
|
|
|
"longform_notetweets_inline_media_enabled": false,
|
|
|
|
|
"responsive_web_enhance_cards_enabled": false,
|
|
|
|
|
}
|
|
|
|
|
|
2020-12-11 20:58:49 +02:00
|
|
|
if cursor != "" {
|
2023-06-01 23:20:11 +03:00
|
|
|
variables["cursor"] = cursor
|
2020-12-11 20:58:49 +02:00
|
|
|
}
|
2020-05-13 17:35:44 +02:00
|
|
|
|
2023-06-01 23:20:11 +03:00
|
|
|
query := url.Values{}
|
|
|
|
|
query.Set("variables", mapToJSONString(variables))
|
|
|
|
|
query.Set("features", mapToJSONString(features))
|
|
|
|
|
req.URL.RawQuery = query.Encode()
|
|
|
|
|
|
|
|
|
|
var timeline timelineV2
|
2020-12-12 23:33:57 +02:00
|
|
|
err = s.RequestAPI(req, &timeline)
|
2020-02-12 10:45:19 +02:00
|
|
|
if err != nil {
|
2020-12-11 20:58:49 +02:00
|
|
|
return nil, "", err
|
2020-02-12 10:45:19 +02:00
|
|
|
}
|
2018-11-29 17:33:44 +02:00
|
|
|
|
2021-07-16 11:08:43 +03:00
|
|
|
tweets, nextCursor := timeline.parseTweets()
|
2020-12-11 20:58:49 +02:00
|
|
|
return tweets, nextCursor, nil
|
2018-11-29 17:33:44 +02:00
|
|
|
}
|
2021-03-09 10:40:22 +02:00
|
|
|
|
2023-07-02 01:41:48 +03:00
|
|
|
// FetchTweetsByUserIDLegacy gets tweets for a given userID, via the Twitter frontend legacy API.
|
|
|
|
|
func (s *Scraper) FetchTweetsByUserIDLegacy(userID string, maxTweetsNbr int, cursor string) ([]*Tweet, string, error) {
|
|
|
|
|
if maxTweetsNbr > 200 {
|
|
|
|
|
maxTweetsNbr = 200
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
req, err := s.newRequest("GET", "https://api.twitter.com/2/timeline/profile/"+userID+".json")
|
2021-03-09 10:40:22 +02:00
|
|
|
if err != nil {
|
2023-07-02 01:41:48 +03:00
|
|
|
return nil, "", err
|
2021-03-09 10:40:22 +02:00
|
|
|
}
|
|
|
|
|
|
2023-07-02 01:41:48 +03:00
|
|
|
q := req.URL.Query()
|
|
|
|
|
q.Add("count", strconv.Itoa(maxTweetsNbr))
|
|
|
|
|
q.Add("userId", userID)
|
|
|
|
|
if cursor != "" {
|
|
|
|
|
q.Add("cursor", cursor)
|
2023-06-01 23:20:11 +03:00
|
|
|
}
|
2023-07-02 01:41:48 +03:00
|
|
|
req.URL.RawQuery = q.Encode()
|
2023-06-01 23:20:11 +03:00
|
|
|
|
2023-07-02 01:41:48 +03:00
|
|
|
var timeline timelineV1
|
|
|
|
|
err = s.RequestAPI(req, &timeline)
|
|
|
|
|
if err != nil {
|
|
|
|
|
return nil, "", err
|
2023-06-01 23:20:11 +03:00
|
|
|
}
|
|
|
|
|
|
2023-07-02 01:41:48 +03:00
|
|
|
tweets, nextCursor := timeline.parseTweets()
|
|
|
|
|
return tweets, nextCursor, nil
|
|
|
|
|
}
|
2023-06-01 23:20:11 +03:00
|
|
|
|
2023-07-02 01:41:48 +03:00
|
|
|
// GetTweet get a single tweet by ID.
|
|
|
|
|
func (s *Scraper) GetTweet(id string) (*Tweet, error) {
|
|
|
|
|
if s.isOpenAccount {
|
|
|
|
|
req, err := s.newRequest("GET", "https://api.twitter.com/2/timeline/conversation/"+id+".json")
|
|
|
|
|
if err != nil {
|
|
|
|
|
return nil, err
|
|
|
|
|
}
|
2023-06-18 19:13:26 +02:00
|
|
|
|
2023-07-02 01:41:48 +03:00
|
|
|
var timeline timelineV1
|
|
|
|
|
err = s.RequestAPI(req, &timeline)
|
|
|
|
|
if err != nil {
|
|
|
|
|
return nil, err
|
|
|
|
|
}
|
2023-06-18 19:13:26 +02:00
|
|
|
|
2023-07-02 01:41:48 +03:00
|
|
|
tweets, _ := timeline.parseTweets()
|
|
|
|
|
for _, tweet := range tweets {
|
|
|
|
|
if tweet.ID == id {
|
|
|
|
|
return tweet, nil
|
|
|
|
|
}
|
|
|
|
|
}
|
2024-03-08 18:43:26 +03:00
|
|
|
} else if s.isLogged {
|
2023-07-02 01:41:48 +03:00
|
|
|
req, err := s.newRequest("GET", "https://twitter.com/i/api/graphql/VWFGPVAGkZMGRKGe3GFFnA/TweetDetail")
|
|
|
|
|
if err != nil {
|
|
|
|
|
return nil, err
|
|
|
|
|
}
|
2023-06-18 19:13:26 +02:00
|
|
|
|
2023-07-02 01:41:48 +03:00
|
|
|
variables := map[string]interface{}{
|
|
|
|
|
"focalTweetId": id,
|
|
|
|
|
"with_rux_injections": false,
|
|
|
|
|
"includePromotedContent": true,
|
|
|
|
|
"withCommunity": true,
|
|
|
|
|
"withQuickPromoteEligibilityTweetFields": true,
|
|
|
|
|
"withBirdwatchNotes": true,
|
|
|
|
|
"withVoice": true,
|
|
|
|
|
"withV2Timeline": true,
|
|
|
|
|
}
|
2023-06-18 19:13:26 +02:00
|
|
|
|
2023-07-02 01:41:48 +03:00
|
|
|
features := map[string]interface{}{
|
|
|
|
|
"rweb_lists_timeline_redesign_enabled": true,
|
|
|
|
|
"responsive_web_graphql_exclude_directive_enabled": true,
|
|
|
|
|
"verified_phone_label_enabled": false,
|
|
|
|
|
"creator_subscriptions_tweet_preview_api_enabled": true,
|
|
|
|
|
"responsive_web_graphql_timeline_navigation_enabled": true,
|
|
|
|
|
"responsive_web_graphql_skip_user_profile_image_extensions_enabled": false,
|
|
|
|
|
"tweetypie_unmention_optimization_enabled": true,
|
|
|
|
|
"responsive_web_edit_tweet_api_enabled": true,
|
|
|
|
|
"graphql_is_translatable_rweb_tweet_is_translatable_enabled": true,
|
|
|
|
|
"view_counts_everywhere_api_enabled": true,
|
|
|
|
|
"longform_notetweets_consumption_enabled": true,
|
|
|
|
|
"tweet_awards_web_tipping_enabled": false,
|
|
|
|
|
"freedom_of_speech_not_reach_fetch_enabled": true,
|
|
|
|
|
"standardized_nudges_misinfo": true,
|
|
|
|
|
"tweet_with_visibility_results_prefer_gql_limited_actions_policy_enabled": false,
|
|
|
|
|
"longform_notetweets_rich_text_read_enabled": true,
|
|
|
|
|
"longform_notetweets_inline_media_enabled": true,
|
|
|
|
|
"responsive_web_enhance_cards_enabled": false,
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
query := url.Values{}
|
|
|
|
|
query.Set("variables", mapToJSONString(variables))
|
|
|
|
|
query.Set("features", mapToJSONString(features))
|
|
|
|
|
req.URL.RawQuery = query.Encode()
|
|
|
|
|
|
|
|
|
|
var conversation threadedConversation
|
|
|
|
|
|
|
|
|
|
// Surprisingly, if bearerToken2 is not set, then animated GIFs are not
|
|
|
|
|
// present in the response for tweets with a GIF + a photo like this one:
|
|
|
|
|
// https://twitter.com/Twitter/status/1580661436132757506
|
|
|
|
|
curBearerToken := s.bearerToken
|
|
|
|
|
if curBearerToken != bearerToken2 {
|
|
|
|
|
s.setBearerToken(bearerToken2)
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
err = s.RequestAPI(req, &conversation)
|
|
|
|
|
|
|
|
|
|
if curBearerToken != bearerToken2 {
|
|
|
|
|
s.setBearerToken(curBearerToken)
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if err != nil {
|
|
|
|
|
return nil, err
|
|
|
|
|
}
|
2021-03-09 10:40:22 +02:00
|
|
|
|
2024-08-01 17:39:06 +03:00
|
|
|
tweets, _ := conversation.parse(id)
|
2023-07-02 01:41:48 +03:00
|
|
|
for _, tweet := range tweets {
|
|
|
|
|
if tweet.ID == id {
|
|
|
|
|
return tweet, nil
|
|
|
|
|
}
|
2021-03-09 10:40:22 +02:00
|
|
|
}
|
2024-03-08 18:43:26 +03:00
|
|
|
} else {
|
|
|
|
|
req, err := s.newRequest("GET", "https://twitter.com/i/api/graphql/xBtHv5-Xsk268T5ng_OGNg/TweetResultByRestId")
|
|
|
|
|
if err != nil {
|
|
|
|
|
return nil, err
|
|
|
|
|
}
|
|
|
|
|
variables := map[string]interface{}{
|
|
|
|
|
"tweetId": id,
|
|
|
|
|
"withCommunity": false,
|
|
|
|
|
"includePromotedContent": false,
|
|
|
|
|
"withVoice": false,
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
features := map[string]interface{}{
|
|
|
|
|
"creator_subscriptions_tweet_preview_api_enabled": true,
|
|
|
|
|
"c9s_tweet_anatomy_moderator_badge_enabled": true,
|
|
|
|
|
"tweetypie_unmention_optimization_enabled": true,
|
|
|
|
|
"responsive_web_edit_tweet_api_enabled": true,
|
|
|
|
|
"graphql_is_translatable_rweb_tweet_is_translatable_enabled": true,
|
|
|
|
|
"view_counts_everywhere_api_enabled": true,
|
|
|
|
|
"longform_notetweets_consumption_enabled": true,
|
|
|
|
|
"responsive_web_twitter_article_tweet_consumption_enabled": true,
|
|
|
|
|
"tweet_awards_web_tipping_enabled": false,
|
|
|
|
|
"freedom_of_speech_not_reach_fetch_enabled": true,
|
|
|
|
|
"standardized_nudges_misinfo": true,
|
|
|
|
|
"tweet_with_visibility_results_prefer_gql_limited_actions_policy_enabled": true,
|
|
|
|
|
"rweb_video_timestamps_enabled": true,
|
|
|
|
|
"longform_notetweets_rich_text_read_enabled": true,
|
|
|
|
|
"longform_notetweets_inline_media_enabled": true,
|
|
|
|
|
"responsive_web_graphql_exclude_directive_enabled": true,
|
|
|
|
|
"verified_phone_label_enabled": false,
|
|
|
|
|
"responsive_web_graphql_skip_user_profile_image_extensions_enabled": false,
|
|
|
|
|
"responsive_web_graphql_timeline_navigation_enabled": true,
|
|
|
|
|
"responsive_web_enhance_cards_enabled": false,
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
fieldToggles := map[string]interface{}{"withArticleRichContentState": true}
|
|
|
|
|
|
|
|
|
|
query := url.Values{}
|
|
|
|
|
query.Set("variables", mapToJSONString(variables))
|
|
|
|
|
query.Set("features", mapToJSONString(features))
|
|
|
|
|
query.Set("fieldToggles", mapToJSONString(fieldToggles))
|
|
|
|
|
req.URL.RawQuery = query.Encode()
|
|
|
|
|
|
|
|
|
|
var result tweetResult
|
|
|
|
|
|
|
|
|
|
// Surprisingly, if bearerToken2 is not set, then animated GIFs are not
|
|
|
|
|
// present in the response for tweets with a GIF + a photo like this one:
|
|
|
|
|
// https://twitter.com/Twitter/status/1580661436132757506
|
|
|
|
|
curBearerToken := s.bearerToken
|
|
|
|
|
if curBearerToken != bearerToken2 {
|
|
|
|
|
s.setBearerToken(bearerToken2)
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
err = s.RequestAPI(req, &result)
|
|
|
|
|
|
|
|
|
|
if curBearerToken != bearerToken2 {
|
|
|
|
|
s.setBearerToken(curBearerToken)
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if err != nil {
|
|
|
|
|
return nil, err
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
tweet := result.parse()
|
|
|
|
|
return tweet, nil
|
2021-03-09 10:40:22 +02:00
|
|
|
}
|
|
|
|
|
return nil, fmt.Errorf("tweet with ID %s not found", id)
|
|
|
|
|
}
|
2024-04-07 19:18:59 +02:00
|
|
|
|
|
|
|
|
type homeEntry struct {
|
|
|
|
|
EntryId string `json:"entryId"`
|
|
|
|
|
SortIndex string `json:"sortIndex"`
|
|
|
|
|
Content struct {
|
|
|
|
|
EntryType string `json:"entryType"`
|
|
|
|
|
ItemContent struct {
|
|
|
|
|
ItemType string `json:"itemType"`
|
|
|
|
|
TweetResults struct {
|
|
|
|
|
Result result `json:"result"`
|
|
|
|
|
} `json:"tweet_results"`
|
|
|
|
|
} `json:"itemContent"`
|
2024-07-09 05:02:19 +03:00
|
|
|
Cursor string `json:"value"`
|
|
|
|
|
CursorType string `json:"cursorType"`
|
2024-04-07 19:18:59 +02:00
|
|
|
} `json:"content"`
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
// timeline v2 JSON object
|
|
|
|
|
type homeTimeline struct {
|
|
|
|
|
Data struct {
|
|
|
|
|
Home struct {
|
|
|
|
|
HomeTimeline struct {
|
|
|
|
|
Instructions []struct {
|
|
|
|
|
Entries []homeEntry `json:"entries"`
|
|
|
|
|
Type string `json:"type"`
|
|
|
|
|
} `json:"instructions"`
|
|
|
|
|
Metadata struct {
|
|
|
|
|
SribeConfig []struct {
|
|
|
|
|
Page string `json:"page"`
|
|
|
|
|
} `json:"scribe_config"`
|
|
|
|
|
} `json:"metadata"`
|
|
|
|
|
} `json:"home_timeline_urt"`
|
|
|
|
|
} `json:"home"`
|
|
|
|
|
} `json:"data"`
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
func (timeline *homeTimeline) parseTweets() ([]*Tweet, string) {
|
|
|
|
|
var cursor string
|
|
|
|
|
var tweets []*Tweet
|
|
|
|
|
for _, instruction := range timeline.Data.Home.HomeTimeline.Instructions {
|
|
|
|
|
for _, entry := range instruction.Entries {
|
2024-07-09 05:02:19 +03:00
|
|
|
if entry.Content.CursorType == "Bottom" {
|
|
|
|
|
cursor = entry.Content.Cursor
|
|
|
|
|
} else if entry.Content.ItemContent.TweetResults.Result.Typename == "Tweet" {
|
2024-04-07 19:18:59 +02:00
|
|
|
if tweet := entry.Content.ItemContent.TweetResults.Result.parse(); tweet != nil {
|
|
|
|
|
tweets = append(tweets, tweet)
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
return tweets, cursor
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
// GetHomeTweets returns channel with tweets from home timeline
|
|
|
|
|
func (s *Scraper) GetHomeTweets(ctx context.Context, maxTweetsNbr int) <-chan *TweetResult {
|
2024-07-09 05:37:03 +03:00
|
|
|
return getTweetTimeline(ctx, "", maxTweetsNbr, s.fetchHomeTweets)
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
func (s *Scraper) FetchHomeTweets(maxTweetsNbr int, cursor string) ([]*Tweet, string, error) {
|
|
|
|
|
return s.fetchHomeTweets("", maxTweetsNbr, cursor)
|
2024-04-07 19:18:59 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
// FetchHomeTweets gets tweets from home timline, via the Twitter frontend API.
|
2024-07-09 05:37:03 +03:00
|
|
|
func (s *Scraper) fetchHomeTweets(_ string, maxTweetsNbr int, cursor string) ([]*Tweet, string, error) {
|
2024-04-07 19:18:59 +02:00
|
|
|
if maxTweetsNbr > 200 {
|
|
|
|
|
maxTweetsNbr = 200
|
|
|
|
|
}
|
|
|
|
|
|
2024-07-09 04:48:31 +03:00
|
|
|
req, err := s.newRequest("GET", "https://twitter.com/i/api/graphql/9EwYy8pLBOSFlEoSP2STiQ/HomeLatestTimeline")
|
2024-04-07 19:18:59 +02:00
|
|
|
if err != nil {
|
|
|
|
|
return nil, "", err
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
variables := map[string]interface{}{
|
|
|
|
|
"count": maxTweetsNbr,
|
|
|
|
|
"includePromotedContent": true,
|
|
|
|
|
"withQuickPromoteEligibilityTweetFields": true,
|
|
|
|
|
"requestContext": "launch",
|
|
|
|
|
}
|
2024-07-09 05:02:19 +03:00
|
|
|
|
|
|
|
|
if cursor != "" {
|
|
|
|
|
variables["cursor"] = cursor
|
|
|
|
|
}
|
|
|
|
|
|
2024-04-07 19:18:59 +02:00
|
|
|
features := map[string]interface{}{
|
2024-07-09 04:48:31 +03:00
|
|
|
"rweb_tipjar_consumption_enabled": true,
|
2024-04-07 19:18:59 +02:00
|
|
|
"responsive_web_graphql_exclude_directive_enabled": true,
|
|
|
|
|
"verified_phone_label_enabled": false,
|
|
|
|
|
"creator_subscriptions_tweet_preview_api_enabled": true,
|
|
|
|
|
"responsive_web_graphql_timeline_navigation_enabled": true,
|
2024-07-09 05:20:49 +03:00
|
|
|
"responsive_web_graphql_skip_user_profile_image_extensions_enabled": false,
|
|
|
|
|
"communities_web_enable_tweet_community_results_fetch": true,
|
|
|
|
|
"c9s_tweet_anatomy_moderator_badge_enabled": true,
|
|
|
|
|
"articles_preview_enabled": true,
|
|
|
|
|
"tweetypie_unmention_optimization_enabled": true,
|
|
|
|
|
"responsive_web_edit_tweet_api_enabled": true,
|
|
|
|
|
"graphql_is_translatable_rweb_tweet_is_translatable_enabled": true,
|
|
|
|
|
"view_counts_everywhere_api_enabled": true,
|
|
|
|
|
"longform_notetweets_consumption_enabled": true,
|
|
|
|
|
"responsive_web_twitter_article_tweet_consumption_enabled": true,
|
|
|
|
|
"tweet_awards_web_tipping_enabled": false,
|
|
|
|
|
"creator_subscriptions_quote_tweet_preview_enabled": false,
|
|
|
|
|
"freedom_of_speech_not_reach_fetch_enabled": true,
|
|
|
|
|
"standardized_nudges_misinfo": true,
|
|
|
|
|
"tweet_with_visibility_results_prefer_gql_limited_actions_policy_enabled": true,
|
|
|
|
|
"rweb_video_timestamps_enabled": true,
|
|
|
|
|
"longform_notetweets_rich_text_read_enabled": true,
|
|
|
|
|
"longform_notetweets_inline_media_enabled": true,
|
|
|
|
|
"responsive_web_enhance_cards_enabled": false,
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
req.Header.Set("content-type", "application/json")
|
|
|
|
|
|
|
|
|
|
query := url.Values{}
|
|
|
|
|
query.Set("variables", mapToJSONString(variables))
|
|
|
|
|
query.Set("features", mapToJSONString(features))
|
|
|
|
|
req.URL.RawQuery = query.Encode()
|
|
|
|
|
|
|
|
|
|
var timeline homeTimeline
|
|
|
|
|
err = s.RequestAPI(req, &timeline)
|
|
|
|
|
if err != nil {
|
|
|
|
|
return nil, "", err
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
tweets, nextCursor := timeline.parseTweets()
|
|
|
|
|
return tweets, nextCursor, nil
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
// GetForYouTweets returns channel with tweets from for you timeline
|
|
|
|
|
func (s *Scraper) GetForYouTweets(ctx context.Context, maxTweetsNbr int) <-chan *TweetResult {
|
2024-07-09 05:37:03 +03:00
|
|
|
return getTweetTimeline(ctx, "", maxTweetsNbr, s.fetchForYouTweets)
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
func (s *Scraper) FetchForYouTweets(maxTweetsNbr int, cursor string) ([]*Tweet, string, error) {
|
|
|
|
|
return s.fetchForYouTweets("", maxTweetsNbr, cursor)
|
2024-07-09 05:20:49 +03:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
// FetchForYouTweets gets tweets from for you timline, via the Twitter frontend API.
|
2024-07-09 05:37:03 +03:00
|
|
|
func (s *Scraper) fetchForYouTweets(_ string, maxTweetsNbr int, cursor string) ([]*Tweet, string, error) {
|
2024-07-09 05:20:49 +03:00
|
|
|
if maxTweetsNbr > 200 {
|
|
|
|
|
maxTweetsNbr = 200
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
req, err := s.newRequest("GET", "https://twitter.com/i/api/graphql/1u0Wlkw6Ru1NwBUD-pDiww/HomeTimeline")
|
|
|
|
|
if err != nil {
|
|
|
|
|
return nil, "", err
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
variables := map[string]interface{}{
|
|
|
|
|
"count": maxTweetsNbr,
|
|
|
|
|
"includePromotedContent": true,
|
|
|
|
|
"latestControlAvailable": true,
|
|
|
|
|
"requestContext": "launch",
|
|
|
|
|
"withCommunity": true,
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if cursor != "" {
|
|
|
|
|
variables["cursor"] = cursor
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
features := map[string]interface{}{
|
|
|
|
|
"rweb_tipjar_consumption_enabled": true,
|
|
|
|
|
"responsive_web_graphql_exclude_directive_enabled": true,
|
|
|
|
|
"verified_phone_label_enabled": false,
|
|
|
|
|
"creator_subscriptions_tweet_preview_api_enabled": true,
|
|
|
|
|
"responsive_web_graphql_timeline_navigation_enabled": true,
|
2024-04-07 19:18:59 +02:00
|
|
|
"responsive_web_graphql_skip_user_profile_image_extensions_enabled": false,
|
|
|
|
|
"communities_web_enable_tweet_community_results_fetch": true,
|
|
|
|
|
"c9s_tweet_anatomy_moderator_badge_enabled": true,
|
2024-07-09 04:48:31 +03:00
|
|
|
"articles_preview_enabled": true,
|
2024-04-07 19:18:59 +02:00
|
|
|
"tweetypie_unmention_optimization_enabled": true,
|
|
|
|
|
"responsive_web_edit_tweet_api_enabled": true,
|
|
|
|
|
"graphql_is_translatable_rweb_tweet_is_translatable_enabled": true,
|
|
|
|
|
"view_counts_everywhere_api_enabled": true,
|
|
|
|
|
"longform_notetweets_consumption_enabled": true,
|
|
|
|
|
"responsive_web_twitter_article_tweet_consumption_enabled": true,
|
|
|
|
|
"tweet_awards_web_tipping_enabled": false,
|
2024-07-09 04:48:31 +03:00
|
|
|
"creator_subscriptions_quote_tweet_preview_enabled": false,
|
2024-04-07 19:18:59 +02:00
|
|
|
"freedom_of_speech_not_reach_fetch_enabled": true,
|
|
|
|
|
"standardized_nudges_misinfo": true,
|
|
|
|
|
"tweet_with_visibility_results_prefer_gql_limited_actions_policy_enabled": true,
|
|
|
|
|
"rweb_video_timestamps_enabled": true,
|
|
|
|
|
"longform_notetweets_rich_text_read_enabled": true,
|
|
|
|
|
"longform_notetweets_inline_media_enabled": true,
|
|
|
|
|
"responsive_web_enhance_cards_enabled": false,
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
req.Header.Set("content-type", "application/json")
|
|
|
|
|
|
2024-07-09 04:48:31 +03:00
|
|
|
query := url.Values{}
|
|
|
|
|
query.Set("variables", mapToJSONString(variables))
|
|
|
|
|
query.Set("features", mapToJSONString(features))
|
|
|
|
|
req.URL.RawQuery = query.Encode()
|
2024-04-07 19:18:59 +02:00
|
|
|
|
|
|
|
|
var timeline homeTimeline
|
|
|
|
|
err = s.RequestAPI(req, &timeline)
|
|
|
|
|
if err != nil {
|
|
|
|
|
return nil, "", err
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
tweets, nextCursor := timeline.parseTweets()
|
|
|
|
|
return tweets, nextCursor, nil
|
|
|
|
|
}
|