Initial stub at GetHomeTweets

This commit is contained in:
Denis Koltsov 2024-04-07 19:18:59 +02:00
parent 6a0f92e314
commit 5e1d9316e7
No known key found for this signature in database
GPG key ID: EE5EC460D5BF2118

118
tweets.go
View file

@ -1,8 +1,11 @@
package twitterscraper
import (
"bytes"
"context"
"encoding/json"
"fmt"
"io"
"net/url"
"strconv"
)
@ -273,3 +276,118 @@ func (s *Scraper) GetTweet(id string) (*Tweet, error) {
}
return nil, fmt.Errorf("tweet with ID %s not found", id)
}
type homeEntry struct {
EntryId string `json:"entryId"`
SortIndex string `json:"sortIndex"`
Content struct {
EntryType string `json:"entryType"`
ItemContent struct {
ItemType string `json:"itemType"`
TweetResults struct {
Result result `json:"result"`
} `json:"tweet_results"`
} `json:"itemContent"`
} `json:"content"`
}
// timeline v2 JSON object
type homeTimeline struct {
Data struct {
Home struct {
HomeTimeline struct {
Instructions []struct {
Entries []homeEntry `json:"entries"`
Type string `json:"type"`
} `json:"instructions"`
Metadata struct {
SribeConfig []struct {
Page string `json:"page"`
} `json:"scribe_config"`
} `json:"metadata"`
} `json:"home_timeline_urt"`
} `json:"home"`
} `json:"data"`
}
func (timeline *homeTimeline) parseTweets() ([]*Tweet, string) {
var cursor string
var tweets []*Tweet
for _, instruction := range timeline.Data.Home.HomeTimeline.Instructions {
for _, entry := range instruction.Entries {
if entry.Content.ItemContent.TweetResults.Result.Typename == "Tweet" {
if tweet := entry.Content.ItemContent.TweetResults.Result.parse(); tweet != nil {
tweets = append(tweets, tweet)
}
}
}
}
return tweets, cursor
}
// GetHomeTweets returns channel with tweets from home timeline
func (s *Scraper) GetHomeTweets(ctx context.Context, maxTweetsNbr int) <-chan *TweetResult {
return getTweetTimeline(ctx, "", maxTweetsNbr, s.FetchHomeTweets)
}
// FetchHomeTweets gets tweets from home timline, via the Twitter frontend API.
func (s *Scraper) FetchHomeTweets(_ string, maxTweetsNbr int, cursor string) ([]*Tweet, string, error) {
if maxTweetsNbr > 200 {
maxTweetsNbr = 200
}
req, err := s.newRequest("POST", "https://twitter.com/i/api/graphql/MquF6747JmE_NQYdkIH0OQ/HomeLatestTimeline")
if err != nil {
return nil, "", err
}
variables := map[string]interface{}{
"count": maxTweetsNbr,
"includePromotedContent": true,
"withQuickPromoteEligibilityTweetFields": true,
"requestContext": "launch",
}
features := map[string]interface{}{
"rweb_tipjar_consumption_enabled": false,
"responsive_web_graphql_exclude_directive_enabled": true,
"verified_phone_label_enabled": false,
"creator_subscriptions_tweet_preview_api_enabled": true,
"responsive_web_graphql_timeline_navigation_enabled": true,
"responsive_web_graphql_skip_user_profile_image_extensions_enabled": false,
"communities_web_enable_tweet_community_results_fetch": true,
"c9s_tweet_anatomy_moderator_badge_enabled": true,
"tweetypie_unmention_optimization_enabled": true,
"responsive_web_edit_tweet_api_enabled": true,
"graphql_is_translatable_rweb_tweet_is_translatable_enabled": true,
"view_counts_everywhere_api_enabled": true,
"longform_notetweets_consumption_enabled": true,
"responsive_web_twitter_article_tweet_consumption_enabled": true,
"tweet_awards_web_tipping_enabled": false,
"freedom_of_speech_not_reach_fetch_enabled": true,
"standardized_nudges_misinfo": true,
"tweet_with_visibility_results_prefer_gql_limited_actions_policy_enabled": true,
"rweb_video_timestamps_enabled": true,
"longform_notetweets_rich_text_read_enabled": true,
"longform_notetweets_inline_media_enabled": true,
"responsive_web_enhance_cards_enabled": false,
}
req.Header.Set("content-type", "application/json")
body := map[string]interface{}{
"variables": variables,
"features": features,
"queryId": "CTOVqej0JBXAZSwkp1US0g",
}
b, _ := json.Marshal(body)
req.Body = io.NopCloser(bytes.NewReader(b))
var timeline homeTimeline
err = s.RequestAPI(req, &timeline)
if err != nil {
return nil, "", err
}
tweets, nextCursor := timeline.parseTweets()
return tweets, nextCursor, nil
}