twitter-scrapper/api.go

116 lines
2.4 KiB
Go
Raw Normal View History

package twitterscraper
import (
"encoding/json"
"fmt"
2023-05-10 22:24:32 +03:00
"io"
"net/http"
2021-01-05 14:21:08 +02:00
"time"
)
// bearerToken is a hard-coded bearer token value.
// NOTE(review): the requests in this file send the Scraper's bearerToken
// field, not this constant; presumably the field is initialised from this
// value where the Scraper is constructed — confirm against the constructor.
const bearerToken = "AAAAAAAAAAAAAAAAAAAAAPYXBAAAAAAACLXUNDekMxqa8h%2F40K4moUkGsoc%3DTYfbDKbT3jJPCEVnMYqilB28NHfOPqkca3qaAxGfsyKCs0wRbw"
2020-12-12 23:33:57 +02:00
// RequestAPI get JSON from frontend API and decodes it
func (s *Scraper) RequestAPI(req *http.Request, target interface{}) error {
s.wg.Wait()
if s.delay > 0 {
defer func() {
s.wg.Add(1)
go func() {
time.Sleep(time.Second * time.Duration(s.delay))
s.wg.Done()
}()
}()
}
2023-05-10 11:42:47 +03:00
if !s.isLogged {
if !s.IsGuestToken() || s.guestCreatedAt.Before(time.Now().Add(-time.Hour*3)) {
err := s.GetGuestToken()
if err != nil {
return err
}
}
2023-05-10 11:42:47 +03:00
req.Header.Set("X-Guest-Token", s.guestToken)
}
2023-05-30 17:31:00 +03:00
if s.oAuthToken != "" && s.oAuthSecret != "" {
req.Header.Set("Authorization", s.sign(req.Method, req.URL))
} else {
req.Header.Set("Authorization", "Bearer "+s.bearerToken)
}
for _, cookie := range s.client.Jar.Cookies(req.URL) {
if cookie.Name == "ct0" {
req.Header.Set("X-CSRF-Token", cookie.Value)
break
}
2021-09-08 16:02:53 +08:00
}
2020-12-12 23:33:57 +02:00
resp, err := s.client.Do(req)
if err != nil {
return err
}
defer resp.Body.Close()
2023-05-10 22:24:32 +03:00
content, err := io.ReadAll(resp.Body)
if err != nil {
return err
}
2024-03-09 03:54:20 +03:00
statusOK := resp.StatusCode >= 200 && resp.StatusCode < 300
if !statusOK {
return fmt.Errorf("response status %s: %s", resp.Status, content)
2021-01-05 11:42:51 +02:00
}
if resp.Header.Get("X-Rate-Limit-Remaining") == "0" {
s.guestToken = ""
}
2023-05-10 22:24:32 +03:00
if target == nil {
return nil
}
2023-05-10 22:24:32 +03:00
return json.Unmarshal(content, target)
}
2020-12-12 23:33:57 +02:00
// GetGuestToken from Twitter API
func (s *Scraper) GetGuestToken() error {
req, err := http.NewRequest("POST", "https://api.twitter.com/1.1/guest/activate.json", nil)
if err != nil {
return err
}
2022-04-18 12:42:39 +03:00
req.Header.Set("Authorization", "Bearer "+s.bearerToken)
2020-12-12 23:33:57 +02:00
resp, err := s.client.Do(req)
if err != nil {
return err
}
defer resp.Body.Close()
2023-05-10 22:24:32 +03:00
body, err := io.ReadAll(resp.Body)
if err != nil {
return err
}
2022-04-09 20:00:09 +03:00
if resp.StatusCode != http.StatusOK {
return fmt.Errorf("response status %s: %s", resp.Status, body)
}
var jsn map[string]interface{}
if err := json.Unmarshal(body, &jsn); err != nil {
return err
}
var ok bool
2020-12-12 23:33:57 +02:00
if s.guestToken, ok = jsn["guest_token"].(string); !ok {
return fmt.Errorf("guest_token not found")
}
2021-01-05 14:21:08 +02:00
s.guestCreatedAt = time.Now()
return nil
}
2024-02-20 23:27:22 +03:00
// ClearGuestToken discards the stored guest token and resets its creation
// time to the zero time.Time. It always returns nil.
func (s *Scraper) ClearGuestToken() error {
	s.guestToken, s.guestCreatedAt = "", time.Time{}
	return nil
}