twitter-scrapper/util.go

49 lines
1.2 KiB
Go
Raw Normal View History

2020-02-12 10:45:19 +02:00
package twitterscraper
import (
"encoding/json"
"fmt"
"net/http"
"strings"
)
func newRequest(url string) (*http.Request, error) {
req, err := http.NewRequest("GET", url, nil)
if err != nil {
return nil, err
}
req.Header.Set("Accept", "application/json, text/javascript, */*; q=0.01")
req.Header.Set("Accept-Language", "en-US")
req.Header.Set("User-Agent", "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_12_6) AppleWebKit/603.3.8 (KHTML, like Gecko) Version/10.1.2 Safari/603.3.8")
req.Header.Set("X-Twitter-Active-User", "yes")
req.Header.Set("X-Requested-With", "XMLHttpRequest")
return req, nil
}
2020-02-12 10:45:19 +02:00
func getHTMLFromJSON(req *http.Request, field string) (*strings.Reader, error) {
resp, err := http.DefaultClient.Do(req)
if err != nil {
return nil, err
}
defer resp.Body.Close()
if resp.StatusCode != http.StatusOK {
return nil, fmt.Errorf("response status: %s", resp.Status)
}
ajaxJSON := make(map[string]interface{})
err = json.NewDecoder(resp.Body).Decode(&ajaxJSON)
if err != nil {
return nil, err
}
htm, ok := ajaxJSON[field].(string)
if !ok {
2020-09-19 00:57:03 +03:00
return nil, fmt.Errorf("field %s not found in JSON", field)
2020-02-12 10:45:19 +02:00
}
return strings.NewReader(htm), nil
}