2020-02-12 10:45:19 +02:00
|
|
|
package twitterscraper
|
|
|
|
|
|
|
|
|
|
import (
|
|
|
|
|
"encoding/json"
|
|
|
|
|
"fmt"
|
|
|
|
|
"net/http"
|
|
|
|
|
"strings"
|
|
|
|
|
)
|
|
|
|
|
|
2020-06-15 11:59:30 +03:00
|
|
|
func newRequest(url string) (*http.Request, error) {
|
|
|
|
|
req, err := http.NewRequest("GET", url, nil)
|
|
|
|
|
if err != nil {
|
|
|
|
|
return nil, err
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
req.Header.Set("Accept", "application/json, text/javascript, */*; q=0.01")
|
|
|
|
|
req.Header.Set("Accept-Language", "en-US")
|
|
|
|
|
req.Header.Set("User-Agent", "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_12_6) AppleWebKit/603.3.8 (KHTML, like Gecko) Version/10.1.2 Safari/603.3.8")
|
|
|
|
|
req.Header.Set("X-Twitter-Active-User", "yes")
|
|
|
|
|
req.Header.Set("X-Requested-With", "XMLHttpRequest")
|
|
|
|
|
|
|
|
|
|
return req, nil
|
|
|
|
|
}
|
|
|
|
|
|
2020-02-12 10:45:19 +02:00
|
|
|
func getHTMLFromJSON(req *http.Request, field string) (*strings.Reader, error) {
|
|
|
|
|
resp, err := http.DefaultClient.Do(req)
|
|
|
|
|
if err != nil {
|
|
|
|
|
return nil, err
|
|
|
|
|
}
|
|
|
|
|
defer resp.Body.Close()
|
|
|
|
|
|
|
|
|
|
if resp.StatusCode != http.StatusOK {
|
|
|
|
|
return nil, fmt.Errorf("response status: %s", resp.Status)
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
ajaxJSON := make(map[string]interface{})
|
|
|
|
|
err = json.NewDecoder(resp.Body).Decode(&ajaxJSON)
|
|
|
|
|
if err != nil {
|
|
|
|
|
return nil, err
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
htm, ok := ajaxJSON[field].(string)
|
|
|
|
|
if !ok {
|
2020-09-19 00:57:03 +03:00
|
|
|
return nil, fmt.Errorf("field %s not found in JSON", field)
|
2020-02-12 10:45:19 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return strings.NewReader(htm), nil
|
|
|
|
|
}
|