mirror of
https://github.com/kubernetes-sigs/kustomize.git
synced 2026-05-18 04:05:21 +00:00
694 lines
18 KiB
Go
694 lines
18 KiB
Go
// Package github implements the crawler.Crawler interface, getting data
|
|
// from the Github search API.
|
|
package github
|
|
|
|
import (
|
|
"context"
|
|
"encoding/json"
|
|
"fmt"
|
|
"io/ioutil"
|
|
"log"
|
|
"math"
|
|
"net/http"
|
|
"os"
|
|
"regexp"
|
|
"strconv"
|
|
"strings"
|
|
"time"
|
|
|
|
"sigs.k8s.io/kustomize/api/internal/crawl/crawler"
|
|
"sigs.k8s.io/kustomize/api/internal/crawl/doc"
|
|
"sigs.k8s.io/kustomize/api/internal/crawl/httpclient"
|
|
"sigs.k8s.io/kustomize/api/internal/git"
|
|
"sigs.k8s.io/kustomize/api/konfig"
|
|
)
|
|
|
|
var logger = log.New(os.Stdout, "Github Crawler: ",
|
|
log.LstdFlags|log.LUTC|log.Llongfile)
|
|
|
|
// Implements crawler.Crawler.
|
|
type githubCrawler struct {
|
|
client GhClient
|
|
query Query
|
|
// branchMap maps github repositories to their default branches
|
|
branchMap map[string]string
|
|
}
|
|
|
|
type GhClient struct {
|
|
RequestConfig
|
|
retryCount uint64
|
|
client *http.Client
|
|
accessToken string
|
|
}
|
|
|
|
func NewCrawler(accessToken string, retryCount uint64, client *http.Client,
|
|
query Query) githubCrawler {
|
|
|
|
return githubCrawler{
|
|
client: GhClient{
|
|
retryCount: retryCount,
|
|
client: client,
|
|
RequestConfig: RequestConfig{
|
|
perPage: githubMaxPageSize,
|
|
},
|
|
accessToken: accessToken,
|
|
},
|
|
query: query,
|
|
branchMap: map[string]string{},
|
|
}
|
|
}
|
|
|
|
func (gc githubCrawler) SetDefaultBranch(repo, branch string) {
|
|
gc.branchMap[repo] = branch
|
|
}
|
|
|
|
func (gc githubCrawler) DefaultBranch(repo string) string {
|
|
return gc.branchMap[repo]
|
|
}
|
|
|
|
// Implements crawler.Crawler.
|
|
func (gc githubCrawler) Crawl(ctx context.Context,
|
|
output chan<- crawler.CrawledDocument, seen crawler.SeenMap) error {
|
|
|
|
noETagClient := GhClient{
|
|
RequestConfig: gc.client.RequestConfig,
|
|
client: &http.Client{Timeout: gc.client.client.Timeout},
|
|
retryCount: gc.client.retryCount,
|
|
accessToken: gc.client.accessToken,
|
|
}
|
|
|
|
// Since Github returns a max of 1000 results per query, we can use
|
|
// multiple queries that split the search space into chunks of at most
|
|
// 1000 files to get all of the data.
|
|
ranges, err := FindRangesForRepoSearch(newCache(noETagClient, gc.query))
|
|
if err != nil {
|
|
return fmt.Errorf("could not split %v into ranges, %v\n",
|
|
gc.query, err)
|
|
}
|
|
|
|
logger.Println("ranges: ", ranges)
|
|
|
|
// Query each range for files.
|
|
errs := make(multiError, 0)
|
|
queryResult := RangeQueryResult{}
|
|
for _, query := range ranges {
|
|
rangeResult, err := processQuery(ctx, gc.client, query, output, seen, gc.branchMap)
|
|
if err != nil {
|
|
errs = append(errs, err)
|
|
}
|
|
queryResult.Add(rangeResult)
|
|
}
|
|
|
|
logger.Printf("Summary of Crawl: %s", queryResult.String())
|
|
|
|
if len(errs) > 0 {
|
|
return errs
|
|
}
|
|
|
|
return nil
|
|
}
|
|
|
|
// FetchDocument first tries to fetch the document with d.FilePath. If it fails,
|
|
// it will try to add each string in konfig.RecognizedKustomizationFileNames() to
|
|
// d.FilePath, and try to fetch the document again.
|
|
func (gc githubCrawler) FetchDocument(_ context.Context, d *doc.Document) error {
|
|
// set the default branch if it is empty
|
|
if d.DefaultBranch == "" {
|
|
url := gc.client.ReposRequest(d.RepositoryFullName())
|
|
defaultBranch, err := gc.client.GetDefaultBranch(url, d.RepositoryURL, gc.branchMap)
|
|
if err != nil {
|
|
logger.Printf(
|
|
"(error: %v) setting default_branch to master\n", err)
|
|
defaultBranch = "master"
|
|
}
|
|
d.DefaultBranch = defaultBranch
|
|
}
|
|
gc.SetDefaultBranch(d.RepositoryURL, d.DefaultBranch)
|
|
|
|
repoURL := d.RepositoryURL + "/" + d.FilePath + "?ref=" + d.DefaultBranch
|
|
repoSpec, err := git.NewRepoSpecFromUrl(repoURL)
|
|
if err != nil {
|
|
return fmt.Errorf("invalid repospec: %v", err)
|
|
}
|
|
|
|
url := "https://raw.githubusercontent.com/" + repoSpec.OrgRepo +
|
|
"/" + repoSpec.Ref + "/" + repoSpec.Path
|
|
|
|
handle := func(resp *http.Response, err error, path string) error {
|
|
if resp == nil {
|
|
return fmt.Errorf("empty http response (url: %s; path: %s), error: %v",
|
|
url, path, err)
|
|
}
|
|
if err == nil && resp.StatusCode == http.StatusOK {
|
|
d.IsSame = httpclient.FromCache(resp.Header)
|
|
defer CloseResponseBody(resp)
|
|
data, err := ioutil.ReadAll(resp.Body)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
d.DocumentData = string(data)
|
|
d.FilePath = d.FilePath + path
|
|
return nil
|
|
}
|
|
|
|
return err
|
|
}
|
|
resp, errGetRawUserContent := gc.client.GetRawUserContent(url)
|
|
if err := handle(resp, errGetRawUserContent, ""); err == nil {
|
|
return nil
|
|
}
|
|
|
|
for _, file := range konfig.RecognizedKustomizationFileNames() {
|
|
resp, errGetRawUserContent = gc.client.GetRawUserContent(url + "/" + file)
|
|
if err = handle(resp, errGetRawUserContent, "/"+file); err == nil {
|
|
return nil
|
|
}
|
|
}
|
|
return fmt.Errorf("file not found: %s, error: %v", url, err)
|
|
}
|
|
|
|
func (gc githubCrawler) SetCreated(_ context.Context, d *doc.Document) error {
|
|
fs := GhFileSpec{
|
|
Path: d.FilePath,
|
|
Repository: GitRepository{
|
|
FullName: d.RepositoryFullName(),
|
|
},
|
|
}
|
|
creationTime, err := gc.client.GetFileCreationTime(fs)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
d.CreationTime = &creationTime
|
|
return nil
|
|
}
|
|
|
|
func (gc githubCrawler) Match(d *doc.Document) bool {
|
|
url := d.RepositoryURL + "/" + d.FilePath + "?ref=" + "/" +
|
|
d.DefaultBranch
|
|
repoSpec, err := git.NewRepoSpecFromUrl(url)
|
|
if err != nil {
|
|
return false
|
|
}
|
|
|
|
return strings.Contains(repoSpec.Host, "github.com")
|
|
}
|
|
|
|
type RangeQueryResult struct {
|
|
totalDocCnt uint64
|
|
seenDocCnt uint64
|
|
newDocCnt uint64
|
|
errorCnt uint64
|
|
}
|
|
|
|
func (r *RangeQueryResult) Add(other RangeQueryResult) {
|
|
r.totalDocCnt += other.totalDocCnt
|
|
r.newDocCnt += other.newDocCnt
|
|
r.seenDocCnt += other.seenDocCnt
|
|
r.errorCnt += other.errorCnt
|
|
}
|
|
|
|
func (r *RangeQueryResult) String() string {
|
|
return fmt.Sprintf("got %d files from API. "+
|
|
"%d have been seen before. %d are new and sent to the output channel." +
|
|
" %d have kustomizationResultAdapter errors.",
|
|
r.totalDocCnt, r.seenDocCnt, r.newDocCnt, r.errorCnt)
|
|
}
|
|
|
|
// processQuery follows all of the pages in a query, and updates/adds the
|
|
// documents from the crawl to the datastore/index.
|
|
func processQuery(ctx context.Context, gcl GhClient, query string,
|
|
output chan<- crawler.CrawledDocument, seen crawler.SeenMap,
|
|
branchMap map[string]string) (RangeQueryResult, error) {
|
|
|
|
queryPages := make(chan GhResponseInfo)
|
|
|
|
go func() {
|
|
// Forward the document metadata to the retrieval channel.
|
|
// This separation allows for concurrent requests for the code
|
|
// search, and the retrieval portions of the API.
|
|
err := gcl.ForwardPaginatedQuery(ctx, query, queryPages)
|
|
if err != nil {
|
|
// TODO(damienr74) handle this error with redis?
|
|
logger.Println(err)
|
|
}
|
|
close(queryPages)
|
|
}()
|
|
|
|
errs := make(multiError, 0)
|
|
result := RangeQueryResult{}
|
|
pageID := 1
|
|
for page := range queryPages {
|
|
if page.Error != nil {
|
|
errs = append(errs, page.Error)
|
|
continue
|
|
}
|
|
pageResult := RangeQueryResult{}
|
|
for _, file := range page.Parsed.Items {
|
|
k, err := kustomizationResultAdapter(gcl, file, seen, branchMap)
|
|
if err != nil {
|
|
logger.Printf("kustomizationResultAdapter failed: %v", err)
|
|
errs = append(errs, err)
|
|
pageResult.errorCnt++
|
|
}
|
|
if k != nil {
|
|
pageResult.newDocCnt++
|
|
output <- k
|
|
} else {
|
|
pageResult.seenDocCnt++
|
|
}
|
|
pageResult.totalDocCnt++
|
|
}
|
|
|
|
logger.Printf("processQuery [TotalCount %d - page %d]: %s",
|
|
page.Parsed.TotalCount, pageID, pageResult.String())
|
|
result.Add(pageResult)
|
|
|
|
pageID++
|
|
}
|
|
|
|
logger.Printf("Summary of processQuery: %s", result.String())
|
|
|
|
return result, errs
|
|
}
|
|
|
|
func kustomizationResultAdapter(gcl GhClient, k GhFileSpec, seen crawler.SeenMap,
|
|
branchMap map[string]string) (crawler.CrawledDocument, error) {
|
|
url := gcl.ReposRequest(k.Repository.FullName)
|
|
defaultBranch, err := gcl.GetDefaultBranch(url, k.Repository.URL, branchMap)
|
|
if err != nil {
|
|
logger.Printf(
|
|
"(error: %v) setting default_branch to master\n", err)
|
|
defaultBranch = "master"
|
|
}
|
|
|
|
document := doc.Document{
|
|
FilePath: k.Path,
|
|
DefaultBranch: defaultBranch,
|
|
RepositoryURL: k.Repository.URL,
|
|
}
|
|
|
|
if seen.Seen(document.ID()) {
|
|
return nil, nil
|
|
}
|
|
|
|
data, err := gcl.GetFileData(k)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
d := doc.KustomizationDocument{
|
|
Document: doc.Document{
|
|
DocumentData: string(data),
|
|
FilePath: k.Path,
|
|
DefaultBranch: defaultBranch,
|
|
RepositoryURL: k.Repository.URL,
|
|
},
|
|
}
|
|
creationTime, err := gcl.GetFileCreationTime(k)
|
|
if err != nil {
|
|
logger.Printf("GetFileCreationTime failed: %v", err)
|
|
return &d, err
|
|
}
|
|
d.CreationTime = &creationTime
|
|
|
|
if err := d.ParseYAML(); err != nil {
|
|
logger.Printf("ParseYAML failed: %v", err)
|
|
return &d, err
|
|
}
|
|
|
|
return &d, nil
|
|
}
|
|
|
|
// ForwardPaginatedQuery follows the links to the next pages and performs all of
|
|
// the queries for a given search query, relaying the data from each request
|
|
// back to an output channel.
|
|
func (gcl GhClient) ForwardPaginatedQuery(ctx context.Context, query string,
|
|
output chan<- GhResponseInfo) error {
|
|
|
|
logger.Println("querying: ", query)
|
|
response := gcl.parseGithubResponse(query)
|
|
|
|
if response.Error != nil {
|
|
return response.Error
|
|
}
|
|
|
|
output <- response
|
|
|
|
for response.LastURL != "" && response.NextURL != "" {
|
|
select {
|
|
case <-ctx.Done():
|
|
return nil
|
|
default:
|
|
response = gcl.parseGithubResponse(response.NextURL)
|
|
if response.Error != nil {
|
|
return response.Error
|
|
}
|
|
|
|
output <- response
|
|
}
|
|
}
|
|
|
|
return nil
|
|
}
|
|
|
|
// GetFileData gets the bytes from a file.
|
|
func (gcl GhClient) GetFileData(k GhFileSpec) ([]byte, error) {
|
|
|
|
url := gcl.ContentsRequest(k.Repository.FullName, k.Path)
|
|
|
|
resp, err := gcl.GetReposData(url)
|
|
if err != nil {
|
|
return nil, fmt.Errorf("%+v: could not get '%s' metadata: %v",
|
|
k, url, err)
|
|
}
|
|
|
|
data, err := ioutil.ReadAll(resp.Body)
|
|
if err != nil {
|
|
return nil, fmt.Errorf("%+v: could not read '%s' metadata: %v",
|
|
k, url, err)
|
|
}
|
|
|
|
if err := resp.Body.Close(); err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
type githubContentRawURL struct {
|
|
DownloadURL string `json:"download_url,omitempty"`
|
|
}
|
|
var rawURL githubContentRawURL
|
|
err = json.Unmarshal(data, &rawURL)
|
|
if err != nil {
|
|
return nil, fmt.Errorf(
|
|
"%+v: could not get 'download_url' from '%s' response: %v",
|
|
k, data, err)
|
|
}
|
|
|
|
resp, err = gcl.GetRawUserContent(rawURL.DownloadURL)
|
|
if err != nil {
|
|
return nil, fmt.Errorf("%+v: could not fetch file raw data '%s': %v",
|
|
k, rawURL.DownloadURL, err)
|
|
}
|
|
|
|
defer CloseResponseBody(resp)
|
|
data, err = ioutil.ReadAll(resp.Body)
|
|
return data, err
|
|
}
|
|
|
|
func CloseResponseBody(resp *http.Response) {
|
|
if err := resp.Body.Close(); err != nil {
|
|
log.Printf("failed to close response body: %v", err)
|
|
}
|
|
}
|
|
|
|
// GetDefaultBranch gets the default branch of a github repository.
|
|
// m is a map which maps a github repository to its default branch.
|
|
// If repo is already in m, the default branch for url will be obtained from m;
|
|
// otherwise, a query will be made to github to obtain the default branch.
|
|
func (gcl GhClient) GetDefaultBranch(url, repo string, m map[string]string) (string, error) {
|
|
if v, ok := m[repo]; ok {
|
|
return v, nil
|
|
}
|
|
|
|
resp, err := gcl.GetReposData(url)
|
|
if err != nil {
|
|
return "", fmt.Errorf(
|
|
"'%s' could not get default_branch: %v", url, err)
|
|
}
|
|
defer CloseResponseBody(resp)
|
|
data, err := ioutil.ReadAll(resp.Body)
|
|
if err != nil {
|
|
return "", fmt.Errorf(
|
|
"could not read default_branch: %v", err)
|
|
}
|
|
|
|
type defaultBranch struct {
|
|
DefaultBranch string `json:"default_branch,omitempty"`
|
|
}
|
|
var branch defaultBranch
|
|
err = json.Unmarshal(data, &branch)
|
|
if err != nil {
|
|
return "", fmt.Errorf(
|
|
"default_branch json malformed: %v", err)
|
|
}
|
|
|
|
return branch.DefaultBranch, nil
|
|
}
|
|
|
|
// GetFileCreationTime gets the earliest date of a file.
|
|
func (gcl GhClient) GetFileCreationTime(
|
|
k GhFileSpec) (time.Time, error) {
|
|
|
|
url := gcl.CommitsRequest(k.Repository.FullName, k.Path)
|
|
|
|
defaultTime := time.Now()
|
|
|
|
resp, err := gcl.GetReposData(url)
|
|
if err != nil {
|
|
return defaultTime, fmt.Errorf(
|
|
"%+v: '%s' could not get metadata: %v", k, url, err)
|
|
}
|
|
|
|
type DateSpec struct {
|
|
Commit struct {
|
|
Author struct {
|
|
Date string `json:"date,omitempty"`
|
|
} `json:"author,omitempty"`
|
|
} `json:"commit,omitempty"`
|
|
}
|
|
|
|
_, lastURL := parseGithubLinkFormat(resp.Header.Get("link"))
|
|
if lastURL != "" {
|
|
resp, err = gcl.GetReposData(lastURL)
|
|
if err != nil {
|
|
return defaultTime, fmt.Errorf(
|
|
"%+v: '%s' could not get metadata: %v",
|
|
k, lastURL, err)
|
|
}
|
|
}
|
|
|
|
defer CloseResponseBody(resp)
|
|
data, err := ioutil.ReadAll(resp.Body)
|
|
if err != nil {
|
|
return defaultTime, fmt.Errorf(
|
|
"%+v: failed to read metadata: %v", k, err)
|
|
}
|
|
var earliestDate []DateSpec
|
|
err = json.Unmarshal(data, &earliestDate)
|
|
size := len(earliestDate)
|
|
if err != nil || size == 0 {
|
|
return defaultTime, fmt.Errorf(
|
|
"%+v: server response '%s' not in expected format: %v",
|
|
k, data, err)
|
|
}
|
|
|
|
return time.Parse(time.RFC3339, earliestDate[size-1].Commit.Author.Date)
|
|
}
|
|
|
|
// TODO(damienr74) change the tickers to actually check api rate limits, reset
|
|
// times, and throttle requests dynamically based off of current utilization,
|
|
// instead of hardcoding the documented values, these calls are not quota'd.
|
|
// This is now especially important, since caching the API requests will reduce
|
|
// API quota use (so we can actually make more requests in the allotted time
|
|
// period).
|
|
//
|
|
// See https://developer.github.com/v3/rate_limit/ for details.
|
|
var (
|
|
searchRateTicker = time.NewTicker(time.Second * 2)
|
|
contentRateTicker = time.NewTicker(time.Second * 1)
|
|
)
|
|
|
|
func throttleSearchAPI() {
|
|
<-searchRateTicker.C
|
|
}
|
|
|
|
func throttleRepoAPI() {
|
|
<-contentRateTicker.C
|
|
}
|
|
|
|
type multiError []error
|
|
|
|
func (e multiError) Error() string {
|
|
size := len(e) + 2
|
|
strs := make([]string, size)
|
|
strs[0] = "Errors ["
|
|
for i, err := range e {
|
|
strs[i+1] = "\t" + err.Error()
|
|
}
|
|
strs[size-1] = "]"
|
|
return strings.Join(strs, "\n")
|
|
}
|
|
|
|
type GitRepository struct {
|
|
API string `json:"url,omitempty"`
|
|
URL string `json:"html_url,omitempty"`
|
|
FullName string `json:"full_name,omitempty"`
|
|
}
|
|
|
|
type GhFileSpec struct {
|
|
Path string `json:"path,omitempty"`
|
|
Repository GitRepository `json:"repository,omitempty"`
|
|
}
|
|
|
|
type githubResponse struct {
|
|
// MaxUint is reserved as a sentinel value.
|
|
// This is the number of files that match the query.
|
|
TotalCount uint64 `json:"total_count,omitempty"`
|
|
|
|
// Github representation of a file.
|
|
Items []GhFileSpec `json:"items,omitempty"`
|
|
}
|
|
|
|
type GhResponseInfo struct {
|
|
*http.Response
|
|
Parsed *githubResponse
|
|
Error error
|
|
NextURL string
|
|
LastURL string
|
|
}
|
|
|
|
func parseGithubLinkFormat(links string) (string, string) {
|
|
const (
|
|
linkNext = "next"
|
|
linkLast = "last"
|
|
linkInfoURL = 1
|
|
linkInfoRel = 2
|
|
)
|
|
|
|
next, last := "", ""
|
|
linkInfo := regexp.MustCompile(`<(.*)>.*; rel="(last|next)"`)
|
|
|
|
for _, link := range strings.Split(links, ",") {
|
|
linkParse := linkInfo.FindStringSubmatch(link)
|
|
if len(linkParse) != 3 {
|
|
continue
|
|
}
|
|
|
|
url := linkParse[linkInfoURL]
|
|
switch linkParse[linkInfoRel] {
|
|
case linkNext:
|
|
next = url
|
|
case linkLast:
|
|
last = url
|
|
default:
|
|
}
|
|
}
|
|
|
|
return next, last
|
|
}
|
|
|
|
func (gcl GhClient) parseGithubResponse(getRequest string) GhResponseInfo {
|
|
resp, err := gcl.SearchGithubAPI(getRequest)
|
|
requestInfo := GhResponseInfo{
|
|
Response: resp,
|
|
Error: err,
|
|
Parsed: nil,
|
|
}
|
|
|
|
if err != nil || resp == nil {
|
|
return requestInfo
|
|
}
|
|
|
|
var data []byte
|
|
defer CloseResponseBody(resp)
|
|
data, requestInfo.Error = ioutil.ReadAll(resp.Body)
|
|
if requestInfo.Error != nil {
|
|
return requestInfo
|
|
}
|
|
|
|
if resp.StatusCode != http.StatusOK {
|
|
logger.Println("query: ", getRequest)
|
|
logger.Println("status not OK at the source")
|
|
logger.Println("header dump", resp.Header)
|
|
logger.Println("body dump", string(data))
|
|
requestInfo.Error = fmt.Errorf("request rejected, status '%s'",
|
|
resp.Status)
|
|
return requestInfo
|
|
}
|
|
|
|
requestInfo.NextURL, requestInfo.LastURL =
|
|
parseGithubLinkFormat(resp.Header.Get("link"))
|
|
|
|
resultCount := githubResponse{
|
|
TotalCount: math.MaxUint64,
|
|
}
|
|
requestInfo.Error = json.Unmarshal(data, &resultCount)
|
|
if requestInfo.Error != nil {
|
|
return requestInfo
|
|
}
|
|
|
|
requestInfo.Parsed = &resultCount
|
|
|
|
return requestInfo
|
|
|
|
}
|
|
|
|
// SearchGithubAPI performs a search query and handles rate limitting for
|
|
// the 'search/code?' endpoint as well as timed retries in the case of abuse
|
|
// prevention.
|
|
func (gcl GhClient) SearchGithubAPI(query string) (*http.Response, error) {
|
|
throttleSearchAPI()
|
|
return gcl.getWithRetry(query)
|
|
}
|
|
|
|
// GetReposData performs a search query and handles rate limitting for
|
|
// the '/repos' endpoint as well as timed retries in the case of abuse
|
|
// prevention.
|
|
func (gcl GhClient) GetReposData(query string) (*http.Response, error) {
|
|
throttleRepoAPI()
|
|
return gcl.getWithRetry(query)
|
|
}
|
|
|
|
// User content (file contents) is not API rate limited, so there's no use in
|
|
// throttling this call.
|
|
func (gcl GhClient) GetRawUserContent(query string) (*http.Response, error) {
|
|
return gcl.getWithRetry(query)
|
|
}
|
|
|
|
func (gcl GhClient) Do(query string) (*http.Response, error) {
|
|
req, err := http.NewRequest("GET", query, nil)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
req.Header.Add("Authorization", fmt.Sprintf("token %s", gcl.accessToken))
|
|
|
|
// gcl.client.Do: a non-2xx status code doesn't cause an error.
|
|
// See https://golang.org/pkg/net/http/#Client.Do for more info.
|
|
resp, err := gcl.client.Do(req)
|
|
if resp != nil && resp.StatusCode != http.StatusOK {
|
|
err = fmt.Errorf("GhClient.Do(%s) failed with response code: %d",
|
|
query, resp.StatusCode)
|
|
}
|
|
return resp, err
|
|
}
|
|
|
|
func (gcl GhClient) getWithRetry(
|
|
query string) (resp *http.Response, err error) {
|
|
|
|
resp, err = gcl.Do(query)
|
|
|
|
retryCount := gcl.retryCount
|
|
|
|
for resp != nil && resp.StatusCode == http.StatusForbidden && retryCount > 0 {
|
|
retryTime := resp.Header.Get("Retry-After")
|
|
i, errAtoi := strconv.Atoi(retryTime)
|
|
if errAtoi != nil {
|
|
return resp, fmt.Errorf(
|
|
"query '%s' forbidden without 'Retry-After'", query)
|
|
}
|
|
logger.Printf(
|
|
"status forbidden, retring %d more times\n", retryCount)
|
|
|
|
logger.Printf("waiting %d seconds before retrying\n", i)
|
|
time.Sleep(time.Second * time.Duration(i))
|
|
retryCount--
|
|
resp, err = gcl.Do(query)
|
|
}
|
|
|
|
if err != nil {
|
|
return resp, fmt.Errorf("query '%s' could not be processed, %v",
|
|
query, err)
|
|
}
|
|
|
|
return resp, err
|
|
}
|