internal/fetcher/http.go (view raw)
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 | package fetcher import ( "context" "fmt" "io" "net/http" "strings" "time" "go.alanpearce.eu/searchix/internal/config" "github.com/andybalholm/brotli" "gitlab.com/tozd/go/errors" "go.alanpearce.eu/x/log" ) type brotliReadCloser struct { src io.ReadCloser *brotli.Reader } func newBrotliReader(src io.ReadCloser) *brotliReadCloser { return &brotliReadCloser{ src: src, Reader: brotli.NewReader(src), } } func (r *brotliReadCloser) Close() error { return errors.Wrap(r.src.Close(), "failed to call close on underlying reader") } func fetchFileIfNeeded( ctx context.Context, log *log.Logger, mtime time.Time, url string, ) (io.ReadCloser, time.Time, errors.E) { var newMtime time.Time var ifModifiedSince string if !mtime.IsZero() { ifModifiedSince = strings.Replace(mtime.UTC().Format(time.RFC1123), "UTC", "GMT", 1) } req, baseErr := http.NewRequestWithContext(ctx, "GET", url, http.NoBody) if baseErr != nil { return nil, newMtime, errors.WithMessagef( baseErr, "could not create HTTP request for %s", url, ) } req.Header.Set("User-Agent", fmt.Sprintf("Searchix %s", config.Version)) if ifModifiedSince != "" { req.Header.Set("If-Modified-Since", ifModifiedSince) } res, baseErr := http.DefaultClient.Do(req) if baseErr != nil { return nil, newMtime, errors.WithMessagef(baseErr, "could not make HTTP request to %s", url) } var body io.ReadCloser var err errors.E switch res.StatusCode { case http.StatusNotModified: newMtime = mtime return nil, newMtime, nil case http.StatusOK: var baseErr error newMtime, baseErr = time.Parse(time.RFC1123, res.Header.Get("Last-Modified")) if baseErr != nil { log.Warn( "could not parse Last-Modified header from response", "value", res.Header.Get("Last-Modified"), ) newMtime = time.Now() } switch ce := res.Header.Get("Content-Encoding"); ce { case "br": log.Debug("using brotli encoding") body = newBrotliReader(res.Body) case "", "identity", "gzip": body = res.Body default: err = errors.Errorf("cannot handle a body with content-encoding %s", ce) } default: err = errors.Errorf("got response code %d, don't know what to do", res.StatusCode) } return NewReadCloser(body), newMtime, err } |