summaryrefslogtreecommitdiff
path: root/modules/proxy/proxy.go
blob: 120a856ba1184e4326bb0934dbe87bc4ccc9c152 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
// This Source Code Form is subject to the terms of the Mozilla Public
// License, v. 2.0. If a copy of the MPL was not distributed with this
// file, You can obtain one at http://mozilla.org/MPL/2.0/.

package proxy

import (
	"crypto/tls"
	"errors"
	"math/rand"
	"net/http"
	"net/url"

	"github.com/philippta/flyscrape"
)

func init() {
	flyscrape.RegisterModule(Module{})
}

// Module is the proxy module. It holds the configured proxy URLs and the
// HTTP transports derived from them.
type Module struct {
	// Proxies is the list of proxy URLs, read from the "proxies" JSON key.
	// An empty list disables the module.
	Proxies []string `json:"proxies"`

	// transports holds one transport per entry of Proxies that could be
	// parsed as a URL. It is filled by Provision and read by the round
	// tripper returned from AdaptTransport.
	transports []*http.Transport
}

// ModuleInfo returns the module's registration data: the ID "proxy" and a
// constructor that yields a fresh, zero-valued *Module.
func (Module) ModuleInfo() flyscrape.ModuleInfo {
	newModule := func() flyscrape.Module {
		return &Module{}
	}

	return flyscrape.ModuleInfo{
		ID:  "proxy",
		New: newModule,
	}
}

// Provision builds one HTTP transport for every configured proxy URL and
// appends it to m.transports. It does nothing when the module is disabled.
//
// Entries that url.Parse rejects are skipped without reporting an error, so
// m.transports may end up shorter than m.Proxies. Each transport is created
// with TLS certificate verification turned off (InsecureSkipVerify).
//
// ctx is not used.
func (m *Module) Provision(ctx flyscrape.Context) {
	if m.disabled() {
		return
	}

	for _, raw := range m.Proxies {
		proxyURL, err := url.Parse(raw)
		if err != nil {
			// Best effort: an unparsable entry is simply left out.
			continue
		}

		tr := &http.Transport{
			Proxy:           http.ProxyURL(proxyURL),
			TLSClientConfig: &tls.Config{InsecureSkipVerify: true},
		}
		m.transports = append(m.transports, tr)
	}
}

// AdaptTransport returns the round tripper that should be used for outgoing
// requests.
//
// When the module is disabled (no proxies configured), t is returned
// unchanged. Otherwise the returned round tripper ignores t and sends each
// request through one of the module's proxy transports, picked at random per
// request.
//
// If proxies are configured but no transport is available (for example
// because every configured URL failed to parse, or Provision has not run),
// the round tripper returns an error for the request. Previously this case
// called rand.Intn(0), which panics. The request is failed rather than sent
// through t so that traffic is never silently sent without a proxy.
func (m *Module) AdaptTransport(t http.RoundTripper) http.RoundTripper {
	if m.disabled() {
		return t
	}

	return flyscrape.RoundTripFunc(func(r *http.Request) (*http.Response, error) {
		// Checked per request rather than once up front, so the outcome does
		// not depend on whether Provision ran before AdaptTransport.
		n := len(m.transports)
		if n == 0 {
			return nil, errors.New("proxy: no usable proxy configured")
		}

		return m.transports[rand.Intn(n)].RoundTrip(r)
	})
}

// disabled reports whether the module has nothing to do, i.e. no proxy URLs
// are configured.
func (m *Module) disabled() bool {
	configured := len(m.Proxies)
	return configured == 0
}