blob: 832bc7a9503673b4440cb33470c579fa97f2fac8 (
plain) (
blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
|
// This Source Code Form is subject to the terms of the Mozilla Public
// License, v. 2.0. If a copy of the MPL was not distributed with this
// file, You can obtain one at http://mozilla.org/MPL/2.0/.
package proxy
import (
"crypto/tls"
"math/rand"
"net/http"
"net/url"
"github.com/philippta/flyscrape"
)
func init() {
flyscrape.RegisterModule(Module{})
}
// Module routes outgoing HTTP requests through configured proxy servers.
// Its exported fields are populated from the JSON keys named in their tags.
type Module struct {
// Proxies is a list of proxy URLs. Provision builds one transport for
// every non-empty entry that parses as a URL.
Proxies []string `json:"proxies"`
// Proxy is a single proxy URL that Provision processes after the
// entries of Proxies.
Proxy string `json:"proxy"`
// transports holds one HTTP transport per proxy URL accepted by
// Provision; AdaptTransport picks one of them at random per request.
transports []*http.Transport
}
// ModuleInfo returns the module's registration data: the ID "proxy" and a
// constructor that yields a fresh, zero-valued *Module.
func (Module) ModuleInfo() flyscrape.ModuleInfo {
	construct := func() flyscrape.Module { return &Module{} }

	return flyscrape.ModuleInfo{
		ID:  "proxy",
		New: construct,
	}
}
// Provision builds one HTTP transport per configured proxy URL and stores
// them in m.transports. It does nothing when the module is disabled.
//
// The URLs in Proxies are processed first, followed by Proxy. Empty strings
// and URLs that fail to parse are skipped. The ctx argument is not used.
func (m *Module) Provision(ctx flyscrape.Context) {
	if m.disabled() {
		return
	}

	// Collect the candidates in a fresh slice. Appending m.Proxy directly onto
	// m.Proxies could write into spare capacity of the exported slice's
	// backing array and thereby alias configuration data.
	candidates := make([]string, 0, len(m.Proxies)+1)
	candidates = append(candidates, m.Proxies...)
	candidates = append(candidates, m.Proxy)

	for _, raw := range candidates {
		if raw == "" {
			continue
		}

		parsed, err := url.Parse(raw)
		if err != nil {
			// Provision has no error return, so an unparseable proxy URL is
			// deliberately skipped instead of aborting the remaining ones.
			continue
		}

		m.transports = append(m.transports, &http.Transport{
			Proxy: http.ProxyURL(parsed),
			// NOTE(review): certificate verification is turned off for all
			// traffic sent through the proxy; confirm this is intended.
			TLSClientConfig: &tls.Config{InsecureSkipVerify: true},
		})
	}
}
// AdaptTransport wraps t so that each request is sent through one of the
// provisioned proxy transports, chosen at random per request.
//
// When the module is disabled, t is returned unchanged. When the module is
// enabled but no usable proxy transport exists (for example because every
// configured URL was empty or failed to parse), requests are forwarded to t
// instead of panicking in rand.Intn, which does not accept 0.
func (m *Module) AdaptTransport(t http.RoundTripper) http.RoundTripper {
	if m.disabled() {
		return t
	}

	return flyscrape.RoundTripFunc(func(r *http.Request) (*http.Response, error) {
		// Read the pool at request time so the check and the random pick
		// operate on the same slice value.
		pool := m.transports
		if len(pool) == 0 {
			return t.RoundTrip(r)
		}
		return pool[rand.Intn(len(pool))].RoundTrip(r)
	})
}
// disabled reports whether no proxy has been configured at all, i.e. the
// Proxies list is empty and the single Proxy field is unset. Checking both
// fields ensures a configuration that only sets Proxy still enables the
// module.
func (m *Module) disabled() bool {
	return len(m.Proxies) == 0 && m.Proxy == ""
}
|