1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
|
// This Source Code Form is subject to the terms of the Mozilla Public
// License, v. 2.0. If a copy of the MPL was not distributed with this
// file, You can obtain one at http://mozilla.org/MPL/2.0/.
package headers_test
import (
"fmt"
"net/http"
"reflect"
"testing"
"github.com/philippta/flyscrape"
"github.com/philippta/flyscrape/modules/headers"
"github.com/philippta/flyscrape/modules/hook"
"github.com/philippta/flyscrape/modules/starturl"
"github.com/stretchr/testify/require"
)
func TestHeaders(t *testing.T) {
testCases := []struct {
name string
headersFn func() headers.Module
wantHeaders map[string][]string
}{
{
name: "empty custom headers",
headersFn: func() headers.Module {
return headers.Module{
Headers: map[string]string{},
}
},
wantHeaders: map[string][]string{"User-Agent": {"flyscrape/0.1"}},
},
{
name: "no duplicate headers between default and custom",
headersFn: func() headers.Module {
return headers.Module{
Headers: map[string]string{
"Authorization": "Basic ZGVtbzpwQDU1dzByZA==",
},
}
},
wantHeaders: map[string][]string{
"Authorization": {"Basic ZGVtbzpwQDU1dzByZA=="},
"User-Agent": {"flyscrape/0.1"},
},
},
{
name: "duplicate headers between default and custom",
headersFn: func() headers.Module {
return headers.Module{
Headers: map[string]string{
"Authorization": "Basic ZGVtbzpwQDU1dzByZA==",
"User-Agent": "Gecko/1.0",
},
}
},
wantHeaders: map[string][]string{
"Authorization": {"Basic ZGVtbzpwQDU1dzByZA=="},
"User-Agent": {"Gecko/1.0"},
},
},
}
for _, tc := range testCases {
t.Run(tc.name, func(t *testing.T) {
var headers map[string][]string
mods := []flyscrape.Module{
&starturl.Module{URL: "http://www.example.com"},
hook.Module{
AdaptTransportFn: func(rt http.RoundTripper) http.RoundTripper {
return flyscrape.RoundTripFunc(func(r *http.Request) (*http.Response, error) {
headers = r.Header
return rt.RoundTrip(r)
})
},
},
tc.headersFn(),
}
scraper := flyscrape.NewScraper()
scraper.Modules = mods
scraper.Run()
require.Truef(
t,
reflect.DeepEqual(tc.wantHeaders, headers),
fmt.Sprintf("expected: %v; actual: %v", tc.wantHeaders, headers),
)
})
}
}
|