-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathdupefilter.go
111 lines (85 loc) · 2.13 KB
/
dupefilter.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
package middlewares
import (
"encoding/hex"
"errors"
"fmt"
"hash"
"io"
"net/http"
"sort"
"strings"
"sync"
"github.com/tech-engine/goscrapy/pkg/middlewaremanager"
"golang.org/x/crypto/blake2b"
)
// ERR_DUPEFILTER_BLOCKED is the sentinel error reported for a request whose
// fingerprint has already been recorded. DupeFilter wraps it with %w, so
// callers should match it with errors.Is rather than by direct comparison.
var (
	ERR_DUPEFILTER_BLOCKED = errors.New("duplicate request")
)
// RequestMap is a set of request fingerprints bundled with the lock that
// must be held while the set is read or written.
type RequestMap struct {
	// mu guards seen; it is declared first so the lock sits directly above
	// the data it protects.
	mu sync.RWMutex
	// seen holds one entry per fingerprint that has been recorded. The empty
	// struct value carries no data: only key membership matters.
	seen map[string]struct{}
}
// NewRequestMap returns a RequestMap whose fingerprint set is allocated and
// empty, so it can be written to immediately (writing to a nil map panics).
func NewRequestMap() *RequestMap {
	rm := new(RequestMap)
	rm.seen = map[string]struct{}{}
	return rm
}
// generateSHA1FingerprintFromReq returns a hex-encoded fingerprint of r that
// covers its method, URL, headers and, when it can be replayed, its body.
//
// Despite the historical name, the digest is BLAKE2b-256, not SHA-1.
//
// Every metadata field is written length-prefixed and every variable-length
// list is preceded by its element count. Plain concatenation is ambiguous:
// for example the headers "X-A: bc" and "X-Ab: c" would both serialise to
// "X-Abc" and the two requests would wrongly be treated as duplicates. The
// body is streamed into the hash last, after the self-delimiting metadata.
//
// The body is included only when r.GetBody is set; r.Body itself is never
// read here, so the request can still be sent afterwards.
//
// An error is returned when r has no URL, when the hash cannot be created,
// when GetBody fails, or when reading the body fails.
func generateSHA1FingerprintFromReq(r *http.Request) (string, error) {
	if r.URL == nil {
		// Calling String on a nil *url.URL would panic.
		return "", errors.New("request has no URL")
	}

	var (
		err    error
		body   io.ReadCloser
		digest hash.Hash
	)

	if digest, err = blake2b.New256(nil); err != nil {
		return "", err
	}

	var meta strings.Builder
	// Writes to a strings.Builder never fail, so the Fprintf results are not
	// checked.
	writeField := func(s string) { fmt.Fprintf(&meta, "%d:%s,", len(s), s) }
	writeCount := func(n int) { fmt.Fprintf(&meta, "%d;", n) }

	writeField(r.Method)
	writeField(r.URL.String())

	// Map iteration order is random; sort the keys so that the same request
	// always yields the same fingerprint.
	headerKeys := make([]string, 0, len(r.Header))
	for key := range r.Header {
		headerKeys = append(headerKeys, key)
	}
	sort.Strings(headerKeys)

	writeCount(len(headerKeys))
	for _, key := range headerKeys {
		values := r.Header[key]
		writeField(key)
		writeCount(len(values))
		for _, value := range values {
			writeField(value)
		}
	}

	if _, err = io.WriteString(digest, meta.String()); err != nil {
		return "", err
	}

	if r.GetBody != nil {
		// GetBody hands out a fresh copy of the body, leaving r.Body intact.
		if body, err = r.GetBody(); err != nil {
			return "", err
		}
		defer body.Close()

		if _, err = io.Copy(digest, body); err != nil {
			return "", err
		}
	}

	return hex.EncodeToString(digest.Sum(nil)), nil
}
// DupeFilter returns a RoundTripper middleware that forwards a request to
// next only the first time its fingerprint is seen.
//
// Each call to DupeFilter creates its own RequestMap, so the set of seen
// fingerprints is shared by all requests passing through the returned
// RoundTripper and by nothing else.
//
// The returned RoundTripper fails with an error wrapping
// ERR_DUPEFILTER_BLOCKED when the fingerprint was already recorded, and with
// an error wrapping the underlying cause when the fingerprint cannot be
// computed. In both cases next is not called.
//
// The fingerprint is recorded before next runs, so a request whose round trip
// subsequently fails is still treated as seen.
func DupeFilter(next http.RoundTripper) http.RoundTripper {
	requestMap := NewRequestMap()

	// closeBody releases the request body on the paths that never reach next.
	// The http.RoundTripper contract requires RoundTrip to always close the
	// body, including on errors.
	closeBody := func(req *http.Request) {
		if req.Body != nil {
			// Best effort: the request is being rejected anyway, so a Close
			// error carries nothing the caller could act on.
			_ = req.Body.Close()
		}
	}

	return middlewaremanager.MiddlewareFunc(func(req *http.Request) (*http.Response, error) {
		signature, err := generateSHA1FingerprintFromReq(req)
		if err != nil {
			closeBody(req)
			return nil, fmt.Errorf("duplicatefilter.go:DupeFilterMiddleware: error generating request signature %w", err)
		}

		// Test-and-set under a single lock acquisition so that two concurrent
		// requests with the same fingerprint cannot both pass.
		requestMap.mu.Lock()
		_, duplicate := requestMap.seen[signature]
		if !duplicate {
			requestMap.seen[signature] = struct{}{}
		}
		requestMap.mu.Unlock()

		if duplicate {
			// we have already seen this signature so we skip
			closeBody(req)
			return nil, fmt.Errorf("duplicatefilter.go:DupeFilterMiddleware: %w", ERR_DUPEFILTER_BLOCKED)
		}

		return next.RoundTrip(req)
	})
}