-
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathregex.go
98 lines (77 loc) · 1.62 KB
/
regex.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
package mail
import (
"errors"
"log/slog"
"net/url"
"regexp"
"strings"
)
// urlR matches http://, https:// and ftp:// URLs. A match runs from the
// scheme up to, but not including, the next whitespace character.
var urlR = regexp.MustCompile(`https?://[^\s]+|ftp://[^\s]+`)
// urls extracts the http, https and ftp URLs found in data and returns them
// parsed, in order of first appearance and without duplicates. The returned
// slice is never nil.
//
// One trailing '>', one trailing ')' and one trailing '"' are trimmed from
// each match (in that order), because the pattern runs up to the next
// whitespace and therefore picks up closing delimiters of surrounding markup.
// Links wrapped by a known safe link provider are replaced by their target
// via RMSafeLink. Matches that cannot be parsed or unwrapped are logged and
// skipped.
func urls(data string) []*url.URL {
	out := []*url.URL{}

	// Raw matches and final URLs are tracked in separate sets. Sharing one
	// set would make every URL whose String() equals its raw text look like
	// a duplicate of itself and drop it from the result.
	seenRaw := make(map[string]struct{})
	seenURL := make(map[string]struct{})

	for _, raw := range urlR.FindAllString(data, -1) {
		raw = strings.TrimSuffix(raw, ">")
		raw = strings.TrimSuffix(raw, ")")
		raw = strings.TrimSuffix(raw, "\"")

		// Skip repeated raw matches early so a broken link is only parsed
		// and logged once.
		if _, dup := seenRaw[raw]; dup {
			continue
		}
		seenRaw[raw] = struct{}{}

		parsed, err := url.Parse(raw)
		if err != nil {
			slog.Warn(
				"Error parsing URL",
				"error", err.Error(),
				"url", raw,
			)
			continue
		}
		if parsed == nil {
			continue
		}

		target, err := RMSafeLink(parsed)
		if err != nil {
			slog.Warn(
				"Error stripping safe link",
				"error", err.Error(),
				"url", raw,
			)
			// No usable URL came back; skipping avoids dereferencing nil.
			continue
		}
		if target == nil {
			continue
		}

		// Deduplicate on the final URL so that different wrappers around
		// the same target yield a single entry.
		key := target.String()
		if _, dup := seenURL[key]; dup {
			continue
		}
		seenURL[key] = struct{}{}

		out = append(out, target)
	}

	return out
}
// ErrEmpty is returned by RMSafeLink when it is given a nil URL, or a safe
// link whose query has no "url" parameter.
var ErrEmpty = errors.New("empty safe link")
// knownSafeLinkSuffix lists the host suffixes that isSafeLn uses to
// recognise a URL as a safe link.
//
//nolint:gochecknoglobals // this is a list of known safe link suffixes
var knownSafeLinkSuffix = []string{
"safelinks.protection.outlook.com",
}
// RMSafeLink removes the safe link wrapper from a URL that was added by
// known safe link providers registered by the knownSafeLinkSuffix global
// variable for host suffixes.
//
// A URL that isSafeLn does not recognise is returned unchanged. For a safe
// link, the first value of its "url" query parameter is parsed and returned.
//
// ErrEmpty is returned when ln is nil, or when the "url" parameter is
// missing or empty. A target that fails to parse yields the error from
// url.Parse. The returned URL is nil whenever the error is non-nil.
func RMSafeLink(ln *url.URL) (*url.URL, error) {
	if ln == nil {
		return nil, ErrEmpty
	}

	if !isSafeLn(ln) {
		return ln, nil
	}

	// Get returns "" both when the parameter is absent and when its first
	// value is empty; neither carries a target, so both count as empty
	// rather than being parsed into a blank URL.
	target := ln.Query().Get("url")
	if target == "" {
		return nil, ErrEmpty
	}

	return url.Parse(target)
}
// isSafeLn reports whether the host name of ln ends with one of the suffixes
// listed in knownSafeLinkSuffix.
//
// The comparison uses the host name without any port and ignores letter
// case, so "HOST.example:443" is matched the same way as "host.example".
// ln must not be nil.
func isSafeLn(ln *url.URL) bool {
	// Hostname strips a ":port" that ln.Host would still carry and that
	// would otherwise defeat the suffix comparison.
	host := strings.ToLower(ln.Hostname())

	for _, suffix := range knownSafeLinkSuffix {
		if strings.HasSuffix(host, strings.ToLower(suffix)) {
			return true
		}
	}

	return false
}