forked from snowplow-referer-parser/golang-referer-parser
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathrefererparser.go
112 lines (99 loc) · 2.51 KB
/
refererparser.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
/*
Package refererparser implements referer extraction using a shared 'database' of known referers found in referers.yml [1].
Links
[1] https://github.com/snowplow/referer-parser/blob/master/referers.yml
*/
package refererparser
import (
"encoding/json"
"net/url"
"strings"
)
// refererData is the in-memory form of the referer database. As consumed by
// lookup, the outer key is the medium, the second key is the referer name and
// the innermost key is a config entry ("domains" or "parameters") mapping to a
// list of strings.
type refererData map[string]map[string]map[string][]string
// data is the package-level referer database; it is assigned once in init.
var data refererData
// init fills the package-level referer database when the package is loaded.
func init() { data = loadRefererData() }
// loadRefererData fetches the "data/referers.json" asset and decodes it as
// JSON into a refererData map. It panics if the asset cannot be obtained or
// if its content cannot be unmarshalled.
func loadRefererData() refererData {
	raw, err := Asset("data/referers.json")
	if err != nil {
		panic(err)
	}

	parsed := refererData{}
	err = json.Unmarshal(raw, &parsed)
	if err != nil {
		panic(err)
	}
	return parsed
}
// RefererResult holds the data extracted for a single referer URL.
type RefererResult struct {
// Known is true when the URL matched a domain in the referer database.
Known bool
// Referer is the name of the matched referer entry; empty when nothing matched.
Referer string
// Medium is the medium of the matched entry, "unknown" when nothing matched,
// or "internal" once SetCurrent finds the same host as the current URL.
Medium string
// SearchParameter is the name of the query parameter, taken from the matched
// entry's "parameters" list, that carried a non-empty value.
SearchParameter string
// SearchTerm is the value of SearchParameter in the URL's query string.
SearchTerm string
// URI is the parsed URL the result was computed for.
URI *url.URL
}
// SetCurrent sets Medium to "internal" when the host of curl, the URL of the
// current page, equals the host of the referer URI.
//
// The call is a no-op when the receiver is nil, when the result carries no
// URI, or when curl cannot be parsed: in those cases the hosts cannot be
// compared, so Medium is left untouched instead of panicking.
func (ref *RefererResult) SetCurrent(curl string) {
	if ref == nil || ref.URI == nil {
		return
	}
	purl, err := url.Parse(curl)
	if err != nil {
		// url.Parse returns a nil *url.URL together with the error.
		return
	}
	if purl.Host == ref.URI.Host {
		ref.Medium = "internal"
	}
}
// lookup searches the referer database for a domain matching q and returns
// the result for the first match found.
//
// When suffix is false, q must equal a domain exactly. When suffix is true, q
// matches a domain if it ends with or starts with that domain. On a match the
// result is marked Known and gets the referer name and medium; if the entry
// lists search parameters, the last listed parameter with a non-empty value in
// uri's query string is recorded as SearchParameter/SearchTerm.
//
// If nothing matches, the result has Known == false and Medium == "unknown".
// The database is a map, so when several entries match q the one returned
// depends on Go's unspecified map iteration order.
func lookup(uri *url.URL, q string, suffix bool) (refResult *RefererResult) {
	refResult = &RefererResult{URI: uri, Medium: "unknown"}

	for medium, referers := range data {
		for name, config := range referers {
			for _, domain := range config["domains"] {
				matched := q == domain
				if suffix {
					matched = strings.HasSuffix(q, domain) || strings.HasPrefix(q, domain)
				}
				if !matched {
					continue
				}

				refResult.Known = true
				refResult.Referer = name
				refResult.Medium = medium

				if params := config["parameters"]; len(params) > 0 {
					// Parse the query string once for all candidate parameters.
					query := uri.Query()
					for _, p := range params {
						if term := query.Get(p); term != "" {
							refResult.SearchParameter = p
							refResult.SearchTerm = term
						}
					}
				}
				return refResult
			}
		}
	}
	return refResult
}
// Parse parses uri and looks its host up in the referer database, returning a
// RefererResult describing the match.
//
// It returns nil when uri cannot be parsed. Otherwise the result is non-nil;
// when no referer matches, Known is false and Medium is "unknown".
//
// Four candidates are tried in order: host+path, host-without-first-label+path,
// host, and host-without-first-label. All candidates are first compared
// exactly; only if none matches are they retried with suffix/prefix matching.
// The host is lower-cased before matching because host names are
// case-insensitive; the path and the returned URI are left as given.
func Parse(uri string) (refResult *RefererResult) {
	puri, err := url.Parse(uri)
	if err != nil {
		return nil
	}

	host := strings.ToLower(puri.Host)

	// rhost is the host with everything up to and including the first "."
	// removed (e.g. "www.google.com" -> "google.com"); empty if there is no dot.
	rhost := ""
	if dot := strings.IndexByte(host, '.'); dot >= 0 {
		rhost = host[dot+1:]
	}

	queries := [...]string{host + puri.Path, rhost + puri.Path, host, rhost}

	// Exact matching takes priority over the looser suffix/prefix matching.
	for _, suffix := range [...]bool{false, true} {
		for _, q := range queries {
			refResult = lookup(puri, q, suffix)
			if refResult.Known {
				return refResult
			}
		}
	}
	return refResult
}