From e4e052cf2709835217a748db7674bb6b45d0a8cf Mon Sep 17 00:00:00 2001 From: Jordan Date: Tue, 7 Dec 2021 11:07:13 -0700 Subject: archive, keep: host -> regexp ignore list --- archive.go | 12 ++++-------- 1 file changed, 4 insertions(+), 8 deletions(-) (limited to 'archive.go') diff --git a/archive.go b/archive.go index 7f44078..924e6f4 100644 --- a/archive.go +++ b/archive.go @@ -4,6 +4,7 @@ import ( "encoding/json" "log" "net/http" + "regexp" "strconv" "time" ) @@ -14,11 +15,6 @@ var ( TIMEOUT time.Duration = 25 client *http.Client = &http.Client{Timeout: TIMEOUT * time.Second} - - ignoreList = []string{"cdn.discordapp.com", "discord.com", "tenor.com", - "c.tenor.com", "archive.org", "web.archive.org", "youtu.be", - "youtube.com", "www.youtube.com", "discord.gg", "media.discordapp.net", - "open.spotify.com", "i.redd.it", "v.redd.it"} ) type Wayback struct { @@ -34,11 +30,11 @@ type Closest struct { Status string `json:"status"` } -func isIgnored(host string) bool { +func isIgnored(regex []string, url string) bool { - for _, h := range ignoreList { + for _, r := range regex { - if host == h { + if v := regexp.MustCompile(r); v.MatchString(url) { return true } } -- cgit v1.2.3-54-g00ecf