From 03e343a13634932077fdad9431dd2cad0cad3689 Mon Sep 17 00:00:00 2001
From: Joe Lothan
Date: Wed, 20 May 2026 00:53:24 -0400
Subject: [PATCH] cap number of favicons to 50 per host

---
 pipeline/02_warc_parse/parser.go | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/pipeline/02_warc_parse/parser.go b/pipeline/02_warc_parse/parser.go
index 0d0460a..37b4339 100644
--- a/pipeline/02_warc_parse/parser.go
+++ b/pipeline/02_warc_parse/parser.go
@@ -47,7 +47,7 @@ func ParseHTML(body []byte, protocol, hostname string) ParseResult {
 			continue
 		}
 
-		if tagName == "link" && hasAttr {
+		if tagName == "link" && hasAttr && len(result.Icons) < 50 {
 			icon := parseLinkTag(tokenizer, protocol, hostname)
 			if icon != nil {
 				result.Icons = append(result.Icons, *icon)