Fix a bug in redirect handling that prevented the crawler from indexing some documents.

This commit is contained in:
vlofgren 2022-08-17 00:51:07 +02:00
parent 8f2485870d
commit 0bac422091

View File

@@ -168,10 +168,11 @@ public class CrawlerRetreiver {
var d = doc.get();
crawledDomainWriter.accept(d);
try {
visited.add(new EdgeUrl(d.url));
if (d.url != null) {
try {
visited.add(new EdgeUrl(d.url));
} catch (URISyntaxException ex) {}
}
catch (URISyntaxException ex) {}
}