Fix bug in redirect handling that caused the crawler to not index some documents.
This commit is contained in:
parent
8f2485870d
commit
0bac422091
@@ -168,10 +168,11 @@ public class CrawlerRetreiver {
|
||||
var d = doc.get();
|
||||
crawledDomainWriter.accept(d);
|
||||
|
||||
try {
|
||||
visited.add(new EdgeUrl(d.url));
|
||||
if (d.url != null) {
|
||||
try {
|
||||
visited.add(new EdgeUrl(d.url));
|
||||
} catch (URISyntaxException ex) {}
|
||||
}
|
||||
catch (URISyntaxException ex) {}
|
||||
|
||||
}
|
||||
|
||||
|
Loading…
Reference in New Issue
Block a user