Skip to content

Commit

Permalink
updateRobots: deem S_CONNECT_FAILED to be a 404
Browse files (browse the repository at this point in the history)
  • Loading branch information
galgeek committed Oct 6, 2017
1 parent 0ec055c commit d4b8566
Showing 1 changed file with 6 additions and 0 deletions.
Original file line number Diff line number Diff line change
Expand Up @@ -157,6 +157,12 @@ public synchronized void updateRobots(CrawlURI curi) {
gotSomething = true;
}

// special case: deem a connection failure (S_CONNECT_FAILED) to be a not-found (404) result
if (curi.getFetchStatus() == S_CONNECT_FAILED) {
curi.setFetchStatus(S_DEEMED_NOT_FOUND);
gotSomething = true;
}

if (!gotSomething) {
// robots.txt fetch failed and exceptions (ignore/deeming) don't apply; no valid robots info yet
validRobots = false;
Expand Down

0 comments on commit d4b8566

Please sign in to comment.