| org.archive.crawler.datamodel.FetchStatusCodes
All known Subclasses: org.archive.crawler.fetcher.FetchHTTP, org.archive.crawler.processor.BeanShellProcessor, org.archive.crawler.frontier.WorkQueueFrontier, org.archive.crawler.framework.WriterPoolProcessor, org.archive.crawler.prefetch.RuntimeLimitEnforcer, org.archive.crawler.postprocessor.FrontierScheduler, org.archive.crawler.writer.ExperimentalV10WARCWriterProcessor, org.archive.crawler.prefetch.QuotaEnforcer, org.archive.crawler.fetcher.FetchDNS, org.archive.crawler.prefetch.PreconditionEnforcer, org.archive.crawler.frontier.AdaptiveRevisitFrontier, org.archive.crawler.writer.ExperimentalWARCWriterProcessor, org.archive.crawler.processor.CrawlMapper, org.archive.crawler.datamodel.CrawlSubstats, org.archive.crawler.datamodel.CrawlURI, org.archive.crawler.writer.ARCWriterProcessor, org.archive.crawler.prefetch.Preselector, org.archive.crawler.framework.ToeThread, org.archive.crawler.postprocessor.CrawlStateUpdater, org.archive.crawler.frontier.AbstractFrontier, org.archive.crawler.postprocessor.LinksScoper,
FetchStatusCodes | public interface FetchStatusCodes (Code) | | Constant flag codes to be used, in lieu of per-protocol
codes (like HTTP's 200, 404, etc.), when network/internal/
out-of-band conditions occur.
The URISelector may use such codes, along with user-configured
options, to determine whether, when, and how many times
a CrawlURI might be reattempted.
author: gojomo |
S_BLOCKED_BY_CUSTOM_PROCESSOR | final public static int S_BLOCKED_BY_CUSTOM_PROCESSOR(Code) | | Blocked by custom prefetcher processor.
A check against scope or against filters in a custom prefetch
processor rules CrawlURI should not be crawled.
TODO: Add to documentation and help page.
|
S_BLOCKED_BY_QUOTA | final public static int S_BLOCKED_BY_QUOTA(Code) | | Blocked due to exceeding an established quota.
TODO: Add to documentation and help page.
|
S_BLOCKED_BY_RUNTIME_LIMIT | final public static int S_BLOCKED_BY_RUNTIME_LIMIT(Code) | | Blocked due to exceeding an established runtime.
TODO: Add to documentation and help page.
|
S_BLOCKED_BY_USER | final public static int S_BLOCKED_BY_USER(Code) | | blocked from fetch by user setting.
|
S_CONNECT_FAILED | final public static int S_CONNECT_FAILED(Code) | | HTTP connect failed
|
S_CONNECT_LOST | final public static int S_CONNECT_LOST(Code) | | HTTP connect broken
|
S_DEEMED_CHAFF | final public static int S_DEEMED_CHAFF(Code) | | 'chaff' detection of traps/content of negligible value applied
|
S_DEFERRED | final public static int S_DEFERRED(Code) | | temporary status assigned to URIs awaiting preconditions; appearance in
logs is a bug
|
S_DELETED_BY_USER | final public static int S_DELETED_BY_USER(Code) | | deleted from frontier by user
|
S_DNS_SUCCESS | final public static int S_DNS_SUCCESS(Code) | | DNS success
|
S_DOMAIN_PREREQUISITE_FAILURE | final public static int S_DOMAIN_PREREQUISITE_FAILURE(Code) | | DNS prerequisite failed, precluding attempt
|
S_DOMAIN_UNRESOLVABLE | final public static int S_DOMAIN_UNRESOLVABLE(Code) | | DNS lookup failed
|
S_GETBYNAME_SUCCESS | final public static int S_GETBYNAME_SUCCESS(Code) | | InetAddress.getByName success
|
S_OTHER_PREREQUISITE_FAILURE | final public static int S_OTHER_PREREQUISITE_FAILURE(Code) | | Some other (non-DNS, non-robots) prerequisite failed, precluding attempt
|
S_OUT_OF_SCOPE | final public static int S_OUT_OF_SCOPE(Code) | | out-of-scope upon reexamination (only when scope changes during
crawl)
|
S_PREREQUISITE_UNSCHEDULABLE_FAILURE | final public static int S_PREREQUISITE_UNSCHEDULABLE_FAILURE(Code) | | A prerequisite could not be scheduled, precluding attempt
|
S_PROCESSING_THREAD_KILLED | final public static int S_PROCESSING_THREAD_KILLED(Code) | | Processing thread was killed
|
S_ROBOTS_PRECLUDED | final public static int S_ROBOTS_PRECLUDED(Code) | | robots rules precluded fetch
|
S_ROBOTS_PREREQUISITE_FAILURE | final public static int S_ROBOTS_PREREQUISITE_FAILURE(Code) | | Robots prerequisite failed, precluding attempt
|
S_RUNTIME_EXCEPTION | final public static int S_RUNTIME_EXCEPTION(Code) | | Unexpected runtime exception; see runtime-errors.log
|
S_SERIOUS_ERROR | final public static int S_SERIOUS_ERROR(Code) | | severe java 'Error' conditions (OutOfMemoryError, StackOverflowError,
etc.) during URI processing
|
S_TIMEOUT | final public static int S_TIMEOUT(Code) | | HTTP timeout (before any meaningful response received)
|
S_TOO_MANY_EMBED_HOPS | final public static int S_TOO_MANY_EMBED_HOPS(Code) | | overstepped embed/trans hops
|
S_TOO_MANY_LINK_HOPS | final public static int S_TOO_MANY_LINK_HOPS(Code) | | overstepped link hops
|
S_TOO_MANY_RETRIES | final public static int S_TOO_MANY_RETRIES(Code) | | multiple retries all failed
|
S_UNATTEMPTED | final public static int S_UNATTEMPTED(Code) | | fetch never tried (perhaps protocol unsupported or illegal URI)
|
S_UNFETCHABLE_URI | final public static int S_UNFETCHABLE_URI(Code) | | URI recognized as unsupported or illegal
|
S_UNQUEUEABLE | final public static int S_UNQUEUEABLE(Code) | | URI could not be queued in Frontier; when URIs are properly
filtered for format, should never occur
|
|
|