public interface Nutch
Modifier and Type | Field and Description |
---|---|
static java.lang.String |
ALL_BATCH_ID_STR |
static org.apache.avro.util.Utf8 |
ALL_CRAWL_ID |
static java.lang.String |
ARG_BATCH
Batch id to select.
|
static java.lang.String |
ARG_CLASS
Class to run as a NutchTool.
|
static java.lang.String |
ARG_CRAWL
Crawl id to use.
|
static java.lang.String |
ARG_CURTIME
The notion of current time.
|
static java.lang.String |
ARG_DEPTH
Depth (number of cycles) of a crawl.
|
static java.lang.String |
ARG_FILTER
Apply URLFilters.
|
static java.lang.String |
ARG_FORCE
Force processing even if there are locks or inconsistencies.
|
static java.lang.String |
ARG_NORMALIZE
Apply URLNormalizers.
|
static java.lang.String |
ARG_NUMTASKS
Number of fetcher tasks.
|
static java.lang.String |
ARG_RESUME
Resume a previously aborted operation.
|
static java.lang.String |
ARG_SEEDDIR
A path to a directory containing a list of seed URLs.
|
static java.lang.String |
ARG_SEEDLIST
Whitespace-separated list of seed URLs.
|
static java.lang.String |
ARG_SITEMAP
Sitemaps.
|
static java.lang.String |
ARG_SITEMAP_DETECT
Sitemap Detect as fetch.
|
static java.lang.String |
ARG_SOLR
Solr URL.
|
static java.lang.String |
ARG_SORT
Sort statistics.
|
static java.lang.String |
ARG_THREADS
Number of fetcher threads (per map task).
|
static java.lang.String |
ARG_TOPN
Generate topN scoring URLs.
|
static java.lang.String |
BATCH_NAME_KEY |
static java.lang.String |
CACHING_FORBIDDEN_ALL
Don't show either original forbidden content or summaries.
|
static java.lang.String |
CACHING_FORBIDDEN_CONTENT
Don't show original forbidden content, but show summaries.
|
static java.lang.String |
CACHING_FORBIDDEN_KEY
Sites may request that search engines don't provide access to cached
documents.
|
static org.apache.avro.util.Utf8 |
CACHING_FORBIDDEN_KEY_UTF8 |
static java.lang.String |
CACHING_FORBIDDEN_NONE
Show both original forbidden content and summaries (default).
|
static java.lang.String |
CHAR_ENCODING_FOR_CONVERSION |
static java.lang.String |
CRAWL_ID_KEY |
static java.lang.String |
FETCH_STATUS_KEY |
static java.lang.String |
FETCH_TIME_KEY |
static java.lang.String |
GENERATE_TIME_KEY |
static java.lang.String |
ORIGINAL_CHAR_ENCODING |
static java.lang.String |
PROTO_STATUS_KEY |
static java.lang.String |
REPR_URL_KEY |
static java.lang.String |
SCORE_KEY |
static java.lang.String |
SIGNATURE_KEY |
static java.lang.String |
STAT_COUNTERS
Counters.
|
static java.lang.String |
STAT_JOBS
Jobs.
|
static java.lang.String |
STAT_MESSAGE
Status / result message.
|
static java.lang.String |
STAT_PHASE
Phase of processing.
|
static java.lang.String |
STAT_PROGRESS
Progress (float).
|
static Text |
WRITABLE_GENERATE_TIME_KEY |
static Text |
WRITABLE_PROTO_STATUS_KEY |
static Text |
WRITABLE_REPR_URL_KEY |
static final java.lang.String ORIGINAL_CHAR_ENCODING
static final java.lang.String CHAR_ENCODING_FOR_CONVERSION
static final java.lang.String SIGNATURE_KEY
static final java.lang.String BATCH_NAME_KEY
static final java.lang.String SCORE_KEY
static final java.lang.String GENERATE_TIME_KEY
static final Text WRITABLE_GENERATE_TIME_KEY
static final java.lang.String PROTO_STATUS_KEY
static final Text WRITABLE_PROTO_STATUS_KEY
static final java.lang.String FETCH_TIME_KEY
static final java.lang.String FETCH_STATUS_KEY
static final java.lang.String CACHING_FORBIDDEN_KEY
static final org.apache.avro.util.Utf8 CACHING_FORBIDDEN_KEY_UTF8
static final java.lang.String CACHING_FORBIDDEN_NONE
static final java.lang.String CACHING_FORBIDDEN_ALL
static final java.lang.String CACHING_FORBIDDEN_CONTENT
static final java.lang.String REPR_URL_KEY
static final Text WRITABLE_REPR_URL_KEY
static final java.lang.String ALL_BATCH_ID_STR
static final org.apache.avro.util.Utf8 ALL_CRAWL_ID
static final java.lang.String CRAWL_ID_KEY
static final java.lang.String ARG_BATCH
static final java.lang.String ARG_CRAWL
static final java.lang.String ARG_RESUME
static final java.lang.String ARG_FORCE
static final java.lang.String ARG_SORT
static final java.lang.String ARG_SOLR
static final java.lang.String ARG_THREADS
static final java.lang.String ARG_NUMTASKS
static final java.lang.String ARG_TOPN
static final java.lang.String ARG_CURTIME
static final java.lang.String ARG_FILTER
static final java.lang.String ARG_NORMALIZE
static final java.lang.String ARG_SEEDLIST
static final java.lang.String ARG_SEEDDIR
static final java.lang.String ARG_CLASS
static final java.lang.String ARG_DEPTH
static final java.lang.String ARG_SITEMAP
static final java.lang.String ARG_SITEMAP_DETECT
static final java.lang.String STAT_MESSAGE
static final java.lang.String STAT_PHASE
static final java.lang.String STAT_PROGRESS
static final java.lang.String STAT_JOBS
static final java.lang.String STAT_COUNTERS
Copyright © 2019 The Apache Software Foundation