aCrawler
latest
Contents:
Tutorial
Basic Concepts
Main Interface
aCrawler
Docs
»
Index
Edit on GitHub
Index
_
|
A
|
B
|
C
|
D
|
E
|
F
|
G
|
H
|
I
|
L
|
M
|
N
|
O
|
P
|
R
|
S
|
T
|
U
|
W
_
_Middleware (class in acrawler.middleware)
A
acrawler.parser (module)
acrawler.setting (module)
acrawler.utils (module)
add_task() (acrawler.crawler.Crawler method)
address (acrawler.handlers.ItemToMongo attribute)
,
[1]
(acrawler.handlers.ItemToRedis attribute)
append_func() (acrawler.middleware._Middleware method)
B
bind() (acrawler.item.ParselItem class method)
body (acrawler.http.Response attribute)
BrowserRequest (class in acrawler.http)
C
callback (acrawler.http.Request attribute)
callback() (in module acrawler.handlers)
callbacks (acrawler.http.Response attribute)
check_import() (in module acrawler.utils)
col_name (acrawler.handlers.ItemToMongo attribute)
,
[1]
config (acrawler.crawler.Crawler attribute)
content (acrawler.item.Item attribute)
cookies (acrawler.http.Response attribute)
Crawler (class in acrawler.crawler)
custom_process() (acrawler.item.Item method)
D
db_name (acrawler.handlers.ItemToMongo attribute)
,
[1]
DefaultItem (class in acrawler.item)
doc (acrawler.http.Response attribute)
DOWNLOAD_DELAY (in module acrawler.setting)
DOWNLOAD_DELAY_SPECIAL_HOST (in module acrawler.setting)
drop() (acrawler.item.Processors static method)
drop_item() (acrawler.item.Processors static method)
E
exceptions (acrawler.task.Task attribute)
execute() (acrawler.task.Task method)
ExpiredWatcher (class in acrawler.handlers)
extra (acrawler.item.Item attribute)
F
family (acrawler.handlers.ItemToMongo attribute)
,
[1]
(acrawler.handlers.ItemToRedis attribute)
(acrawler.http.Request attribute)
(acrawler.middleware.Handler attribute)
fetch() (acrawler.http.BrowserRequest method)
(acrawler.http.Request method)
FileRequest (class in acrawler.http)
filter() (acrawler.item.Processors static method)
fingerprint (acrawler.task.Task attribute)
first() (acrawler.item.Processors static method)
follow() (acrawler.http.Response method)
G
get_logger() (in module acrawler.utils)
H
handle_after() (acrawler.handlers.ItemToMongo method)
,
[1]
(acrawler.handlers.ItemToRedis method)
(acrawler.middleware.Handler method)
handle_before() (acrawler.handlers.ResponseAddCallback method)
(acrawler.middleware.Handler method)
Handler (class in acrawler.middleware)
headers (acrawler.http.Response attribute)
history (acrawler.http.Response attribute)
I
init_time (acrawler.task.Task attribute)
Item (class in acrawler.item)
items_key (acrawler.handlers.ItemToRedis attribute)
ItemToMongo (class in acrawler.handlers)
,
[1]
ItemToRedis (class in acrawler.handlers)
L
last_crawl_time (acrawler.task.Task attribute)
LOCK_ALWAYS (in module acrawler.setting)
LOG_LEVEL (in module acrawler.setting)
LOG_TIME_DELTA (in module acrawler.setting)
LOG_TO_FILE (in module acrawler.setting)
M
manager() (acrawler.crawler.Crawler method)
map() (acrawler.item.Processors class method)
MAX_REQUESTS (in module acrawler.setting)
MAX_REQUESTS_PER_HOST (in module acrawler.setting)
MAX_REQUESTS_SPECIAL_HOST (in module acrawler.setting)
MAX_TRIES (in module acrawler.setting)
maxsize (acrawler.handlers.ItemToRedis attribute)
merge_dicts() (in module acrawler.utils)
meta (acrawler.http.Request attribute)
(acrawler.http.Response attribute)
middleware (acrawler.crawler.Crawler attribute)
middleware_config (acrawler.crawler.Crawler attribute)
N
next_requests() (acrawler.crawler.Crawler method)
O
ok (acrawler.http.Response attribute)
,
[1]
on_close() (acrawler.handlers.ItemToMongo method)
,
[1]
(acrawler.handlers.ItemToRedis method)
(acrawler.middleware.Handler method)
on_start() (acrawler.handlers.ExpiredWatcher method)
(acrawler.handlers.ItemToMongo method)
,
[1]
(acrawler.handlers.ItemToRedis method)
(acrawler.middleware.Handler method)
open() (acrawler.http.Response method)
open_html() (in module acrawler.utils)
operate_page() (acrawler.http.BrowserRequest method)
P
paginate() (acrawler.http.Response method)
parse() (acrawler.crawler.Crawler method)
(acrawler.http.Response method)
(acrawler.parser.Parser method)
parse_items() (acrawler.parser.Parser method)
parse_links() (acrawler.parser.Parser method)
ParselItem (class in acrawler.item)
Parser (class in acrawler.parser)
parsers (acrawler.crawler.Crawler attribute)
PERSISTENT (in module acrawler.setting)
PERSISTENT_NAME (in module acrawler.setting)
priority (acrawler.middleware.Handler attribute)
Processors (class in acrawler.item)
R
REDIS_ADDRESS (in module acrawler.setting)
REDIS_DF_KEY (in module acrawler.setting)
REDIS_ENABLE (in module acrawler.setting)
redis_push_start_urls() (in module acrawler.utils)
redis_push_start_urls_coro() (in module acrawler.utils)
REDIS_QUEUE_KEY (in module acrawler.setting)
REDIS_START_KEY (in module acrawler.setting)
register() (acrawler.middleware._Middleware method)
(in module acrawler.middleware)
request (acrawler.http.Response attribute)
Request (class in acrawler.http)
request_config (acrawler.crawler.Crawler attribute)
(acrawler.http.Request attribute)
Response (class in acrawler.http)
ResponseAddCallback (class in acrawler.handlers)
run() (acrawler.crawler.Crawler method)
S
score (acrawler.task.Task attribute)
sel (acrawler.http.Response attribute)
send() (acrawler.http.Request method)
spawn() (acrawler.http.Response method)
start_requests() (acrawler.crawler.Crawler method)
start_urls (acrawler.crawler.Crawler attribute)
status (acrawler.http.Response attribute)
status_allowed (acrawler.http.Request attribute)
STATUS_ALLOWED (in module acrawler.setting)
strip() (acrawler.item.Processors static method)
sync_coroutine() (in module acrawler.utils)
T
Task (class in acrawler.task)
text (acrawler.http.Response attribute)
to_date() (acrawler.item.Processors static method)
to_datetime() (acrawler.item.Processors static method)
to_float() (acrawler.item.Processors static method)
to_int() (acrawler.item.Processors static method)
tries (acrawler.task.Task attribute)
U
update_sel() (acrawler.http.Response method)
url (acrawler.http.Request attribute)
(acrawler.http.Response attribute)
url_str (acrawler.http.Response attribute)
urljoin() (acrawler.http.Response method)
W
web_action_after_query() (acrawler.crawler.Crawler method)
web_add_task_query() (acrawler.crawler.Crawler method)
WEB_ENABLE (in module acrawler.setting)
WEB_HOST (in module acrawler.setting)
WEB_PORT (in module acrawler.setting)
Read the Docs
v: latest
Versions
latest
stable
Downloads
pdf
html
epub
On Read the Docs
Project Home
Builds
Free document hosting provided by
Read the Docs
.