zz
This commit is contained in:
parent
e06ef64c8f
commit
7d09f112df
@ -4,4 +4,4 @@ COPY requirements.txt /app
|
||||
RUN pip install -r /app/requirements.txt
|
||||
COPY *.py /app
|
||||
WORKDIR /app
|
||||
ENTRYPOINT ["python", "./mongocrawler.py"]
|
||||
ENTRYPOINT ["rq", "worker"]
|
||||
|
@ -1,5 +1,9 @@
|
||||
version: "3.0"
|
||||
services:
|
||||
redis:
|
||||
image: redis
|
||||
ports:
|
||||
- 6379:6379
|
||||
mongo:
|
||||
image: mongo
|
||||
environment:
|
||||
|
@ -591,8 +591,6 @@ def visit(start_link):
|
||||
batch_size = BATCHSIZE
|
||||
rules = fetch_robot(hostname)
|
||||
# renew front links
|
||||
sitemap_links = fetch_sitemap_links(start_link)
|
||||
index_links(db,sitemap_links)
|
||||
front_links = fetch_front_links(start_link,rules)
|
||||
index_links(db,front_links)
|
||||
# start crawling
|
||||
|
Loading…
Reference in New Issue
Block a user