From 2ac0b911f5f2e47fa224da9a87f8eee9b308739f Mon Sep 17 00:00:00 2001 From: dano Date: Thu, 18 Jun 2020 13:19:40 +0000 Subject: [PATCH] Update 'README.md' --- README.md | 32 ++++++++++++++++++++++++++++++++ 1 file changed, 32 insertions(+) diff --git a/README.md b/README.md index 32985ac..85f95ed 100644 --- a/README.md +++ b/README.md @@ -28,6 +28,38 @@ Install package: pip install https://git.kemt.fei.tuke.sk/dano/websucker-pip/archive/master.zip +### Initialize and set up the database + +If you have Cassandra installed, first initialize the database schema using the cqlsh command. The schema can be found in the schema.sql file. + + +Configure the database connection using environment variables (if the database is on another machine): + + + export CASSANDRA_HOST=localhost + + export CASSANDRA_PORT=9142 + + ## Usage websuck --help + + + +### Create initial domain list + +Save the list of domains to a file, e.g.: + + echo www.sme.sk > domains.txt + + +### Visit initial domains in file + + + websuck --visit file domains.txt + +### Visit unvisited domains + + websuck --visit unvisited 100 +