summary refs log tree commit diff
path: root/src/crawl/crawl.conf
diff options
context:
space:
mode:
author Andreas Baumann <mail@andreasbaumann.cc> 2014-09-28 21:29:03 +0200
committer Andreas Baumann <mail@andreasbaumann.cc> 2014-09-28 21:29:03 +0200
commit b80687f17644766eb890598297c0f37bb898d76d (patch)
tree 44e6a15cc058087a19dd44d44c2d1d52194a5876 /src/crawl/crawl.conf
parent c82a15eb0ffe61c1d2d2630981777f72013e833a (diff)
download crawler-b80687f17644766eb890598297c0f37bb898d76d.tar.gz
crawler-b80687f17644766eb890598297c0f37bb898d76d.tar.bz2
first Lua config of crawler
Diffstat (limited to 'src/crawl/crawl.conf')
-rw-r--r-- src/crawl/crawl.conf 13
1 files changed, 13 insertions, 0 deletions
diff --git a/src/crawl/crawl.conf b/src/crawl/crawl.conf
new file mode 100644
index 0000000..95d0f75
--- /dev/null
+++ b/src/crawl/crawl.conf
@@ -0,0 +1,13 @@
+-- global settings
+
+crawler = {
+ -- stop after N operations (documents)
+ stop_after_N_operations = 10
+}
+
+-- seeds: URLs which are fed to the URL frontier at the beginning
+
+seeds = {
+ "http://www.wolframe.net",
+ "http://wolframe.net"
+}