euscan: add new robots.txt exceptions

Signed-off-by: Corentin Chary <corentincj@iksaif.net>
This commit is contained in:
Corentin Chary 2011-10-08 08:33:03 +02:00
parent d7f655cdde
commit 277fb4ebe6

View File

@@ -18,7 +18,7 @@ CONFIG = {
'brute-force-recursive': True,
'brute-force-false-watermark': 50,
'scan-dir': True,
-'oneshot': False,
+'oneshot': True,
'user-agent' : 'escan (http://euscan.iksaif.net)',
'skip-robots-txt' : False,
'cache' : False
@@ -60,4 +60,6 @@ ROBOTS_TXT_BLACKLIST_DOMAINS = [
'(.*)sourceforge(.*)',
'(.*)github.com',
'(.*)berlios(.*)',
+'(.*)qt.nokia.com(.*)',
+'(.*)chromium.org(.*)',
]