mirror of
https://github.com/ail-project/ail-framework.git
synced 2024-11-27 00:07:16 +00:00
fix: [Crawler] retry when splash is not available
This commit is contained in:
parent
4e08aaa80f
commit
f842194c57
1 changed file with 20 additions and 10 deletions
|
@@ -27,17 +27,27 @@ def crawl_onion(url, domain, date, date_month, message):
|
||||||
if super_father is None:
|
if super_father is None:
|
||||||
super_father=paste
|
super_father=paste
|
||||||
|
|
||||||
try:
|
retry = True
|
||||||
r = requests.get(splash_url , timeout=30.0)
|
nb_retry = 0
|
||||||
except Exception:
|
while retry:
|
||||||
# TODO: relaunch docker or send error message
|
try:
|
||||||
|
r = requests.get(splash_url , timeout=30.0)
|
||||||
|
retry = False
|
||||||
|
except Exception:
|
||||||
|
# TODO: relaunch docker or send error message
|
||||||
|
nb_retry += 1
|
||||||
|
|
||||||
on_error_send_message_back_in_queue(type_hidden_service, domain, message)
|
if nb_retry == 30:
|
||||||
publisher.error('{} SPASH DOWN'.format(splash_url))
|
on_error_send_message_back_in_queue(type_hidden_service, domain, message)
|
||||||
print('--------------------------------------')
|
publisher.error('{} SPASH DOWN'.format(splash_url))
|
||||||
print(' \033[91m DOCKER SPLASH DOWN\033[0m')
|
print('--------------------------------------')
|
||||||
print(' {} DOWN'.format(splash_url))
|
print(' \033[91m DOCKER SPLASH DOWN\033[0m')
|
||||||
exit(1)
|
print(' {} DOWN'.format(splash_url))
|
||||||
|
exit(1)
|
||||||
|
|
||||||
|
print(' \033[91m DOCKER SPLASH NOT AVAILABLE\033[0m')
|
||||||
|
print(' Retry({}) in 10 seconds'.format(nb_retry))
|
||||||
|
time.sleep(10)
|
||||||
|
|
||||||
if r.status_code == 200:
|
if r.status_code == 200:
|
||||||
process = subprocess.Popen(["python", './torcrawler/tor_crawler.py', splash_url, type_hidden_service, url, domain, paste, super_father],
|
process = subprocess.Popen(["python", './torcrawler/tor_crawler.py', splash_url, type_hidden_service, url, domain, paste, super_father],
|
||||||
|
|
Loading…
Reference in a new issue