-
Notifications
You must be signed in to change notification settings - Fork 414
/
Copy pathrun_validator.py
76 lines (64 loc) · 2.36 KB
/
run_validator.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
# -*- coding: utf-8 -*-
import logging
import os
import subprocess
import sys
import time
import scrapydo
import utils
from importlib import import_module
# Validator spiders to launch, keyed by spider class name; each value is the
# dotted path of the module that defines that class. validator() imports the
# module and looks the class up under the key.
VALIDATORS = {
    'HttpBinSpider': 'crawler.spiders.validator.httpbin',

    # Disabled validators. NOTE(review): these paths use the `ipproxytool.`
    # package prefix while the active entry uses `crawler.` -- presumably they
    # must be updated before being re-enabled; verify against the package
    # layout.
    # 'DoubanSpider': 'ipproxytool.spiders.validator.douban',
    # 'AssetStoreSpider': 'ipproxytool.spiders.validator.assetstore',
    # 'GatherSpider': 'ipproxytool.spiders.validator.gather',
    # 'HttpBinSpider': 'ipproxytool.spiders.validator.httpbin',
    # 'SteamSpider': 'ipproxytool.spiders.validator.steam',
    # 'BossSpider': 'ipproxytool.spiders.validator.boss',
    # 'LagouSpider': 'ipproxytool.spiders.validator.lagou',
    # 'LiepinSpider': 'ipproxytool.spiders.validator.liepin',
    # 'JDSpider': 'ipproxytool.spiders.validator.jd',
    # 'BBSSpider': 'ipproxytool.spiders.validator.bbs',
    # 'ZhiLianSpider': 'ipproxytool.spiders.validator.zhilian',
    # 'AmazonCnSpider': 'ipproxytool.spiders.validator.amazoncn',
}
# Initialise scrapydo once, at import time of this module.
# NOTE(review): nothing else in the visible part of this file uses scrapydo
# (the spiders are run in child processes via run_spider.py) -- confirm this
# call is still required here.
scrapydo.setup()
def _spawn_spider(name):
    """Start ``run_spider.py`` for the spider called *name* in a child process.

    The command is resolved relative to the current working directory.

    Returns:
        The ``subprocess.Popen`` handle of the newly started process.
    """
    return subprocess.Popen(['python', 'run_spider.py', name], shell=False)


def validator():
    """Launch every spider listed in ``VALIDATORS`` and keep them running.

    For each ``VALIDATORS`` entry the module is imported, the spider class is
    looked up by name, and a child process running
    ``python run_spider.py <spider.name>`` is started.

    Afterwards the function loops forever: every 60 seconds it polls each
    child once, logs its status through ``utils.log`` and restarts every
    child that has exited with return code 0. A child that exited with a
    non-zero code is NOT restarted (it only keeps being logged), matching
    the previous behaviour.

    This function never returns.
    """
    process_list = []
    for item, path in VALIDATORS.items():
        spider_cls = getattr(import_module(path), item)
        process_list.append({
            'name': spider_cls.name,
            'popen': _spawn_spider(spider_cls.name),
        })

    while True:
        time.sleep(60)
        for process in process_list:
            name = process.get('name')
            popen = process.get('popen')

            # Poll exactly once so the logged status and the restart decision
            # cannot disagree, and guard against a missing handle *before*
            # dereferencing it.
            status = popen.poll() if popen is not None else None
            utils.log('name:%s poll:%s' % (name, status))

            # Detect finished processes; restart any that exited cleanly.
            if status == 0:
                utils.log('%(name)s spider finish...\n' % {'name': name})
                # Replace the handle in place instead of removing/appending:
                # the list is not mutated during iteration, so every finished
                # spider is restarted in this pass rather than one per minute.
                process['popen'] = _spawn_spider(name)
                # Brief pause between consecutive restarts.
                time.sleep(1)
if __name__ == '__main__':
    # Work from sys.path[0] (for a script run directly, the directory that
    # contains it) so the relative paths below -- and 'run_spider.py' used by
    # validator() -- resolve regardless of where the script was started from.
    script_dir = sys.path[0]
    os.chdir(script_dir)

    # Make sure the log directory exists before logging is pointed at it.
    log_dir = 'log'
    if not os.path.exists(log_dir):
        os.makedirs(log_dir)

    # Everything from DEBUG upwards goes to log/validator.log, timestamped.
    log_settings = {
        'filename': 'log/validator.log',
        'format': '%(asctime)s: %(message)s',
        'level': logging.DEBUG,
    }
    logging.basicConfig(**log_settings)

    # Blocks forever: starts the spiders and supervises them.
    validator()