1 Star 1 Fork 1

Draycen / Spider

加入 Gitee
与超过 1200万 开发者一起发现、参与优秀开源项目,私有仓库也完全免费 :)
免费加入
克隆/下载
Spider.py 3.97 KB
一键复制 编辑 原始数据 按行查看 历史
Mingfei Gao 提交于 2017-07-11 21:55 . 增加关键词
# -*- coding: utf-8 -*-
######################
# Author : 高明飞
# Data : 2016-07-25
# Brief : 用于自动检查新信息的爬虫
######################
import time, logging
import logging.handlers
from ZJU_Talk import *
from SJTU_Talk import *
from FD_Talk import *
from YJS import *
from RuanKao import *
# Init
FinanceKeywords = [
'金融', '投资', '资产', '债券', '证券', '期货', '银行', '保险',
'基金', '信托', 'analyst', 'Analyst'
]
EngineerKeywords = [
'Linux', 'linux', '嵌入式', 'C++', 'RTOS', 'firmware', 'Firmware',
'固件', 'ARM', 'arm', 'C语言', '操作系统', '虚拟化', '中间件',
'Hadoop', '虚拟机', 'MapReduce', '分布式', '大数据开发', '并行计算',
'云计算', 'Spark', 'Storm', '流式计算'
]
HardwareKeywords = [
'硬件', '电路', 'Altium', '单片机', '信号完整性', '电子设计', '系统设计',
'PCB', '原理图', 'EMC', 'EMI', '电磁兼容', '数字电路', '模拟电路',
'数电', '模电', 'Cadence', '基带'
]
HardwareSpecialKeywords = [
'硬件工程师', '电子工程师', '射频工程师', '硬件应用工程师', '硬件开发工程师', '硬件设计工程师', '硬件技术工程师'
]
EngineerSpecialKeywords = [
'嵌入式工程师', '嵌入式开发工程师', '固件工程师', '驱动工程师', '驱动开发工程师', '操作系统工程师', '操作系统开发工程师',
'算法工程师', '软件开发工程师', '软件工程师'
]
WebList = []
WebList.append(ZJU_Talk('浙大招聘宣讲会', 'ZJU_Talk_Engineer', 7, EngineerKeywords, EngineerSpecialKeywords))
# WebList.append(ZJU_Talk('浙大金融宣讲会', 'ZJU_Talk_Finance', 6, FinanceKeywords))
# WebList.append(SJTU_Talk('交大金融宣讲会', 'SJTU_Talk_Finance', 8, FinanceKeywords))
WebList.append(SJTU_Talk('交大招聘宣讲会', 'SJTU_Talk_Engineer', 9, EngineerKeywords, EngineerSpecialKeywords))
# WebList.append(FD_Talk('复旦金融宣讲会', 'FD_Talk_Finance', 10, FinanceKeywords))
WebList.append(FD_Talk('复旦招聘宣讲会', 'FD_Talk_Engineer', 11, EngineerKeywords, EngineerSpecialKeywords))
# WebList.append(YJS('应届生金融招聘', 'YJS_Finance', 12, FinanceKeywords))
WebList.append(YJS('应届生工程师招聘', 'YJS_Engineer', 13, EngineerKeywords, EngineerSpecialKeywords))
WebList.append(RuanKao(5))
LOG_FILE = "Debug.log"
# logging.basicConfig(
# filename='%s.log'%(time.strftime("%Y_%m_%d", time.localtime())), level=logging.WARNING,
# format='%(asctime)s : %(message)s')
logger = logging.getLogger()
fh = logging.handlers.TimedRotatingFileHandler(LOG_FILE, when='D', interval=1, backupCount=7)
formatter = logging.Formatter('%(asctime)s : %(message)s')
fh.setFormatter(formatter)
logger.addHandler(fh)
logging.critical('Program Start!\n')
while True:
logging.warning('Start a new loop~')
for web in WebList:
try:
logging.warning('************************')
web.GET()
except Exception as err:
logging.error('Unexpected ERROR!!!!!!')
logging.error(repr(err))
# traceback.print_exc()
web.err += 1
if 4 == web.err:
try:
web.ReportErrStatus(repr(err), True)
logging.warning('Send Wchat Error Report.')
except:
logging.critical('Send Wchat Error Report Error!!!!!')
else:
if web.err >= 4:
try:
web.ReportErrStatus('', False)
logging.warning('Send Wchat Recovery Report.')
except:
logging.critical('Send Wchat Recovery Report Error!!!!!')
web.err = 0
finally:
web.Update()
logging.warning('************************')
logging.warning('End of a loop~\n')
time.sleep(900)
logging.critical('Program End!\n')
马建仓 AI 助手
尝试更多
代码解读
代码找茬
代码优化
Python
1
https://gitee.com/Draycen/Spider.git
git@gitee.com:Draycen/Spider.git
Draycen
Spider
Spider
master

搜索帮助

344bd9b3 5694891 D2dac590 5694891