设为首页 加入收藏

TOP

python3-爬取cnnvd漏洞信息(三)
2017-11-22 06:07:16 浏览:422
Tags:python3- 爬取 cnnvd 漏洞 信息
tml,'html.parser') try: holes_titles1 = holes_title_soup2.find_all(name='p')[0].string holes_titles2 = holes_title_soup2.find_all(name='p')[1].string holes_titles = holes_titles1 + holes_titles2 holes_titles = holes_titles.replace(' ','').replace('\t','').replace('\r','').replace('\n','') except: holes_titles = '' holes_result_list.append(holes_titles) #漏洞公告 holes_notice_html = holes_detainled_soup1.find('div',attrs={'class':'d_ldjj m_t_20'}) #定义 漏洞公告 块的soup holes_notice_html = holes_notice_html.decode() holes_notice_soup2 = BeautifulSoup(holes_notice_html,'html.parser') try: holes_notice1 = holes_notice_soup2.find_all(name='p')[0].string holes_notice2 = holes_notice_soup2.find_all(name='p')[1].string holes_notice = holes_notice1+holes_notice2 holes_notice = holes_notice.replace('\n','').replace('\r','').replace('\t','') except: holes_notice = '' holes_result_list.append(holes_notice) #参考网址 holes_reference_html = holes_detainled_soup1.find_all('div',attrs={'class':'d_ldjj m_t_20'})[1] #定义 参考网址 块的soup holes_reference_html = holes_reference_html.decode() holes_reference_soup2 = BeautifulSoup(holes_reference_html,'html.parser') try: holes_reference = holes_reference_soup2.find_all(name='p')[1].string holes_reference = holes_reference.replace('\n','').replace('\r','').replace('\t','').replace('链接:','') except: holes_reference = '' holes_result_list.append(holes_reference) #受影响实体 holes_effect_html = holes_detainled_soup1.find_all('div',attrs={'class':'d_ldjj m_t_20'})[2] #定义 受影响实体 块的soup holes_effect_html = holes_effect_html.decode() holes_effect_soup2 = BeautifulSoup(holes_effect_html,'html.parser') try: holes_effect = holes_effect_soup2.find_all(name='p')[0].string holes_effect = holes_effect.replace('\n','').replace('\r','').replace('\t','').replace(' ','') except: try: holes_effect = holes_effect_soup2.find_all(name='a')[0].string holes_effect = holes_effect.replace('\n','').replace('\r','').replace('\t','').replace(' ','') except: holes_effect = '' 
holes_result_list.append(holes_effect) #补丁 holes_patch_html = holes_detainled_soup1.find_all('div',attrs={'class':'d_ldjj m_t_20'})[3] #定义 补丁 块的soup holes_patch_html = holes_patch_html.decode() holes_patch_soup2 = BeautifulSoup(holes_patch_html,'html.parser') try: holes_patch = holes_patch_soup2.find_all(name='p')[0].string holes_patch = holes_patch.replace('\n','').replace('\r','').replace('\t','').replace(' ','') except: holes_patch = '' holes_result_list.append(holes_patch) #漏洞信息写入excel def holes_excel(excel): workbook = xlsxwriter.Workbook('holes_data.xlsx') worksheet = workbook.add_worksheet() row = 0 col = 0 worksheet.write(row,0,'漏洞名称') worksheet.write(row,1,'CNNVD编号') worksheet.write(row,2,'危害等级') worksheet.write(row,3,'CVE编号') worksheet.write(row,4,'漏洞类型') worksheet.write(row,5,'发布时间') worksheet.write(row,6,'攻击途径') worksheet.write(row,7,'更新时间') worksheet.write(row,8,'厂商') worksheet.write(row,9,'漏洞来源') worksheet.write(row,10,'漏洞描述') worksheet.write(row,11,'解决方案') worksheet.write(row,12,'参考链接') worksheet.write(row,13,'受影响实体') worksheet.write(row,14,'补丁') row = 1 for i in range(l
首页 上一页 1 2 3 4 下一页 尾页 3/4/4
【打印繁体】【投稿】【收藏】 【推荐】【举报】【评论】 【关闭】 【返回顶部】
上一篇[Python]嵌套循环nested loop-练.. 下一篇Python入门3

最新文章

热门文章

Hot 文章

Python

C 语言

C++基础

大数据基础

linux编程基础

C/C++面试题目