批量查询网址是否备案
- 作者: 不是二是四
- 来源: 51数据库
- 2022-08-12
#coding:utf-8
import requests,xlrd,datetime,threading,sys
from bs4 import BeautifulSoup
# Python 2 only: force the implicit str<->unicode conversion codec to UTF-8 so
# that byte-string templates can be formatted with unicode cell values.
# On Python 3 `reload` is not a builtin and `sys.setdefaultencoding` does not
# exist (the default is already UTF-8), so the hack is skipped there.
if sys.version_info[0] == 2:
    reload(sys)  # re-expose sys.setdefaultencoding, which is removed at startup
    sys.setdefaultencoding("utf-8")
def _has_record(html):
    """Return True if *html* contains a registration record cell.

    A record is recognised as a ``<td class="tdright">`` nested inside a
    ``<div id="contenthtml">`` container.
    """
    soup = BeautifulSoup(html, 'html.parser')
    for container in soup.find_all('div', id='contenthtml'):
        if container.find('td', class_='tdright') is not None:
            return True
    return False


def beian(url, excel, timeout=10):
    """Check every cell of an Excel sheet against the registration query page.

    Opens the workbook at *excel*, walks every column of the sheet named
    ``Sheet1`` and POSTs each non-empty cell value to *url*. Exactly one
    verdict line is printed per value: registered, not registered, or query
    failed.

    Args:
        url: Address of the query endpoint that receives the POST.
        excel: Path of the workbook to read.
        timeout: Seconds to wait for each HTTP request before giving up.

    Returns:
        None. Results are written to standard output.
    """
    workbook = xlrd.open_workbook(excel)
    sheet = workbook.sheet_by_name('Sheet1')
    for col_index in range(sheet.ncols):
        for each in sheet.col_values(col_index):
            # Empty cells carry nothing to look up; skip them instead of
            # sending a blank query.
            if each is None or each == '':
                continue
            # NOTE(review): the guid is sent unchanged with every request;
            # presumably a token the query form expects -- confirm.
            data = {'s': each, 'guid': '1e4b4b3f-310f-4aaa-90f7-a552db48758d'}
            try:
                r = requests.post(url, data=data, timeout=timeout)
            except requests.RequestException as exc:
                # One unreachable request must not abort the whole batch.
                print('%s 查询失败: %s' % (each, exc))
                continue
            # A page without any record cell (including a page without the
            # container at all) counts as "not registered", so every queried
            # value yields exactly one verdict.
            if _has_record(r.content):
                print('%s 已备案' % each)
            else:
                print('%s 未备案' % each)
if __name__ == "__main__":
    # Script entry point: run the batch lookup in a worker thread and print
    # the wall-clock start and end times around it.
    url = 'http://www.51sjk.com/Upload/Articles/1/0/320/320902_20220812160139866.aspx'
    # NOTE(review): this is a raw string, so both backslashes are kept and the
    # path is literally C:\\1.xlsx -- confirm that is intended.
    excel = (r'C:\\1.xlsx')
    # Parenthesised print works both as a Python 2 statement and a Python 3 call.
    print("程序开始运行%s" % datetime.datetime.now())
    threads = [threading.Thread(target=beian, args=(url, excel))]
    # Start every worker before waiting on any of them, so that additional
    # threads would actually run concurrently.
    for th in threads:
        th.daemon = True
        th.start()
    for th in threads:
        th.join()
    print("程序结束时间%s" % datetime.datetime.now())
推荐阅读
热点文章
Discord.py(重写)on_member_update 无法正常工作
0
Discord.py 在 vc 中获取用户分钟数
0
discord.py 重写 |为我的命令出错
0
Discord.py rewrite 如何 DM 命令?
0
播放音频时,最后一部分被切断.如何解决这个问题?(discord.py)
0
在消息删除消息 Discord.py
0
如何使 discord.py 机器人私人/直接消息不是作者的人?
0
(Discord.py) 如何获取整个嵌入内容?
0
Discord bot 尽管获得了许可,但不能提及所有人
0
Discord.py discord.NotFound 异常
0
