代码拉取完成,页面将自动刷新
import html
import json
import webbrowser
from pathlib import Path

import requests
from bs4 import BeautifulSoup
# Douban "now playing" listing page that is passed to getM.getNowPlaying()
# further down. The trailing path segment ('dongying') presumably selects the
# city whose cinemas are listed -- TODO confirm against the site.
nowplayingUrl = 'https://movie.douban.com/cinema/nowplaying/dongying/'
class getM():
    """Scrape Douban movie listing pages into HTML-ready text fragments.

    Both public methods are static and are meant to be called on the class,
    e.g. ``getM.getNowPlaying(url)``. Each returns a single string made of
    CRLF-terminated lines. Links are emitted as ``<a>`` tags and every piece
    of scraped text is HTML-escaped, because the result is an HTML fragment
    that callers embed in a page.
    """

    # Upper bound, in seconds, on how long a single HTTP request may block.
    # Without it ``requests.get`` can wait forever on a stalled connection.
    _TIMEOUT = 10

    @staticmethod
    def _fetch_soup(url):
        """Download *url* and return it parsed with ``html.parser``.

        Raises:
            requests.HTTPError: on a 4xx/5xx response, so that an error page
                is never silently parsed as if it were a listing.
            requests.RequestException: on connection problems or timeout.
        """
        response = requests.get(url, timeout=getM._TIMEOUT)
        response.raise_for_status()
        return BeautifulSoup(response.text, 'html.parser')

    @staticmethod
    def _anchor(href):
        """Return an ``<a target="_blank">`` tag that links to and shows *href*."""
        # The attribute value is quoted and escaped: the URLs carry query
        # strings ('=', '&'), which are not safe in an unquoted attribute.
        safe = html.escape(href, quote=True)
        return '<a target="_blank" href="' + safe + '">' + safe + '</a>'

    @staticmethod
    def _link_in(item, css_class):
        """Return the first ``<a>`` inside ``<li class=css_class>`` of *item*.

        Returns ``None`` when either the ``<li>`` or the ``<a>`` is absent.
        """
        cell = item.find("li", attrs={"class": css_class})
        return cell.find('a') if cell is not None else None

    @staticmethod
    def getNowPlaying(url):
        """Return title, rating, detail link and ticket link of each movie.

        Args:
            url: address of a Douban "now playing" page.

        Returns:
            One string with four CRLF-terminated lines per movie. A field
            that cannot be found on the page is replaced by its Chinese
            "not available" placeholder. An empty string is returned when
            the page has no element with id ``nowplaying``.

        Raises:
            requests.RequestException: if the page cannot be downloaded.
        """
        container = getM._fetch_soup(url).find(id='nowplaying')
        if container is None:
            return ''

        lines = []
        for item in container.find_all("li", attrs={"class": "list-item"}):
            # Look every element up once; any of them may be missing.
            title_link = getM._link_in(item, 'stitle')
            ticket_link = getM._link_in(item, 'sbtn')
            rating_cell = item.find("li", attrs={"class": 'srating'})

            title = title_link.get('title') if title_link is not None else None
            detail_href = title_link.get('href') if title_link is not None else None
            ticket_href = ticket_link.get('href') if ticket_link is not None else None
            score = (rating_cell.find('span', 'subject-rate')
                     if rating_cell is not None else None)

            lines.append('电影名称:'
                         + (html.escape(title) if title is not None else '暂无名称'))
            lines.append('评分:'
                         + (html.escape(score.text) if score is not None else '暂无评分'))
            lines.append('电影简介:'
                         + (getM._anchor(detail_href) if detail_href is not None else '暂无简介'))
            lines.append('购票地址:'
                         + (getM._anchor(ticket_href) if ticket_href is not None else '暂无地址'))

        return ''.join(line + '\r\n' for line in lines)

    @staticmethod
    def getComing(url):
        """Return date, title, genre, region, interest and link per upcoming movie.

        Args:
            url: address of a Douban "coming soon" page.

        Returns:
            One string with six CRLF-terminated lines per movie followed by
            two empty lines. Rows with fewer than five ``<td>`` cells are
            skipped. An empty string is returned when the page has no
            ``<table class="coming_list">``.

        Raises:
            requests.RequestException: if the page cannot be downloaded.
        """
        table = getM._fetch_soup(url).find('table', 'coming_list')
        if table is None:
            return ''
        # html.parser does not synthesise <tbody>; fall back to the table
        # itself when the markup omits it.
        body = table.find('tbody')
        if body is None:
            body = table

        labels = ('上映日期:', '片名:', '类型:', '制片地区:', '想看:')
        lines = []
        for row in body.find_all('tr'):
            cells = row.find_all('td')
            if len(cells) < len(labels):
                # Header rows (<th>) or malformed rows carry no movie data.
                continue

            for label, cell in zip(labels, cells):
                lines.append(label + html.escape(cell.text.strip()))

            # The detail link lives in the title cell (second column).
            link = cells[1].find('a')
            href = link.get('href') if link is not None else None
            if href is not None:
                lines.append('简介:' + getM._anchor(href.strip()))
            else:
                lines.append('简介:暂无简介')

            # Two empty lines separate consecutive movies.
            lines.extend(('', ''))

        return ''.join(line + '\r\n' for line in lines)
# Name of the generated report; it is written to the current directory.
GEN_HTML = 'asd.html'

# Scrape each listing exactly once and reuse the text for both the console
# dump and the HTML page, so Douban is not hit twice per listing.
now_playing_text = getM.getNowPlaying(nowplayingUrl)
print(now_playing_text)
coming_text = getM.getComing('https://movie.douban.com/coming')
print(coming_text)

# The scraped text uses CRLF line ends; in HTML they must become <br/>.
content = now_playing_text.replace('\r\n', '<br/>')
coming = coming_text.replace('\r\n', '<br/>')

message = """
<html>
<head>
<meta name="renderer" content="webkit" />
<meta http-equiv="X-UA-Compatible" content="IE=edge,chrome=1" />
<meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
</head>
<body>
<p>Hello,World!</p>
<p>豆瓣电影</p>
<div>
<p>热映</p>
%s
</div>
<div>
<p>即将上映</p>
%s
</div>
</body>
</html>""" % (content, coming)

# The context manager closes the file even if the write fails.
with open(GEN_HTML, 'w', encoding='utf8') as f:
    f.write(message)

# Hand the browser an absolute file:// URL; opening a bare relative filename
# through webbrowser.open() is documented as unsupported and non-portable.
webbrowser.open(Path(GEN_HTML).resolve().as_uri(), new=1)
此处可能存在不合适展示的内容,页面不予展示。您可通过相关编辑功能自查并修改。
如您确认内容无涉及 不当用语 / 纯广告导流 / 暴力 / 低俗色情 / 侵权 / 盗版 / 虚假 / 无价值内容或违法国家有关法律法规的内容,可点击提交进行申诉,我们将尽快为您处理。