热卖商品
新闻详情
print语句打印出错???【python吧】_百度贴吧
来自 : 百度贴吧
发布时间:2021-03-24
该楼层疑似违规已被系统折叠隐藏此楼查看此楼 总是显示不全,不知道是个什么情况
import requests
from bs4 import BeautifulSoup
from fake_useragent import UserAgent
def get_html():
url = https://dianying.2345.com/top/
headers = { User-Agent : UserAgent().Chrome}
try:
r = requests.get(url=url, timeout=10, headers=headers)
r.raise_for_status()
r.encoding = utf-8
return r.content.decode( GBK )
except:
print( Something Wrong! )
def parse_html():
html = get_html()
soup = BeautifulSoup(html, lxml )
titles = soup.select( div.txt p.pTit span.sTit a )
t = []
[t.append(title.text) for title in titles]
directors = soup.select( div.txt p.pActor )
dir = []
for d in directors:
d = d.text.replace( \\n , ).replace( , )
dir.append(d)
intro = soup.select( div.txt p.pTxt.pIntroShow )
introduction = []
[introduction.append(i.text) for i in intro]
pics = soup.select( div.pic img )
pics_link = []
[pics_link.append(pic[ src ]) for pic in pics]
for i in range(50):
print(t[i])
print(f 片名:{t[i]},导演:{dir[i]} )
# print( 片名: , t[i], 导演: , dir[i])
# print( 导演: , end= )
# print(dir[i])
# print(introduction[i])
print( * *50)
# with open( D:\\\\pachong\\\\Ehco\\\\pic\\\\ + t[i] + .png , wb ) as f:
# f.write(requests.get( http: + pics_link[i]).content)
def main():
parse_html()
if __name__ == __main__ :
main()
姜子牙
程腾 李炜 郑希
**************************************************
import requests
from bs4 import BeautifulSoup
from fake_useragent import UserAgent
def get_html():
url = https://dianying.2345.com/top/
headers = { User-Agent : UserAgent().Chrome}
try:
r = requests.get(url=url, timeout=10, headers=headers)
r.raise_for_status()
r.encoding = utf-8
return r.content.decode( GBK )
except:
print( Something Wrong! )
def parse_html():
html = get_html()
soup = BeautifulSoup(html, lxml )
titles = soup.select( div.txt p.pTit span.sTit a )
t = []
[t.append(title.text) for title in titles]
directors = soup.select( div.txt p.pActor )
dir = []
for d in directors:
d = d.text.replace( \\n , ).replace( , )
dir.append(d)
intro = soup.select( div.txt p.pTxt.pIntroShow )
introduction = []
[introduction.append(i.text) for i in intro]
pics = soup.select( div.pic img )
pics_link = []
[pics_link.append(pic[ src ]) for pic in pics]
for i in range(50):
print(t[i])
print(f 片名:{t[i]},导演:{dir[i]} )
# print( 片名: , t[i], 导演: , dir[i])
# print( 导演: , end= )
# print(dir[i])
# print(introduction[i])
print( * *50)
# with open( D:\\\\pachong\\\\Ehco\\\\pic\\\\ + t[i] + .png , wb ) as f:
# f.write(requests.get( http: + pics_link[i]).content)
def main():
parse_html()
if __name__ == __main__ :
main()
姜子牙
程腾 李炜 郑希
**************************************************
本文链接: http://fakeprint.immuno-online.com/view-696772.html
发布于 : 2021-03-24
阅读(0)
最新动态
2021-03-24
2021-03-24
2021-03-24
2021-03-24
2021-03-24
2021-03-24
2021-03-24
2021-03-24
2021-03-24
2021-03-24
2021-03-24
2021-03-24