"""Scrape the Maoyan Top-100 movie board and append every entry to result.txt.

Board URL: https://maoyan.com/board/4
"""
import time
from typing import List, Optional

import requests
from bs4 import BeautifulSoup

# Seconds to wait for the server before giving up on a request.
REQUEST_TIMEOUT = 10


def get_content(url: str) -> Optional[str]:
    """Download *url* and return the response body as text.

    Returns ``None`` when the server answers with a status other than 200.
    Network errors raised by ``requests`` propagate to the caller.
    """
    headers = {
        'User-Agent': (
            'Mozilla/5.0 (Windows NT 10.0; Win64; x64) '
            'AppleWebKit/537.36 (KHTML, like Gecko) '
            'Chrome/80.0.3987.87 Safari/537.36'
        ),
        'Accept-Language': 'zh-CN,zh;q=0.9',
    }
    # Without a timeout a stalled connection would block the script forever.
    r = requests.get(url, headers=headers, timeout=REQUEST_TIMEOUT)
    if r.status_code == 200:
        return r.text
    return None


def get_info(html: str) -> List[List[str]]:
    """Extract the movie entries from one board page.

    Returns one ``[rank, name, actor, release_time, score]`` list per ``<dd>``
    element found inside ``<dl class="board-wrapper">``.

    Raises:
        ValueError: if the page has no ``board-wrapper`` list.
    """
    soup = BeautifulSoup(html, 'lxml')
    board = soup.find('dl', class_='board-wrapper')
    if board is None:
        # NOTE(review): presumably an anti-bot / verification page was served
        # instead of the board; fail loudly so the caller can retry.
        raise ValueError('board-wrapper list not found in page')

    movies = []
    for item in board.find_all('dd'):
        rank = item.find('i').text
        name = item.find('p', class_='name').text
        # Drop the first 3 characters (presumably the leading label of the
        # cast line -- confirm against the live markup).
        actor = item.find('p', class_='star').text.strip()[3:]
        # Drop the first 5 characters (presumably the release-time label).
        release_time = item.find('p', class_='releasetime').text.strip()[5:]
        score = item.find('p', class_='score').text
        movies.append([rank, name, actor, release_time, score])
    return movies


def write_to_file(l_: List[List[str]]) -> None:
    """Append each row of *l_* to ``result.txt`` as its ``str()`` form, one per line."""
    with open('result.txt', 'a', encoding='utf-8') as f:
        f.writelines(str(row) + '\n' for row in l_)


def main(i: int) -> None:
    """Fetch the board page starting at offset *i*, parse it and store the rows.

    Raises:
        RuntimeError: if the page could not be downloaded (non-200 response).
    """
    url = 'https://maoyan.com/board/4?offset={}'.format(i)
    html = get_content(url)
    if html is None:
        # Fail with a clear message instead of handing None to the parser.
        raise RuntimeError('failed to fetch {}'.format(url))
    write_to_file(get_info(html))


if __name__ == '__main__':
    # Offsets 0, 10, ..., 90 -- one request per step.
    for offset in range(0, 100, 10):
        try:
            main(offset)
        except Exception:
            # Retry the page once; a second failure aborts the run.
            # ``Exception`` (not a bare ``except``) keeps Ctrl-C working.
            main(offset)
        # Pause between pages to avoid hammering the site.
        time.sleep(1)
