这段代码用于获取豆瓣电影 Top 100 的信息:
import requests
from bs4 import BeautifulSoup
def get_urls(url, total=100, page_size=25):
    """Build the page URLs that together cover the first ``total`` entries.

    Args:
        url: Address of the first page of the ranking; it is returned
            unchanged as the first element.
        total: Number of ranked entries to cover (default 100).
        page_size: Step between successive ``start`` offsets (default 25).

    Returns:
        A list of URLs: ``url`` itself, followed by one
        ``<url>?start=<offset>&filter=`` entry for every further offset
        below ``total``. Empty when ``total`` is 0.
    """
    # Later pages are derived from ``url`` instead of a hard-coded address so
    # the first page and the following pages always point at the same list.
    return [
        url if offset == 0 else '{}?start={}&filter='.format(url, offset)
        for offset in range(0, total, page_size)
    ]
def get_details(url):
    """Fetch one ranking page and extract every movie listed on it.

    Each movie is printed as ``title rating link`` and is also collected, so
    callers can use the data instead of only seeing it on stdout.

    Args:
        url: Address of the ranking page to download.

    Returns:
        A list of ``(title, rating, link)`` tuples, one per ``.info`` element
        that contains all three pieces; empty when the page has none.

    Raises:
        requests.RequestException: If the request fails, times out, or the
            server answers with an HTTP error status.
    """
    # NOTE(review): Douban reportedly rejects the default python-requests
    # User-Agent (HTTP 418), hence the browser-like header -- confirm.
    headers = {'User-Agent': 'Mozilla/5.0 (X11; Linux x86_64)'}
    # Without a timeout, requests can wait forever on a stalled connection.
    res = requests.get(url, headers=headers, timeout=10)
    # Fail loudly on 4xx/5xx instead of silently parsing an error page.
    res.raise_for_status()
    soup = BeautifulSoup(res.text, 'html.parser')

    movies = []
    for content in soup.select('.info'):
        title_tag = content.select_one('.title')
        link_tag = content.select_one('a')
        rating_tag = content.select_one('.rating_num')
        if title_tag is None or rating_tag is None:
            # Skip malformed entries rather than crashing with IndexError.
            continue
        if link_tag is None or link_tag.get('href') is None:
            continue
        movie = (title_tag.text, rating_tag.text, link_tag['href'])
        print(*movie)
        movies.append(movie)
    return movies
def get_movie(main_url):
    """Scrape every page of the ranking that starts at ``main_url``.

    The list of page URLs is printed first, then each page is handed to
    ``get_details``.

    Args:
        main_url: Address of the first page of the ranking.

    Returns:
        A list holding the items ``get_details`` returned for each page, in
        page order; empty when ``get_details`` returns nothing.
    """
    all_urls = get_urls(main_url)
    print(all_urls)

    movies = []
    for url in all_urls:
        details = get_details(url)
        # ``get_details`` may return None; collect only real results so a
        # placeholder is neither printed nor stored.
        if details:
            movies.extend(details)
    return movies
# First page of the Douban Top 250 ranking; the scrape starts from here.
main_url = 'https://movie.douban.com/top250'
info = get_movie(main_url)
![](http://imgsrc.baidu.com/forum/w%3D580/sign=1d1131e246086e066aa83f4332097b5a/bf35b119ebc4b745e6211ac5c5fc1e178b821508.jpg)
![](http://imgsrc.baidu.com/forum/w%3D580/sign=0f89d4eb64061d957d4637304bf50a5d/0679e9c4b74543a924ae571f14178a82b8011408.jpg)
![](http://imgsrc.baidu.com/forum/w%3D580/sign=eb80f6e517950a7b75354ecc3ad0625c/5ea4b54543a98226687486f48082b9014b90eb09.jpg)
import requests
from bs4 import BeautifulSoup
def get_urls(url, total=100, page_size=25):
    """Build the page URLs that together cover the first ``total`` entries.

    Args:
        url: Address of the first page of the ranking; it is returned
            unchanged as the first element.
        total: Number of ranked entries to cover (default 100).
        page_size: Step between successive ``start`` offsets (default 25).

    Returns:
        A list of URLs: ``url`` itself, followed by one
        ``<url>?start=<offset>&filter=`` entry for every further offset
        below ``total``. Empty when ``total`` is 0.
    """
    # Later pages are derived from ``url`` instead of a hard-coded address so
    # the first page and the following pages always point at the same list.
    return [
        url if offset == 0 else '{}?start={}&filter='.format(url, offset)
        for offset in range(0, total, page_size)
    ]
def get_details(url):
    """Fetch one ranking page and extract every movie listed on it.

    Each movie is printed as ``title rating link`` and is also collected, so
    callers can use the data instead of only seeing it on stdout.

    Args:
        url: Address of the ranking page to download.

    Returns:
        A list of ``(title, rating, link)`` tuples, one per ``.info`` element
        that contains all three pieces; empty when the page has none.

    Raises:
        requests.RequestException: If the request fails, times out, or the
            server answers with an HTTP error status.
    """
    # NOTE(review): Douban reportedly rejects the default python-requests
    # User-Agent (HTTP 418), hence the browser-like header -- confirm.
    headers = {'User-Agent': 'Mozilla/5.0 (X11; Linux x86_64)'}
    # Without a timeout, requests can wait forever on a stalled connection.
    res = requests.get(url, headers=headers, timeout=10)
    # Fail loudly on 4xx/5xx instead of silently parsing an error page.
    res.raise_for_status()
    soup = BeautifulSoup(res.text, 'html.parser')

    movies = []
    for content in soup.select('.info'):
        title_tag = content.select_one('.title')
        link_tag = content.select_one('a')
        rating_tag = content.select_one('.rating_num')
        if title_tag is None or rating_tag is None:
            # Skip malformed entries rather than crashing with IndexError.
            continue
        if link_tag is None or link_tag.get('href') is None:
            continue
        movie = (title_tag.text, rating_tag.text, link_tag['href'])
        print(*movie)
        movies.append(movie)
    return movies
def get_movie(main_url):
    """Scrape every page of the ranking that starts at ``main_url``.

    The list of page URLs is printed first, then each page is handed to
    ``get_details``.

    Args:
        main_url: Address of the first page of the ranking.

    Returns:
        A list holding the items ``get_details`` returned for each page, in
        page order; empty when ``get_details`` returns nothing.
    """
    all_urls = get_urls(main_url)
    print(all_urls)

    movies = []
    for url in all_urls:
        details = get_details(url)
        # ``get_details`` may return None; collect only real results so a
        # placeholder is neither printed nor stored.
        if details:
            movies.extend(details)
    return movies
# First page of the Douban Top 250 ranking; the scrape starts from here.
main_url = 'https://movie.douban.com/top250'
# Run the scrape and keep whatever get_movie returns.
info = get_movie(main_url)
![](http://imgsrc.baidu.com/forum/w%3D580/sign=1d1131e246086e066aa83f4332097b5a/bf35b119ebc4b745e6211ac5c5fc1e178b821508.jpg)
![](http://imgsrc.baidu.com/forum/w%3D580/sign=0f89d4eb64061d957d4637304bf50a5d/0679e9c4b74543a924ae571f14178a82b8011408.jpg)
![](http://imgsrc.baidu.com/forum/w%3D580/sign=eb80f6e517950a7b75354ecc3ad0625c/5ea4b54543a98226687486f48082b9014b90eb09.jpg)