美文网首页
爬取豆瓣top250的电影和电影概括

爬取豆瓣top250的电影和电影概括

作者: lvanzn | 来源:发表于2018-10-09 14:50 被阅读0次
    import requests
    from bs4 import BeautifulSoup
    
    
    def getHTML(url):
        """Download *url* and return the response body decoded as text.

        Args:
            url: Absolute URL of the page to fetch.

        Returns:
            The response body as a ``str`` (``Response.text``).

        Raises:
            requests.RequestException: On connection problems, on timeout, or
                when the server answers with a 4xx/5xx status code.
        """
        # NOTE(review): many sites refuse the default "python-requests/x.y"
        # User-Agent; a browser-like value is sent to avoid being blocked.
        # Confirm this is acceptable under the target site's terms of use.
        headers = {
            'User-Agent': (
                'Mozilla/5.0 (Windows NT 10.0; Win64; x64) '
                'AppleWebKit/537.36 (KHTML, like Gecko) '
                'Chrome/120.0 Safari/537.36'
            )
        }
        # Without a timeout, requests waits indefinitely on a stalled server.
        response = requests.get(url, headers=headers, timeout=10)
        # Fail loudly on an error page rather than handing its HTML to the
        # parser, where it would silently yield no movies.
        response.raise_for_status()
        return response.text
    
    
    def getInfo(list, qlist):
        """Scrape the ten Top-250 listing pages into two parallel lists.

        For every ``<div class="hd">`` found, ``[rank, title]`` is appended to
        *list* and exactly one entry is appended to *qlist*: the text of the
        ``<p class="quote">`` that follows that title, or ``''`` when the
        movie has no quote. Appending in lock-step keeps each appended quote
        at the same offset as its movie, even when some movies have no quote.

        Args:
            list: Output list, extended in place with ``[rank, title]`` pairs.
                (The name shadows the builtin; kept for caller compatibility.)
            qlist: Output list, extended in place with one quote string per
                movie appended to *list*.

        Returns:
            None. Results are delivered through the two list arguments.
        """
        def is_title_or_quote(tag):
            # Select title containers and quote paragraphs in a single pass so
            # that find_all() yields them interleaved in document order.
            classes = tag.get('class') or []
            if tag.name == 'div':
                return 'hd' in classes
            return tag.name == 'p' and 'quote' in classes

        cnt = 0
        for i in range(10):
            turl = 'https://movie.douban.com/top250?start=' + str(i * 25)
            soup = BeautifulSoup(getHTML(turl), 'html.parser')
            # True while the most recently appended movie still lacks a quote.
            awaiting_quote = False
            # NOTE(review): assumes a movie's quote appears after its title and
            # before the next title in the page markup -- confirm against the
            # live HTML.
            for tag in soup.find_all(is_title_or_quote):
                if tag.name == 'div':
                    title = tag.a.span if tag.a is not None else None
                    if title is None:
                        # Malformed entry: skip it, and make sure a following
                        # quote is not attached to the previous movie.
                        awaiting_quote = False
                        continue
                    cnt += 1
                    list.append([cnt, title.text.strip()])
                    qlist.append('')  # placeholder, filled in if a quote follows
                    awaiting_quote = True
                elif awaiting_quote and tag.span is not None:
                    qlist[-1] = tag.span.text.strip()
                    awaiting_quote = False
    
    
    
    def printInfo(list, qlist):
        """Print a header row followed by one row per collected movie.

        Every entry of *list* is printed, starting with the first one. Rows are
        no longer limited to a hard-coded index range, so a short or empty
        result set prints what is available instead of raising ``IndexError``.

        Args:
            list: Sequence of ``[rank, title]`` pairs.
                (The name shadows the builtin; kept for caller compatibility.)
            qlist: Sequence of quote strings, matched to *list* by position.
                A movie whose position has no entry in *qlist* is printed with
                an empty quote.

        Returns:
            None. Output goes to standard output.
        """
        # chr(12288) is the full-width (ideographic) space; it is passed as the
        # fill character for the title and quote columns.
        fill = chr(12288)
        module = "{0:^5}\t{1:{3}^20}\t{2:{3}<30}"
        print(module.format("排名", "电影名称", "一句话概括", fill))
        for index, entry in enumerate(list):
            quote = qlist[index] if index < len(qlist) else ''
            print(module.format(entry[0], entry[1], quote, fill))
    
    
    def main():
        """Scrape the movie titles and quotes, then print them as a table."""
        # getInfo() fills both containers in place; printInfo() reads them.
        movies, quotes = [], []
        getInfo(movies, quotes)
        printInfo(movies, quotes)
    
    
    # Run the scraper only when executed as a script, not when imported.
    if __name__ == "__main__":
        main()
    

    相关文章

      网友评论

          本文标题:爬取豆瓣top250的电影和电影概括

          本文链接:https://www.haomeiwen.com/subject/kfoeaftx.html