• 简易版爬虫(豆瓣)



    import requests
    import re
    def get_douban():
        """Fetch the first page of Douban's Top 250 movie list and return its HTML.

        Returns:
            The response body decoded as text.

        Raises:
            requests.RequestException: on connection failure, timeout, or an
                HTTP error status (4xx/5xx).
        """
        # NOTE(review): a browser-like User-Agent is sent because some sites
        # reject the default python-requests one -- confirm it is still needed.
        headers = {"User-Agent": "Mozilla/5.0"}

        # A timeout keeps the script from hanging forever on a stalled connection.
        response = requests.get(
            "https://movie.douban.com/top250?start=0&filter=",
            headers=headers,
            timeout=10,
        )

        # Fail loudly instead of handing an error page to the regex parser.
        response.raise_for_status()

        return response.text
    def run():
        """Scan the downloaded Douban page for movie entries.

        Returns:
            An iterator of ``re.Match`` objects, each exposing the named groups
            ``name``, ``evaluate`` and ``director``.
        """
        page_html = get_douban()

        # Raw strings keep regex escapes intact.  The previous pattern contained
        # "\ns+" (a newline followed by literal "s" characters) where "any
        # whitespace" was intended, so it could not match indented markup.
        # re.S lets "." span line breaks between the captured elements.
        pattern = re.compile(
            r'<span class="title">(?P<name>.*?)</span>.*?<span>(?P<evaluate>.*?)</span>.*?'
            r'<p class="">\s*(?P<director>.*?)&nbsp;&nbsp;&nbsp;?',
            re.S,
        )

        return pattern.finditer(page_html)
    def zuz():
        """Yield one dict per regex match produced by ``run()``.

        Each dict maps ``"name"``, ``"evaluate"`` and ``"director"`` to the text
        captured by the match group of the same name.
        """
        fields = ("name", "evaluate", "director")
        for match in run():
            yield {field: match.group(field) for field in fields}
    # Script entry: print every extracted record, one dict per line.
    for record in zuz():
        print(record)

  • 相关阅读:
    CodeForces
    [AHOI 2013] 差异
    BZOJ
    [校内训练20_09_15]ABC
    [校内训练20_09_10]ABC
    [校内训练20_09_08]AC
    fastIO
    [校内训练20_06_05]ABC
    [校内训练20_06_04]ABC
    [校内训练20_06_03]ABC
  • 原文地址:https://www.cnblogs.com/lizhaoyu/p/7117235.html
Copyright © 2020-2023  润新知