Python爬取内涵段子里的段子

发布时间:2019-09-16 07:33:19 | 编辑:auto | 阅读(1465)

    环境:Python3.6



    #!/usr/bin/env python3
    #-*-coding:utf-8-*-
    #version:3.6.4
    __author__ = '杜文涛'
    
    import requests
    import json
    
    
    def get_json_dic(url, timeout=10):
        """Fetch *url* and return its JSON body parsed into Python objects.

        The parsed result is also stored in the module-level ``dict_json``,
        because the script's entry point reads that global.

        Args:
            url: Address of the JSON endpoint to request.
            timeout: Seconds to wait for the server before giving up. Without
                a timeout ``requests`` may block indefinitely.

        Returns:
            The decoded JSON document, as produced by ``json.loads``.

        Raises:
            requests.RequestException: On connection errors, timeouts, or a
                non-success HTTP status.
            ValueError: If the body is not valid UTF-8 or not valid JSON.
        """
        global dict_json
        response = requests.get(url=url, timeout=timeout)
        # Fail loudly on 4xx/5xx instead of trying to parse an error page.
        response.raise_for_status()
        # The body is a JSON string; decode the bytes, then parse.
        dict_json = json.loads(response.content.decode())
        return dict_json
    
    def get_joke(dict_json):
        """Print the jokes of one response page, asking before each one.

        The number of entries on the page is printed first. Before every joke
        the user is prompted; answering ``Y`` or ``y`` prints the joke, any
        other answer terminates the program.

        Args:
            dict_json: Parsed response. The list of entries is read from
                ``dict_json['data']['data']`` and each joke's text from
                ``entry['group']['text']``.

        Raises:
            SystemExit: When the user answers anything other than ``Y``/``y``.
            KeyError: If the response does not have the layout described above.
        """
        entries = dict_json['data']['data']
        print(len(entries))
        # Walk every entry actually present: no skipped first joke and no
        # IndexError when the page holds fewer than 20 entries.
        for entry in entries:
            answer = input('是否继续,Y/N')
            if answer not in ('Y', 'y'):
                # Same effect as exit(), without depending on the site module.
                raise SystemExit
            print(entry['group']['text'])
    
    def get_max_time(dic_json):
        """Return the ``max_time`` value carried by a parsed response.

        The value is also written to the module-level ``max_time`` so that
        callers relying on the global keep working.

        Args:
            dic_json: Parsed response; the value is read from
                ``dic_json['data']['max_time']``.

        Returns:
            The ``max_time`` value found in the response.

        Raises:
            KeyError: If ``data`` or ``max_time`` is missing.
        """
        global max_time
        # Read from the argument, not from the similarly named global.
        max_time = dic_json['data']['max_time']
        return max_time
    
    if __name__ == '__main__':
        # Endpoint prefix; the current max_time value is appended per request.
        base_url = 'http://www.neihanshequ.com/joke/?is_json=1&app_name=neihanshequ_web&max_time='
        # Starting value for the first request; later values come from each
        # response (presumably a Unix timestamp used as a paging cursor).
        max_time = 1519404642

        # One loop handles every page, the first included. It ends when the
        # user declines inside get_joke (SystemExit) or a page has no entries.
        while True:
            url = base_url + str(max_time)
            dict_json = get_json_dic(url)
            if not dict_json['data']['data']:
                # Nothing left to show; avoid re-requesting empty pages forever.
                break
            max_time = get_max_time(dic_json=dict_json)
            get_joke(dict_json=dict_json)
            print(url)

    微信公众号:

    qrcode_for_gh_0cd223682950_344.jpg

关键字