天天看点

Python 获取微博热搜

# 获取热搜源码
import json
import re

import requests as requests


def main(json_list=None):
    """Fetch the Weibo hot-search page and print the parsed entries as JSON.

    The page at ``http://s.weibo.com/top/summary`` is downloaded, every table
    row matching the pattern below is turned into a dict with the keys
    ``num`` (rank digits), ``url`` (``https://s.weibo.com`` + the row's
    ``href``), ``key`` (link text) and ``hotNum`` (text of the ``<span>``),
    and the resulting list is printed as indented, non-ASCII-escaped JSON.

    Args:
        json_list: Optional list to append the parsed entries to. It is
            mutated in place, so a caller-supplied list receives the
            results. When omitted, a new empty list is used for this call.

    Raises:
        requests.exceptions.RequestException: If the HTTP request fails or
            does not complete within the timeout.
    """
    # Create the list per call: a mutable default (``[]``) is evaluated once
    # and shared, so repeated calls would accumulate earlier results.
    if json_list is None:
        json_list = []

    # Bound the wait (seconds) so a stalled connection cannot hang forever;
    # without ``timeout`` requests waits indefinitely.
    response = requests.get('http://s.weibo.com/top/summary', timeout=10)
    html = response.text

    # Capture groups, in order: rank, relative href, keyword text, hot count.
    # NOTE(review): the duplicated ``target="_blank"`` / ``rel`` attributes in
    # the pattern must match the served markup exactly -- confirm against the
    # live page; if they differ, no rows are found and ``[]`` is printed.
    regex = re.compile(
        r'<tr class="">\s+<td class="td-01 ranktop">(\d+)</td>\s+<td class="td-02">\s+<a href="(\S+)" target="_blank" rel="external nofollow"  target="_blank">('
        r'.*?)</a>\s+<span>(.*?)</span>\s+</td>\s+<td class="td-03">.*</td>\s+</tr>')

    # ``extend`` with a generator instead of a comprehension run only for
    # its ``append`` side effects (which built a throwaway list of ``None``).
    json_list.extend(
        dict(num=num, url="https://s.weibo.com" + path, key=key, hotNum=hot_num)
        for num, path, key, hot_num in regex.findall(html)
    )
    print(json.dumps(json_list, indent=2, ensure_ascii=False))


# Run the scraper only when this file is executed as a script, not on import.
if __name__ == '__main__':
    main()
           
Python 获取微博热搜