"""Fetch GitHub's trending page for one language and dump the matches to CSV."""
import re
from urllib.parse import quote

import numpy as np  # not used by the code visible here; kept for other users
import pandas as pd
import requests

# Upper bound, in seconds, on how long the HTTP request may block. Without a
# timeout `requests` waits indefinitely on a stalled connection.
_REQUEST_TIMEOUT = 10

# Characters of the keyword that are sent unchanged. Everything else (most
# importantly '#', which would otherwise start a URL fragment and silently
# turn "c#" into "c") is percent-encoded. '%' stays untouched so a keyword
# that is already encoded (e.g. "c%23") is not encoded twice.
_KEYWORD_SAFE_CHARS = '/?=&+%'

# NOTE(review): both patterns are reproduced exactly as they appear in this
# copy of the file (the line breaks inside the original literals are written
# as \n). They look like they lost their HTML tag text at some point: as
# written they only match runs of blank lines, and the first one has no
# capture group. Restore the intended markup before relying on the output.
_REPO_PATH_RE = re.compile(r'\n\n\s*')
_SUMMARY_RE = re.compile(r'\n\n\s*(.*?)\s*\n\n')


def hot_github(keyword):
    """Download the trending page for *keyword* and write the hits to CSV.

    The page ``https://github.com/trending/<keyword>`` is fetched, every match
    of the repository pattern is turned into an absolute GitHub URL, every
    match of the summary pattern is taken as a project description, and both
    lists are written as two columns to ``./github_hot.csv`` (relative to the
    current working directory, without the index column).

    Args:
        keyword: Language segment of the trending URL, e.g. ``"python"``.

    Returns:
        None. The result is the CSV file written to disk.

    Raises:
        requests.HTTPError: If GitHub answers with a 4xx/5xx status.
        requests.RequestException: On connection problems or timeout.
    """
    url = 'https://github.com/trending/{0}'.format(
        quote(keyword, safe=_KEYWORD_SAFE_CHARS)
    )
    main_url = 'https://github.com{0}'

    response = requests.get(url, timeout=_REQUEST_TIMEOUT)
    # Fail loudly instead of scraping an error page into an empty CSV.
    response.raise_for_status()
    html = response.content.decode('utf-8')

    hot_url = [main_url.format(i) for i in _REPO_PATH_RE.findall(html)]
    summary_text = _SUMMARY_RE.findall(html)

    # Columns are assigned one after the other, as before.
    # NOTE(review): the two lists are paired purely by position; if the
    # patterns ever match a different number of times the rows will not line
    # up (or pandas will reject the second column) -- confirm once the
    # patterns are restored.
    hotDF = pd.DataFrame()
    hotDF['项目简介'] = summary_text
    hotDF['项目地址'] = hot_url
    hotDF.to_csv('./github_hot.csv', index=False)


if __name__ == '__main__':
    keyword = input('请输入查找的热门语言:')
    hot_github(keyword)