程序贼简单,运行就知道了
"""Interactive search-result scraper.

Prompts for a search keyword and a page count, fetches each result page,
and prints every result title followed by its link.
"""
import re
from urllib.parse import quote

# NOTE(review): this base URL has no scheme or host (it looks like the site
# address was removed from the published snippet).  `requests` rejects
# relative URLs, so prepend the real "https://host" before running.
web_url = '/search/'

# The site is queried with a mobile Safari User-Agent.
headers = {
    'User-Agent': (
        'Mozilla/5.0 (iPhone; CPU iPhone OS 9_1 like Mac OS X) '
        'AppleWebKit/601.1.46 (KHTML, like Gecko) '
        'Version/9.0 Mobile/13B143 Safari/601.1'
    ),
}

# Compiled once at import time.  Raw strings avoid the invalid "\/" escape
# that the original non-raw pattern relied on.
_LINK_RE = re.compile(r'<a href="(.*?)" target')
_NAME_RE = re.compile(r'rel="nofollow"> (.*?) </a>')

# Seconds to wait for the server before giving up on a page.
_REQUEST_TIMEOUT = 10


def parse_page(response):
    """Extract result links and titles from one page of HTML.

    Args:
        response: The HTML text of a search-result page.

    Returns:
        A ``(comment, namee)`` tuple of two lists of strings: the ``href``
        values of anchors that carry a ``target`` attribute, and the anchor
        texts that follow ``rel="nofollow">``.  Titles may still contain
        ``<em>`` markup.  The two lists are matched independently, so their
        lengths can differ.
    """
    comment = _LINK_RE.findall(response)
    namee = _NAME_RE.findall(response)
    return comment, namee


def build_url(keyword, page_no):
    """Return the search URL for *keyword* on 1-based page *page_no*.

    The keyword is percent-encoded in full (including ``/``) so that
    characters such as ``?``, ``#`` or spaces cannot alter the URL structure.
    """
    return web_url + quote(keyword, safe='') + '?page=' + str(page_no)


def fetch_page(url):
    """Download *url* and return the response body as text.

    Raises whatever ``requests`` raises on connection failure or timeout.
    """
    # Imported here so the parsing helpers stay importable (and testable)
    # on machines where the third-party `requests` package is missing.
    import requests

    return requests.get(
        url=url, headers=headers, timeout=_REQUEST_TIMEOUT
    ).text


def main():
    """Prompt for a keyword and page count, then print every result."""
    keyword = input('请输入搜索关键词:')
    page = input('请输入要检索的总页数:')

    # Convert once; a non-numeric answer raises ValueError as before.
    total_pages = int(page)

    for pagee in range(1, total_pages + 1):
        print('---------------第' + str(pagee) + '页---------------------')
        comment, namee = parse_page(fetch_page(build_url(keyword, pagee)))

        # zip() stops at the shorter list, so unmatched entries are dropped.
        for title, link in zip(namee, comment):
            print('\n')
            # Remove the <em> tags the site puts inside result titles.
            print(title.replace('<em>', '').replace('</em>', ''))
            print(link)


if __name__ == '__main__':
    main()
运行截图: