# 抓取36氪快讯
# https://36kr.com/newsflashes
import requests
import json
# Fetch the latest 36Kr newsflashes from the site's JSON API and print a
# trimmed-down record (title, content, published time) for each one.

# Browser-like request headers sent with the API call.
header = {
    'Accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,*/*;q=0.8',
    'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36(KHTML, like Gecko) Chrome/58.0.3029.110 Safari/537.36',
}
url = 'https://36kr.com/api/newsflash?&per_page=20'

response = requests.get(url, headers=header, timeout=5)
# Fail loudly on 4xx/5xx instead of trying to parse an error page as JSON.
response.raise_for_status()

# response.json() decodes the body as JSON directly, so the result does not
# depend on the text encoding guessed for response.text.
data = response.json()['data']
items = data['items']

for item in items:
    # Keep only the fields of interest, renaming them to the output keys.
    item_info = {
        'title': item['title'],
        'content': item['description'],
        'published_time': item['published_at'],
    }
    print(item_info)
# 版权声明:本文内容由互联网用户自发贡献,该文观点与技术仅代表作者本人。本站仅提供信息存储空间服务,不拥有所有权,不承担相关法律责任。如发现本站有涉嫌侵权/违法违规的内容,请发送邮件至 [email protected] 举报,一经查实,本站将立刻删除。