Files
RSSHub-python/rsshub/spiders/xinhuanet/world.py
icedragon a0c40774cf add xinhuanet (news.cn)
Signed-off-by: icedragon <flyingicedragon@qq.com>
2023-05-31 15:07:15 +08:00

20 lines
606 B
Python

from rsshub.spiders.xinhuanet.utils import parse_html as parse
from rsshub.utils import DEFAULT_HEADERS, fetch
# Full URL of the news.cn "world" index page (a complete page URL, despite
# the name); ctx() fetches it and also reports it as the feed's link.
domain = 'http://www.news.cn/world/index.html'
def ctx():
    """Build the feed context for the Xinhuanet (news.cn) world news page.

    Fetches the page at ``domain``, selects every ``<a>`` element located
    under the ``<div id="recommendDepth">`` container, and converts each
    one into a feed item with the xinhuanet ``parse_html`` helper.

    Returns:
        dict: feed context with the keys ``title``, ``link``,
        ``description``, ``author`` and ``items``; ``items`` is a list
        holding one ``parse`` result per matched anchor.
    """
    url = domain
    # NOTE: an earlier revision dumped the fetched page to a hard-coded
    # path inside the author's home directory for debugging. That made the
    # spider fail on any other machine, so the dump was removed.
    tree = fetch(url, headers=DEFAULT_HEADERS)
    anchors = tree.xpath("//div[@id='recommendDepth']//a")
    return {
        'title': '新华网 - 国际要闻',
        'link': url,
        'description': '新华网 - 国际要闻',
        'author': 'flyingicedragon',
        'items': [parse(anchor) for anchor in anchors],
    }