From b9bb677cd04bdc54cf15ba49534f7af81f3be5a8 Mon Sep 17 00:00:00 2001 From: Zhihai Liao Date: Sat, 1 Jul 2023 22:56:58 +0000 Subject: [PATCH] fall back to xinhuanet world --- rsshub/spiders/xinhuanet/utils.py | 9 ++++----- 1 file changed, 4 insertions(+), 5 deletions(-) diff --git a/rsshub/spiders/xinhuanet/utils.py b/rsshub/spiders/xinhuanet/utils.py index b0a6446..e5f83a6 100644 --- a/rsshub/spiders/xinhuanet/utils.py +++ b/rsshub/spiders/xinhuanet/utils.py @@ -1,4 +1,3 @@ -from time import sleep from rsshub.utils import DEFAULT_HEADERS, fetch @@ -6,10 +5,10 @@ def parse_html(post): item = {} item['title'] = post.xpath('text()').extract_first() item['link'] = post.xpath('@href').extract_first() - html = fetch(item['link'], headers=DEFAULT_HEADERS) + print(item['link']) item['description'] = ( - html - .xpath('//div[@id="detail"]') + fetch(item['link'], headers=DEFAULT_HEADERS) + .xpath('//div[@id=\'detail\']') .get() ) - return item \ No newline at end of file + return item