diff --git a/rsshub/spiders/xinhuanet/utils.py b/rsshub/spiders/xinhuanet/utils.py index b0a6446..e5f83a6 100644 --- a/rsshub/spiders/xinhuanet/utils.py +++ b/rsshub/spiders/xinhuanet/utils.py @@ -1,4 +1,3 @@ -from time import sleep from rsshub.utils import DEFAULT_HEADERS, fetch @@ -6,10 +5,10 @@ def parse_html(post): item = {} item['title'] = post.xpath('text()').extract_first() item['link'] = post.xpath('@href').extract_first() - html = fetch(item['link'], headers=DEFAULT_HEADERS) + print(item['link']) item['description'] = ( - html - .xpath('//div[@id="detail"]') + fetch(item['link'], headers=DEFAULT_HEADERS) + .xpath('//div[@id=\'detail\']') .get() ) - return item \ No newline at end of file + return item