mirror of
https://github.com/d0zingcat/RSSHub-python.git
synced 2026-05-22 07:26:48 +00:00
chuansongme full text crawl
This commit is contained in:
@@ -6,7 +6,12 @@ domain = 'https://chuansongme.com'
|
|||||||
def parse(post):
    """Build a feed item dict from one listing entry.

    The entry's ``a.question_link`` anchor supplies the title (last text
    node, stripped) and the link (its ``href`` appended to the module-level
    ``domain``). The linked page is then fetched so the full article text
    can be used as the description.

    Args:
        post: Selector-like object exposing ``.css(...)`` with
            ``.extract()`` / ``.extract_first()`` (presumably a
            parsel/scrapy selector -- confirm against the caller).

    Returns:
        dict: Always contains ``'title'`` and ``'link'``. ``'description'``
        is present only when the article page could be fetched and queried.

    Raises:
        IndexError: If the entry has no ``a.question_link`` text node.
    """
    item = {}
    item['title'] = post.css('a.question_link::text').extract()[-1].strip()

    link = f"{domain}{post.css('a.question_link::attr(href)').extract_first()}"
    item['link'] = link

    # Full-text crawl is best effort: an AttributeError here (presumably
    # because ``fetch`` returned an object without ``.css`` -- e.g. ``None``
    # on a failed request; verify against ``fetch``) must not drop the item,
    # so it is returned without a description instead.
    try:
        paragraphs = fetch(link).css('p span::text').extract()
    except AttributeError:
        return item

    item['description'] = '\n'.join(paragraphs)
    return item
|
||||||
|
|
||||||
|
|
||||||
|
|||||||
Reference in New Issue
Block a user