From c2b3a5ff66ad9e5120d4258219ce6af175ba023d Mon Sep 17 00:00:00 2001 From: doubaniux Date: Mon, 16 Nov 2020 13:36:31 +0100 Subject: [PATCH] fix summary scraping problem of douban movies --- common/scraper.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/common/scraper.py b/common/scraper.py index 973746c8..8931aa96 100644 --- a/common/scraper.py +++ b/common/scraper.py @@ -358,7 +358,7 @@ def scrape_douban_movie(url): brief_elem = content.xpath("//span[@class='all hidden']") if not brief_elem: brief_elem = content.xpath("//span[@property='v:summary']") - brief = brief_elem[0].xpath('./text()')[0].strip() if brief_elem else None + brief = '\n'.join([e.strip() for e in brief_elem[0].xpath('./text()')]) if brief_elem else None img_url_elem = content.xpath("//img[@rel='v:image']/@src") img_url = img_url_elem[0].strip() if img_url_elem else None