From 850d1915b2cb510d1041f44019755efc2ba47256 Mon Sep 17 00:00:00 2001 From: doubaniux Date: Sun, 11 Oct 2020 20:30:29 +0200 Subject: [PATCH] fix movie summary scrape bug --- common/scraper.py | 6 ++++-- 1 file changed, 4 insertions(+), 2 deletions(-) diff --git a/common/scraper.py b/common/scraper.py index a3c72236..0326ccbe 100644 --- a/common/scraper.py +++ b/common/scraper.py @@ -354,8 +354,10 @@ def scrape_douban_movie(url): # if has field `episodes` not none then must be series is_series = True if episodes else False - brief_elem = content.xpath("//span[@property='v:summary']/text()") - brief = brief_elem[0].strip() if brief_elem else None + brief_elem = content.xpath("//span[@class='all hidden']") + if not brief_elem: + brief_elem = content.xpath("//span[@property='v:summary']") + brief = brief_elem[0].xpath('./text()')[0].strip() if brief_elem else None img_url_elem = content.xpath("//img[@rel='v:image']/@src") img_url = img_url_elem[0].strip() if img_url_elem else None