From 03fe53cec977f5dfe13f72e0b235a08d19b0ab7e Mon Sep 17 00:00:00 2001
From: Your Name <you@example.com>
Date: Fri, 22 Jul 2022 21:30:37 -0400
Subject: [PATCH] support more google book urls

---
 common/scrapers/google.py | 10 ++++++++--
 1 file changed, 8 insertions(+), 2 deletions(-)

diff --git a/common/scrapers/google.py b/common/scrapers/google.py
index 18b0a2c3..0082fb3e 100644
--- a/common/scrapers/google.py
+++ b/common/scrapers/google.py
@@ -28,10 +28,16 @@ class GoogleBooksScraper(AbstractScraper):
 
     @classmethod
     def get_effective_url(cls, raw_url):
-        u = re.match(r"https://books\.google\.com/books\?id=[^&#]+", raw_url)
-        return u[0] if u else None
+        # https://books.google.com/books?id=wUHxzgEACAAJ
+        # https://books.google.com/books/about/%E7%8F%BE%E5%A0%B4%E6%AD%B7%E5%8F%B2.html?id=nvNoAAAAIAAJ
+        # https://www.google.com/books/edition/_/nvNoAAAAIAAJ?hl=en&gbpv=1
+        u = re.match(r"https://books\.google\.com/books.*id=([^&#]+)", raw_url)
+        if not u:
+            u = re.match(r"https://www\.google\.com/books/edition/[^/]+/([^&#?]+)", raw_url)
+        return 'https://books.google.com/books?id=' + u[1] if u else None
 
     def scrape(self, url, response=None):
+        url = self.get_effective_url(url)
         m = self.regex.match(url)
         if m:
             api_url = f'https://www.googleapis.com/books/v1/volumes/{m[1]}'