From b492ef2329ef918b0b40f3090b4bdc3681e3fd09 Mon Sep 17 00:00:00 2001
From: lolcat
Date: Thu, 30 May 2024 19:13:47 -0400
Subject: qwant gibberish check fix

---
 scraper/qwant.php | 24 ++++++++++++------------
 1 file changed, 12 insertions(+), 12 deletions(-)

(limited to 'scraper')

diff --git a/scraper/qwant.php b/scraper/qwant.php
index f914e15..48ecd85 100644
--- a/scraper/qwant.php
+++ b/scraper/qwant.php
@@ -360,7 +360,17 @@ class qwant{
 				return $out;
 			}
 
-			throw new Exception("Server returned an error code: " . $json["data"]["error_code"]);
+			if(isset($json["data"]["error_code"])){
+
+				switch($json["data"]["error_code"]){
+
+					case 27:
+						throw new Exception("Qwant returned a captcha");
+						break;
+				}
+			}
+
+			throw new Exception("Qwant returned an error code: " . $json["data"]["error_code"]);
 		}
 
 		if(!isset($json["data"]["result"]["items"]["mainline"])){
@@ -488,17 +498,7 @@ class qwant{
 				// detect gibberish results
 				if(
 					$first_iteration &&
-					preg_match(
-						"/^" .
-						preg_quote(
-							$this->trimdots(
-								$result["source"]
-							),
-							"/"
-						) .
-						"/",
-						$result["url"]
-					) !== 1
+					!isset($result["urlPingSuffix"])
 				){
 
 					throw new Exception("Qwant returned gibberish results");
--
cgit v1.2.3