From 46e6ed12e34b2d905ffb46526798406c7d50f100 Mon Sep 17 00:00:00 2001 From: lolcat Date: Tue, 21 Oct 2025 00:35:20 -0400 Subject: [PATCH] fix invalid sublinks on google scraper --- scraper/google.php | 42 ++++++++++++++++++++++++++---------------- 1 file changed, 26 insertions(+), 16 deletions(-) diff --git a/scraper/google.php b/scraper/google.php index 148b1b5..03fa718 100644 --- a/scraper/google.php +++ b/scraper/google.php @@ -953,23 +953,33 @@ class google{ ]) ); - if(count($probe) !== 0){ + $url = + $this->unshiturl( + $a["attributes"]["href"] + ); + + if( + preg_match( + '/^http/', + $url + ) + ){ - $sublinks[] = [ - "title" => - $this->titledots( - $this->fuckhtml - ->getTextContent( - $probe[0] - ) - ), - "description" => null, - "date" => null, - "url" => - $this->unshiturl( - $a["attributes"]["href"] - ) - ]; + if(count($probe) !== 0){ + + $sublinks[] = [ + "title" => + $this->titledots( + $this->fuckhtml + ->getTextContent( + $probe[0] + ) + ), + "description" => null, + "date" => null, + "url" => $url + ]; + } } }