fixed google formatting changes

This commit is contained in:
lolcat 2024-06-29 19:02:33 -04:00
parent 6df9d17ada
commit 7a91eb7839
1 changed files with 97 additions and 79 deletions

View File

@ -703,6 +703,43 @@ class google{
} }
// reset // reset
$this->fuckhtml->load($result_div);
}else{
// get the "Did you mean?" prompt
$taw =
$this->fuckhtml
->getElementById(
"taw"
);
if($taw){
$this->fuckhtml->load($taw);
$as =
$this->fuckhtml
->getElementsByTagName(
"a"
);
if(count($as) !== 0){
$text =
$this->fuckhtml
->getTextContent(
$as[0]
);
// @TODO implement did_you_mean
$out["spelling"] = [
"type" => "including",
"using" => $search,
"correction" => $text
];
}
}
$this->fuckhtml->load($result_div); $this->fuckhtml->load($result_div);
} }
@ -895,36 +932,10 @@ class google{
// get "Related Searches" and "People also search for" // get "Related Searches" and "People also search for"
// //
$relateds = $relateds =
array_merge(
$this->fuckhtml
->getElementsByClassName(
$this->getstyle(
[
"align-items" => "center",
"background-color" => "#28292a",
"border-radius" => "100px",
"box-sizing" => "border-box",
"display" => "flex",
"max-height" => "none",
"min-height" => "48px",
"padding-left" => "17px",
"padding-right" => "17px",
"position" => "relative"
]
) . " " .
$this->getstyle(
[
"margin-left" => "8px",
"margin-right" => "8px"
]
),
"a"
),
$this->fuckhtml $this->fuckhtml
->getElementsByClassName( ->getElementsByClassName(
"wyccme", "wyccme",
"div" "div"
)
); );
foreach($relateds as $related){ foreach($relateds as $related){
@ -1354,7 +1365,7 @@ class google{
"font-size" => "12px", "font-size" => "12px",
"line-height" => "1.34", "line-height" => "1.34",
"display" => "inline-block", "display" => "inline-block",
"font-family" => "Google Sans,arial,sans-serif", "font-family" => "google sans,arial,sans-serif",
"padding-right" => "0", "padding-right" => "0",
"white-space" => "nowrap" "white-space" => "nowrap"
] ]
@ -1415,12 +1426,9 @@ class google{
->getElementsByClassName( ->getElementsByClassName(
$this->getstyle( $this->getstyle(
[ [
"border-radius" => "10px", "background-color" => "rgba(0,0,0,0.6)",
"font-family" => "arial,sans-serif-medium,sans-serif", "color" => "#fff",
"font-size" => "12px", "fill" => "#fff"
"line-height" => "16px",
"padding-block" => "2px",
"padding-inline" => "8px"
] ]
), ),
"div" "div"
@ -1433,14 +1441,6 @@ class google{
->getTextContent( ->getTextContent(
$duration[0] $duration[0]
); );
// remove duration from description
$description[0]["innerHTML"] =
str_replace(
$duration[0]["outerHTML"],
"",
$description[0]["innerHTML"]
);
} }
$web["description"] = $web["description"] =
@ -1979,7 +1979,7 @@ class google{
"font-size" => "12px", "font-size" => "12px",
"line-height" => "1.34", "line-height" => "1.34",
"display" => "inline-block", "display" => "inline-block",
"font-family" => "Google Sans,arial,sans-serif", "font-family" => "google sans,arial,sans-serif",
"padding-right" => "0", "padding-right" => "0",
"white-space" => "nowrap" "white-space" => "nowrap"
] ]
@ -2211,7 +2211,7 @@ class google{
->getElementsByClassName( ->getElementsByClassName(
$this->getstyle( $this->getstyle(
[ [
"font-family" => "Google Sans,arial,sans-serif", "font-family" => "google sans,arial,sans-serif",
"font-size" => "28px", "font-size" => "28px",
"line-height" => "36px" "line-height" => "36px"
] ]
@ -2801,7 +2801,22 @@ class google{
} }
} }
// get thumbnail // get heading element
$heading =
$this->fuckhtml
->getElementsByAttributeValue(
"role",
"heading",
"div"
);
if(count($heading) === 0){
// no heading, fuck this.
continue;
}
// get thumbnail before loading heading object
$image = $image =
$this->fuckhtml $this->fuckhtml
->getElementsByAttributeName( ->getElementsByAttributeName(
@ -2823,35 +2838,6 @@ class google{
]; ];
} }
// get title
$title =
$this->fuckhtml
->getElementsByClassName(
$this->getstyle(
[
"font-family" => "arial,sans-serif",
"font-size" => "16px",
"font-weight" => "400",
"line-height" => "24px"
]
),
"div"
);
if(count($title) === 0){
// ?? no title
continue;
}
$title =
$this->titledots(
$this->fuckhtml
->getTextContent(
$title[0]
)
);
// get duration // get duration
$duration_div = $duration_div =
$this->fuckhtml $this->fuckhtml
@ -2908,6 +2894,38 @@ class google{
} }
} }
// load heading
$this->fuckhtml->load($heading[0]);
// get title
$title =
$this->fuckhtml
->getElementsByClassName(
$this->getstyle(
[
"font-family" => "arial,sans-serif",
"font-size" => "16px",
"font-weight" => "400",
"line-height" => "24px"
]
),
"div"
);
if(count($title) === 0){
// ?? no title
continue;
}
$title =
$this->titledots(
$this->fuckhtml
->getTextContent(
$title[0]
)
);
// get date // get date
$date_div = $date_div =
$this->fuckhtml $this->fuckhtml
@ -3940,7 +3958,7 @@ class google{
for($k=0; $k<count($values_regex[1]); $k++){ for($k=0; $k<count($values_regex[1]); $k++){
$values[trim($values_regex[1][$k])] = $values[trim($values_regex[1][$k])] =
trim($values_regex[2][$k]); strtolower(trim($values_regex[2][$k]));
} }
$names = explode(",", $matches[1][$i]); $names = explode(",", $matches[1][$i]);
@ -3971,7 +3989,7 @@ class google{
foreach($this->styles[":root"] as $key => $value){ foreach($this->styles[":root"] as $key => $value){
$this->css_colors[$value] = $key; $this->css_colors[$value] = strtolower($key);
} }
} }
} }