542 lines
		
	
	
		
			11 KiB
		
	
	
	
		
			PHP
		
	
	
	
	
	
			
		
		
	
	
			542 lines
		
	
	
		
			11 KiB
		
	
	
	
		
			PHP
		
	
	
	
	
	
| <?php
 | ||
| 
 | ||
| class sepiasearch{
 | ||
| 	
 | ||
| 	public function __construct(){
 | ||
| 		
 | ||
| 		include "lib/backend.php";
 | ||
| 		$this->backend = new backend("sepiasearch");
 | ||
| 	}
 | ||
| 	
 | ||
| 	public function getfilters($page){
 | ||
| 		
 | ||
| 		return [
 | ||
| 			"nsfw" => [
 | ||
| 				"display" => "NSFW",
 | ||
| 				"option" => [
 | ||
| 					"yes" => "Yes", // &sensitiveContent=both
 | ||
| 					"no" => "No" // &sensitiveContent=false
 | ||
| 				]
 | ||
| 			],
 | ||
| 			"language" => [
 | ||
| 				"display" => "Language", // &language=
 | ||
| 				"option" => [
 | ||
| 					"any" => "Any language",
 | ||
| 					"en" => "English",
 | ||
| 					"fr" => "Français",
 | ||
| 					"ar" => "العربية",
 | ||
| 					"ca" => "Català",
 | ||
| 					"cs" => "Čeština",
 | ||
| 					"de" => "Deutsch",
 | ||
| 					"el" => "ελληνικά",
 | ||
| 					"eo" => "Esperanto",
 | ||
| 					"es" => "Español",
 | ||
| 					"eu" => "Euskara",
 | ||
| 					"fa" => "فارسی",
 | ||
| 					"fi" => "Suomi",
 | ||
| 					"gd" => "Gàidhlig",
 | ||
| 					"gl" => "Galego",
 | ||
| 					"hr" => "Hrvatski",
 | ||
| 					"hu" => "Magyar",
 | ||
| 					"is" => "Íslenska",
 | ||
| 					"it" => "Italiano",
 | ||
| 					"ja" => "日本語",
 | ||
| 					"kab" => "Taqbaylit",
 | ||
| 					"nl" => "Nederlands",
 | ||
| 					"no" => "Norsk",
 | ||
| 					"oc" => "Occitan",
 | ||
| 					"pl" => "Polski",
 | ||
| 					"pt" => "Português (Brasil)",
 | ||
| 					"pt-PT" => "Português (Portugal)",
 | ||
| 					"ru" => "Pусский",
 | ||
| 					"sk" => "Slovenčina",
 | ||
| 					"sq" => "Shqip",
 | ||
| 					"sv" => "Svenska",
 | ||
| 					"th" => "ไทย",
 | ||
| 					"tok" => "Toki Pona",
 | ||
| 					"tr" => "Türkçe",
 | ||
| 					"uk" => "украї́нська мо́ва",
 | ||
| 					"vi" => "Tiếng Việt",
 | ||
| 					"zh-Hans" => "简体中文(中国)",
 | ||
| 					"zh-Hant" => "繁體中文(台灣)"
 | ||
| 				]
 | ||
| 			],
 | ||
| 			"type" => [
 | ||
| 				"display" => "Result type", // i handle this
 | ||
| 				"option" => [
 | ||
| 					"videos" => "Videos",
 | ||
| 					"playlists" => "Playlists",
 | ||
| 					"channels" => "Channels"
 | ||
| 				]
 | ||
| 			],
 | ||
| 			"sort" => [
 | ||
| 				"display" => "Sort by",
 | ||
| 				"option" => [
 | ||
| 					"best" => "Best match", // no filter
 | ||
| 					"-publishedAt" => "Newest", // sort=-publishedAt
 | ||
| 					"publishedAt" => "Oldest" // sort=publishedAt
 | ||
| 				]
 | ||
| 			],
 | ||
| 			"newer" => [ // &startDate=2025-07-26T04:00:00.000Z
 | ||
| 				"display" => "Newer than",
 | ||
| 				"option" => "_DATE"
 | ||
| 			],
 | ||
| 			"duration" => [
 | ||
| 				"display" => "Duration",
 | ||
| 				"option" => [
 | ||
| 					"any" => "Any duration",
 | ||
| 					"short" => "Short (0-4mins)", // &durationRange=short
 | ||
| 					"medium" => "Medium (4-10 mins)",
 | ||
| 					"long" => "Long (10+ mins)",
 | ||
| 				]
 | ||
| 			],
 | ||
| 			"category" => [
 | ||
| 				"display" => "Category", // &categoryOneOf[]=
 | ||
| 				"option" => [
 | ||
| 					"any" => "Any category",
 | ||
| 					"1" => "Music",
 | ||
| 					"2" => "Films",
 | ||
| 					"3" => "Vehicles",
 | ||
| 					"4" => "Art",
 | ||
| 					"5" => "Sports",
 | ||
| 					"6" => "Travels",
 | ||
| 					"7" => "Gaming",
 | ||
| 					"8" => "People",
 | ||
| 					"9" => "Comedy",
 | ||
| 					"10" => "Entertainment",
 | ||
| 					"11" => "News & Politics",
 | ||
| 					"12" => "How To",
 | ||
| 					"13" => "Education",
 | ||
| 					"14" => "Activism",
 | ||
| 					"15" => "Science & Technology",
 | ||
| 					"16" => "Animals",
 | ||
| 					"17" => "Kids",
 | ||
| 					"18" => "Food"
 | ||
| 				]
 | ||
| 			],
 | ||
| 			"display" => [
 | ||
| 				"display" => "Display",
 | ||
| 				"option" => [
 | ||
| 					"any" => "Everything",
 | ||
| 					"true" => "Live videos", // &isLive=true
 | ||
| 					"false" => "VODs" // &isLive=false
 | ||
| 				]
 | ||
| 			],
 | ||
| 			"license" => [
 | ||
| 				"display" => "License", // &license=
 | ||
| 				"option" => [
 | ||
| 					"any" => "Any license",
 | ||
| 					"1" => "Attribution",
 | ||
| 					"2" => "Attribution - Share Alike",
 | ||
| 					"3" => "Attribution - No Derivatives",
 | ||
| 					"4" => "Attribution - Non Commercial",
 | ||
| 					"5" => "Attribution - Non Commercial - Share Alike",
 | ||
| 					"6" => "Attribution - Non Commercial - No Derivatives",
 | ||
| 					"7" => "Public Domain Dedication"
 | ||
| 				]
 | ||
| 			]
 | ||
| 		];
 | ||
| 	}
 | ||
| 	
 | ||
| 	private function get($proxy, $url, $get = []){
 | ||
| 		
 | ||
| 		$curlproc = curl_init();
 | ||
| 		
 | ||
| 		if($get !== []){
 | ||
| 			$get = http_build_query($get);
 | ||
| 			$url .= "?" . $get;
 | ||
| 		}
 | ||
| 		
 | ||
| 		curl_setopt($curlproc, CURLOPT_URL, $url);
 | ||
| 		curl_setopt($curlproc, CURLOPT_ENCODING, ""); // default encoding
 | ||
| 		
 | ||
| 		curl_setopt(
 | ||
| 			$curlproc,
 | ||
| 			CURLOPT_HTTPHEADER,
 | ||
| 			["User-Agent: " . config::USER_AGENT,
 | ||
| 			"Accept: application/json, text/plain, */*",
 | ||
| 			"Accept-Language: en-US,en;q=0.5",
 | ||
| 			"Accept-Encoding: gzip, deflate, br, zstd",
 | ||
| 			"DNT: 1",
 | ||
| 			"Sec-GPC: 1",
 | ||
| 			"Connection: keep-alive",
 | ||
| 			"Referer: https://sepiasearch.org/search",
 | ||
| 			"Sec-Fetch-Dest: empty",
 | ||
| 			"Sec-Fetch-Mode: cors",
 | ||
| 			"Sec-Fetch-Site: same-origin",
 | ||
| 			"Priority: u=0",
 | ||
| 			"TE: trailers"]
 | ||
| 		);
 | ||
| 		
 | ||
| 		curl_setopt($curlproc, CURLOPT_RETURNTRANSFER, true);
 | ||
| 		curl_setopt($curlproc, CURLOPT_SSL_VERIFYHOST, 2);
 | ||
| 		curl_setopt($curlproc, CURLOPT_SSL_VERIFYPEER, true);
 | ||
| 		curl_setopt($curlproc, CURLOPT_CONNECTTIMEOUT, 30);
 | ||
| 		curl_setopt($curlproc, CURLOPT_TIMEOUT, 30);
 | ||
| 
 | ||
| 		$this->backend->assign_proxy($curlproc, $proxy);
 | ||
| 		
 | ||
| 		$data = curl_exec($curlproc);
 | ||
| 		
 | ||
| 		if(curl_errno($curlproc)){
 | ||
| 			
 | ||
| 			throw new Exception(curl_error($curlproc));
 | ||
| 		}
 | ||
| 		
 | ||
| 		curl_close($curlproc);
 | ||
| 		return $data;
 | ||
| 	}
 | ||
| 	
 | ||
| 	public function video($get){
 | ||
| 		
 | ||
| 		if($get["npt"]){
 | ||
| 			
 | ||
| 			[$npt, $proxy] =
 | ||
| 				$this->backend
 | ||
| 				->get(
 | ||
| 					$get["npt"],
 | ||
| 					"videos"
 | ||
| 				);
 | ||
| 			
 | ||
| 			$npt = json_decode($npt, true);
 | ||
| 			$type = $npt["type"];
 | ||
| 			$npt = $npt["npt"];
 | ||
| 		}else{
 | ||
| 			
 | ||
| 			$proxy = $this->backend->get_ip();
 | ||
| 						
 | ||
| 			$npt = [
 | ||
| 				"search" => $get["s"],
 | ||
| 				"start" => 0,
 | ||
| 				"count" => 20
 | ||
| 			];
 | ||
| 			
 | ||
| 			if($get["type"] == "videos"){
 | ||
| 				
 | ||
| 				//
 | ||
| 				// Parse video filters
 | ||
| 				//
 | ||
| 				switch($get["nsfw"]){
 | ||
| 					
 | ||
| 					case "yes": $npt["nsfw"] = "both"; break;
 | ||
| 					case "no": $npt["nsfw"] = "false"; break;
 | ||
| 				}
 | ||
| 				
 | ||
| 				$npt["boostLanguages[]"] = "en";
 | ||
| 				if($get["language"] != "any"){
 | ||
| 					
 | ||
| 					$npt["languageOneOf[]"] = $get["language"];
 | ||
| 				}
 | ||
| 				
 | ||
| 				if($get["sort"] != "best"){
 | ||
| 					
 | ||
| 					$npt["sort"] = $get["sort"];
 | ||
| 				}
 | ||
| 				
 | ||
| 				if($get["newer"] !== false){
 | ||
| 					
 | ||
| 					$date = new DateTime("@{$get["newer"]}");
 | ||
| 					$date->setTimezone(new DateTimeZone("UTC"));
 | ||
| 					$formatted = $date->format("Y-m-d\TH:i:s.000\Z");
 | ||
| 					
 | ||
| 					$npt["startDate"] = $formatted;
 | ||
| 				}
 | ||
| 				
 | ||
| 				switch($get["duration"]){
 | ||
| 					
 | ||
| 					case "short":
 | ||
| 						$npt["durationMax"] = 240;
 | ||
| 						break;
 | ||
| 					
 | ||
| 					case "medium":
 | ||
| 						$npt["durationMin"] = 240;
 | ||
| 						$npt["durationMax"] = 600;
 | ||
| 						break;
 | ||
| 					
 | ||
| 					case "long":
 | ||
| 						$npt["durationMin"] = 600;
 | ||
| 						break;
 | ||
| 				}
 | ||
| 				
 | ||
| 				if($get["category"] != "any"){
 | ||
| 					
 | ||
| 					$npt["categoryOneOf[]"] = $get["category"];
 | ||
| 				}
 | ||
| 				
 | ||
| 				if($get["display"] != "any"){
 | ||
| 					
 | ||
| 					$npt["isLive"] = $get["display"];
 | ||
| 				}
 | ||
| 				
 | ||
| 				if($get["license"] != "any"){
 | ||
| 					
 | ||
| 					// typo in license, lol
 | ||
| 					$npt["licenceOneOf[]"] = $get["license"];
 | ||
| 				}
 | ||
| 			}
 | ||
| 			
 | ||
| 			$type = $get["type"];
 | ||
| 		}
 | ||
| 		
 | ||
| 		switch($type){
 | ||
| 			
 | ||
| 			case "videos":
 | ||
| 				$url = "https://sepiasearch.org/api/v1/search/videos";
 | ||
| 				break;
 | ||
| 			
 | ||
| 			case "channels":
 | ||
| 				$url = "https://sepiasearch.org/api/v1/search/video-channels";
 | ||
| 				break;
 | ||
| 			
 | ||
| 			case "playlists":
 | ||
| 				$url = "https://sepiasearch.org/api/v1/search/video-playlists";
 | ||
| 				break;
 | ||
| 		}
 | ||
| 		
 | ||
| 		//$json = file_get_contents("scraper/sepia.json");
 | ||
| 		try{
 | ||
| 			
 | ||
| 			$json =
 | ||
| 				$this->get(
 | ||
| 					$proxy,
 | ||
| 					$url,
 | ||
| 					$npt
 | ||
| 				);
 | ||
| 		}catch(Exception $error){
 | ||
| 			
 | ||
| 			throw new Exception("Failed to fetch JSON");
 | ||
| 		}
 | ||
| 		
 | ||
| 		$json = json_decode($json, true);
 | ||
| 		
 | ||
| 		if($json === null){
 | ||
| 			
 | ||
| 			throw new Exception("Failed to parse JSON");
 | ||
| 		}
 | ||
| 		
 | ||
| 		if(isset($json["errors"])){
 | ||
| 			
 | ||
| 			$msg = [];
 | ||
| 			foreach($json["errors"] as $error){
 | ||
| 				
 | ||
| 				if(isset($error["msg"])){
 | ||
| 					
 | ||
| 					$msg[] = $error["msg"];
 | ||
| 				}
 | ||
| 			}
 | ||
| 			
 | ||
| 			throw new Exception("Sepia Search returned error(s): " . implode(", ", $msg));
 | ||
| 		}
 | ||
| 		
 | ||
| 		if(!isset($json["data"])){
 | ||
| 			
 | ||
| 			throw new Exception("Sepia Search did not return a data object");
 | ||
| 		}
 | ||
| 		
 | ||
| 		$out = [
 | ||
| 			"status" => "ok",
 | ||
| 			"npt" => null,
 | ||
| 			"video" => [],
 | ||
| 			"author" => [],
 | ||
| 			"livestream" => [],
 | ||
| 			"playlist" => [],
 | ||
| 			"reel" => []
 | ||
| 		];
 | ||
| 		
 | ||
| 		
 | ||
| 		switch($get["type"]){
 | ||
| 			
 | ||
| 			case "videos":
 | ||
| 				foreach($json["data"] as $video){
 | ||
| 					
 | ||
| 					if(count($video["account"]["avatars"]) !== 0){
 | ||
| 						
 | ||
| 						$avatar =
 | ||
| 							$video["account"]["avatars"][count($video["account"]["avatars"]) - 1]["url"];
 | ||
| 					}else{
 | ||
| 						
 | ||
| 						$avatar = null;
 | ||
| 					}
 | ||
| 					
 | ||
| 					if($video["thumbnailUrl"] === null){
 | ||
| 						
 | ||
| 						$thumb = [
 | ||
| 							"ratio" => null,
 | ||
| 							"url" => null
 | ||
| 						];
 | ||
| 					}else{
 | ||
| 						
 | ||
| 						$thumb  = [
 | ||
| 							"ratio" => "16:9",
 | ||
| 							"url" => $video["thumbnailUrl"]
 | ||
| 						];
 | ||
| 					}
 | ||
| 					
 | ||
| 					if($video["isLive"]){
 | ||
| 						
 | ||
| 						$append = "livestream";
 | ||
| 					}else{
 | ||
| 						
 | ||
| 						$append = "video";
 | ||
| 					}
 | ||
| 					
 | ||
| 					$out[$append][] = [
 | ||
| 						"title" => $video["name"],
 | ||
| 						"description" =>
 | ||
| 							$this->limitstrlen(
 | ||
| 								$this->titledots(
 | ||
| 									$video["description"]
 | ||
| 								)
 | ||
| 							),
 | ||
| 						"author" => [
 | ||
| 							"name" => $video["account"]["displayName"] . " ({$video["account"]["name"]})",
 | ||
| 							"url" => $video["account"]["url"],
 | ||
| 							"avatar" => $avatar
 | ||
| 						],
 | ||
| 						"date" => strtotime($video["publishedAt"]),
 | ||
| 						"duration" => $video["isLive"] ? "_LIVE" : $video["duration"],
 | ||
| 						"views" => $video["views"],
 | ||
| 						"thumb" => $thumb,
 | ||
| 						"url" => $video["url"]
 | ||
| 					];
 | ||
| 				}
 | ||
| 				break;
 | ||
| 			
 | ||
| 			case "playlists":
 | ||
| 				foreach($json["data"] as $playlist){
 | ||
| 					
 | ||
| 					if(count($playlist["ownerAccount"]["avatars"]) !== 0){
 | ||
| 						
 | ||
| 						$avatar =
 | ||
| 							$playlist["ownerAccount"]["avatars"][count($playlist["ownerAccount"]["avatars"]) - 1]["url"];
 | ||
| 					}else{
 | ||
| 						
 | ||
| 						$avatar = null;
 | ||
| 					}
 | ||
| 					
 | ||
| 					if($playlist["thumbnailUrl"] === null){
 | ||
| 						
 | ||
| 						$thumb = [
 | ||
| 							"ratio" => null,
 | ||
| 							"url" => null
 | ||
| 						];
 | ||
| 					}else{
 | ||
| 						
 | ||
| 						$thumb  = [
 | ||
| 							"ratio" => "16:9",
 | ||
| 							"url" => $playlist["thumbnailUrl"]
 | ||
| 						];
 | ||
| 					}
 | ||
| 					
 | ||
| 					$out["playlist"][] = [
 | ||
| 						"title" => $playlist["displayName"],
 | ||
| 						"description" =>
 | ||
| 							$this->limitstrlen(
 | ||
| 								$this->titledots(
 | ||
| 									$playlist["description"]
 | ||
| 								)
 | ||
| 							),
 | ||
| 						"author" => [
 | ||
| 							"name" => $playlist["ownerAccount"]["displayName"] . " ({$playlist["ownerAccount"]["name"]})",
 | ||
| 							"url" => $playlist["ownerAccount"]["url"],
 | ||
| 							"avatar" => $avatar
 | ||
| 						],
 | ||
| 						"date" => strtotime($playlist["createdAt"]),
 | ||
| 						"duration" => $playlist["videosLength"],
 | ||
| 						"views" => null,
 | ||
| 						"thumb" => $thumb,
 | ||
| 						"url" => $playlist["url"]
 | ||
| 					];
 | ||
| 				}
 | ||
| 				break;
 | ||
| 			
 | ||
| 			case "channels":
 | ||
| 				foreach($json["data"] as $channel){
 | ||
| 					
 | ||
| 					if(count($channel["avatars"]) !== 0){
 | ||
| 						
 | ||
| 						$thumb = [
 | ||
| 							"ratio" => "1:1",
 | ||
| 							"url" => $channel["avatars"][count($channel["avatars"]) - 1]["url"]
 | ||
| 						];
 | ||
| 					}else{
 | ||
| 						
 | ||
| 						$thumb = [
 | ||
| 							"ratio" => null,
 | ||
| 							"url" => null
 | ||
| 						];
 | ||
| 					}
 | ||
| 					
 | ||
| 					$out["author"][] = [
 | ||
| 						"title" => $channel["displayName"] . " ({$channel["name"]})",
 | ||
| 						"followers" => $channel["followersCount"],
 | ||
| 						"description" =>
 | ||
| 							$channel["videosCount"] . " videos. " .
 | ||
| 							$this->limitstrlen(
 | ||
| 								$this->titledots(
 | ||
| 									$channel["description"]
 | ||
| 								)
 | ||
| 							),
 | ||
| 						"thumb" => $thumb,
 | ||
| 						"url" => $channel["url"]
 | ||
| 					];
 | ||
| 				}
 | ||
| 				break;
 | ||
| 		}
 | ||
| 		
 | ||
| 		// get next page
 | ||
| 		if($json["total"] - 20 > $npt["start"]){
 | ||
| 			
 | ||
| 			$npt["start"] += 20;
 | ||
| 			
 | ||
| 			$npt = [
 | ||
| 				"type" => $get["type"],
 | ||
| 				"npt" => $npt
 | ||
| 			];
 | ||
| 			
 | ||
| 			$out["npt"] =
 | ||
| 				$this->backend
 | ||
| 				->store(
 | ||
| 					json_encode($npt),
 | ||
| 					"videos",
 | ||
| 					$proxy
 | ||
| 				);
 | ||
| 		}
 | ||
| 		
 | ||
| 		return $out;
 | ||
| 	}
 | ||
| 	
 | ||
| 	private function titledots($title){
 | ||
| 		
 | ||
| 		$substr = substr($title, -3);
 | ||
| 		
 | ||
| 		if(
 | ||
| 			$substr == "..." ||
 | ||
| 			$substr == "…"
 | ||
| 		){
 | ||
| 			
 | ||
| 			return trim(substr($title, 0, -3), " \n\r\t\v\x00\0\x0B\xc2\xa0");
 | ||
| 		}
 | ||
| 		
 | ||
| 		return trim($title, " \n\r\t\v\x00\0\x0B\xc2\xa0");
 | ||
| 	}
 | ||
| 	
 | ||
| 	private function limitstrlen($text){
 | ||
| 		
 | ||
| 		return
 | ||
| 			explode(
 | ||
| 				"\n",
 | ||
| 				wordwrap(
 | ||
| 					str_replace(
 | ||
| 						["\n\r", "\r\n", "\n", "\r"],
 | ||
| 						" ",
 | ||
| 						$text
 | ||
| 					),
 | ||
| 					300,
 | ||
| 					"\n"
 | ||
| 				),
 | ||
| 				2
 | ||
| 			)[0];
 | ||
| 	}
 | ||
| }
 |