forked from lolcat/4get
		
	Compare commits
	
		
			116 Commits
		
	
	
		
			91a792d169
			...
			master
		
	
	| Author | SHA1 | Date | |
|---|---|---|---|
| 46e6ed12e3 | |||
| ce75cbda81 | |||
| 560b9b04da | |||
| 56ea4811d7 | |||
| 036a097d4d | |||
| a4a44709b4 | |||
| 4b16fd5897 | |||
| 61deefb75b | |||
| 8198287ec0 | |||
| bf6319839e | |||
| fa4aa9a0fd | |||
| c69abf41b0 | |||
| 1b6182bc3c | |||
| 1cfeabeb7f | |||
| 73f8472eec | |||
| 0c90c4bc9e | |||
| cfcc4ec8d1 | |||
| 6d34d43a01 | |||
| c44d6292a0 | |||
| 0b350d4d6e | |||
| de328fff1b | |||
| 8613c1e0f4 | |||
| d4aaebcd80 | |||
| a2e056b47b | |||
| 8a0a8359a8 | |||
| dcf5901809 | |||
| aa9806300a | |||
| 91ce5c1563 | |||
| cdf958d293 | |||
| 2d63475b07 | |||
| ae31274db9 | |||
| 20ef5b3e3a | |||
| 7c970031d0 | |||
| 2c2bd28a9f | |||
| dea8b0a362 | |||
| da1ea1d6e8 | |||
| 2ca8fb0006 | |||
| 362cf61508 | |||
| 1828c63233 | |||
| 4215f2678d | |||
| acd02d83d4 | |||
| 319640cd77 | |||
| ad535a1609 | |||
| 7ac53c6e11 | |||
| f33f02e816 | |||
| 27b8509ac0 | |||
| 1e52982cb9 | |||
| 3f2bfcb8c7 | |||
| d3ef1a67c0 | |||
| 9afef55d89 | |||
| 706b490bf3 | |||
| 74f7c920f6 | |||
| 3dbcf60a3e | |||
| f30872134f | |||
| 2c4dc7da84 | |||
| 5a0f5b868a | |||
| 7cf403e125 | |||
| 73b7922898 | |||
| 336cb49d98 | |||
| 8cd8e7380f | |||
| 3d9d95db34 | |||
| eb73b1f357 | |||
| f7499294de | |||
| 60f7150008 | |||
| 2b8d90af12 | |||
| 0f803804a4 | |||
| f43feff0aa | |||
| 0bdd5e73df | |||
| 430c0a2f0f | |||
| 1a00bf8069 | |||
| 502f6d12e4 | |||
| a2bc1e6190 | |||
| f73b5f0298 | |||
| 3e1487e614 | |||
| 037566bbba | |||
| b61bc6d07c | |||
| 8d50667b0d | |||
| a0545b6006 | |||
| 78aa2e198f | |||
| b85820cbcd | |||
| 4b85841a3e | |||
| 8d07e72dfe | |||
| 566680fe36 | |||
| 077692db49 | |||
| e4bf53cdaa | |||
| 4489bb21e5 | |||
| ff8b1addf7 | |||
| 3e2c3fc5d9 | |||
| 49ddd1a216 | |||
| 81ca8eaddc | |||
| c9c8d578f3 | |||
| b2203804c7 | |||
| 13dfa9240c | |||
| 0a53c3605a | |||
| 36b0c570aa | |||
| 47a7a2a224 | |||
| 0180cf5224 | |||
| eed32a153c | |||
| f9f3c919d6 | |||
| 4b0d8f75dc | |||
| 033e4cb959 | |||
| 91f621e105 | |||
| 9f60900875 | |||
| 631aa58565 | |||
| b892f90b13 | |||
| 463ba0775f | |||
| cfad4fb035 | |||
| 4e968b4b1c | |||
| 81df52235c | |||
| 1ca2626ad9 | |||
| 9ca93f34c6 | |||
| 0a43b9c849 | |||
| b636fec319 | |||
| 774f7113df | |||
| 0b3bbe0f15 | |||
| 5f0b0a7b83 | 
							
								
								
									
										1
									
								
								.dockerignore
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										1
									
								
								.dockerignore
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1 @@ | |||||||
|  | .git | ||||||
| @@ -1,48 +0,0 @@ | |||||||
| name: '4get CI' |  | ||||||
|  |  | ||||||
| on: |  | ||||||
|   workflow_dispatch: |  | ||||||
|   push: |  | ||||||
|     branches: |  | ||||||
|       - '*' |  | ||||||
|     paths-ignore: |  | ||||||
|       - 'README.md' |  | ||||||
|       - 'docker-compose.yaml' |  | ||||||
|       - '.gitignore' |  | ||||||
|       - 'docs/**' |  | ||||||
|  |  | ||||||
| jobs: |  | ||||||
|   build: |  | ||||||
|     runs-on: docker |  | ||||||
|  |  | ||||||
|     steps: |  | ||||||
|     - uses: actions/checkout@v4 |  | ||||||
|       name: Checkout 4get repository |  | ||||||
|  |  | ||||||
|     - uses: docker/setup-buildx-action@v3 |  | ||||||
|       name: Setup Docker BuildX system |  | ||||||
|  |  | ||||||
|     - name: Login to Docker Container Registry |  | ||||||
|       uses: docker/login-action@v3 |  | ||||||
|       with: |  | ||||||
|         registry: git.lolcat.ca |  | ||||||
|         username: ${{ secrets.USERNAME }} |  | ||||||
|         password: ${{ secrets.TOKEN }} |  | ||||||
|  |  | ||||||
|     - name: Docker meta |  | ||||||
|       id: meta |  | ||||||
|       uses: docker/metadata-action@v5 |  | ||||||
|       with: |  | ||||||
|         images: git.lolcat.ca/lolcat/4get |  | ||||||
|         tags: | |  | ||||||
|           type=sha,format=short,prefix={{date 'YYYY.MM.DD'}}-,enable=${{ github.ref == format('refs/heads/{0}', 'master') }} |  | ||||||
|           type=raw,value=latest,enable=${{ github.ref == format('refs/heads/{0}', 'master') }} |  | ||||||
|  |  | ||||||
|     - uses: docker/build-push-action@v6 |  | ||||||
|       name: Build images |  | ||||||
|       with: |  | ||||||
|         context: . |  | ||||||
|         file: Dockerfile |  | ||||||
|         tags: ${{ steps.meta.outputs.tags }} |  | ||||||
|         platforms: linux/amd64 |  | ||||||
|         push: true |  | ||||||
| @@ -1,10 +1,9 @@ | |||||||
| FROM alpine:latest | FROM alpine:3.21 | ||||||
| WORKDIR /var/www/html/4get | WORKDIR /var/www/html/4get | ||||||
|  |  | ||||||
| RUN apk update && apk upgrade | RUN apk update && apk upgrade | ||||||
| RUN apk add php apache2-ssl php83-fileinfo php83-openssl php83-iconv php83-common php83-dom php83-sodium php83-curl curl php83-pecl-apcu php83-apache2 imagemagick php83-pecl-imagick php-mbstring imagemagick-webp imagemagick-jpeg | RUN apk add php apache2-ssl php84-fileinfo php84-openssl php84-iconv php84-common php84-dom php84-sodium php84-curl curl php84-pecl-apcu php84-apache2 imagemagick php84-pecl-imagick php84-mbstring imagemagick-webp imagemagick-jpeg | ||||||
|  |  | ||||||
| COPY ./docker/apache/ /etc/apache2/ |  | ||||||
| COPY . . | COPY . . | ||||||
|  |  | ||||||
| RUN chmod 777 /var/www/html/4get/icons | RUN chmod 777 /var/www/html/4get/icons | ||||||
| @@ -14,4 +13,5 @@ EXPOSE 443 | |||||||
|  |  | ||||||
| ENV FOURGET_PROTO=http | ENV FOURGET_PROTO=http | ||||||
|  |  | ||||||
| CMD  ["./docker/docker-entrypoint.sh"] | ENTRYPOINT  ["./docker/docker-entrypoint.sh"] | ||||||
|  | CMD ["start"] | ||||||
							
								
								
									
										37
									
								
								README.md
									
									
									
									
									
								
							
							
						
						
									
										37
									
								
								README.md
									
									
									
									
									
								
							| @@ -9,9 +9,11 @@ https://4get.ca/about | |||||||
| ## Official instance | ## Official instance | ||||||
| https://4get.ca , or visit the official instance list: https://4get.ca/instances | https://4get.ca , or visit the official instance list: https://4get.ca/instances | ||||||
|  |  | ||||||
|  | _NOT to be confused with 4get.ch, 4get.lol and friends! I **don't** host these._ | ||||||
|  |  | ||||||
| ## Totally unbiased comparison between alternatives | ## Totally unbiased comparison between alternatives | ||||||
|  |  | ||||||
| |                            | 4get                    | searx(ng) | libreY      | araa      | hearch            | | |                            | 4get                    | searx(ng) | libreY      | araa      | hearch.co         | | ||||||
| |----------------------------|-------------------------|-----------|-------------|-----------|-------------------| | |----------------------------|-------------------------|-----------|-------------|-----------|-------------------| | ||||||
| | RAM usage                  | 200-400mb~              | 2GB~      | 200-400mb~  | 2GB~      | idk               | | | RAM usage                  | 200-400mb~              | 2GB~      | 200-400mb~  | 2GB~      | idk               | | ||||||
| | Does it suck               | no (debunked by snopes) | yes       | yes         | a little  | better than searx | | | Does it suck               | no (debunked by snopes) | yes       | yes         | a little  | better than searx | | ||||||
| @@ -23,27 +25,28 @@ https://4get.ca , or visit the official instance list: https://4get.ca/instances | |||||||
| 3. Bot protection that *actually* filters out the bots (when configured) | 3. Bot protection that *actually* filters out the bots (when configured) | ||||||
| 4. Interface doesn't require javascript | 4. Interface doesn't require javascript | ||||||
| 5. Favicon fetcher with caching support & image proxy | 5. Favicon fetcher with caching support & image proxy | ||||||
| 6. Bunch of other shit | 6. Bunch of other shits | ||||||
|  |  | ||||||
| tl;dr the best way to actually browse for shit. | tl;dr 4get is the best way to browse for shit. | ||||||
|  |  | ||||||
| # Supported websites | # Supported websites | ||||||
|  |  | ||||||
| | Web        | Images       | Videos       | News       | Music      | Autocompleter | | | Web        | Images       | Videos       | News       | Music      | Autocompleter | | ||||||
| |------------|--------------|------------|------------|------------|---------------| | |------------|--------------|--------------|------------|------------|---------------| | ||||||
| | DuckDuckGo | DuckDuckGo   | YouTube      | DuckDuckGo | Soundcloud | Brave         | | | DuckDuckGo | DuckDuckGo   | YouTube      | DuckDuckGo | Soundcloud | Brave         | | ||||||
| | Brave      | Brave        | DuckDuckGo | Brave      |            | DuckDuckGo    | | | Brave      | Brave        | Sepia Search | Brave      |            | DuckDuckGo    | | ||||||
| | Yandex     | Yandex       | Brave      | Google     |            | Yandex        | | | Yandex     | Yandex       | DuckDuckGo   | Google     |            | Yandex        | | ||||||
| | Google     | Google       | Yandex     | Startpage  |            | Google        | | | Google     | Google       | Brave        | Startpage  |            | Google        | | ||||||
| | Startpage  | Startpage    | Google     | Qwant      |            | Startpage     | | | Startpage  | Startpage    | Yandex       | Qwant      |            | Startpage     | | ||||||
| | Qwant      | Qwant        | Startpage  | Mojeek     |            | Kagi          | | | Qwant      | Qwant        | Google       | Mojeek     |            | Kagi          | | ||||||
| | Ghostery   | Yep          | Qwant      |            |            | Qwant         | | | Ghostery   | Yep          | Startpage    | Baidu      |            | Qwant         | | ||||||
| | Yep        | Solofield    | Solofield  |            |            | Ghostery      | | | Yep        | Baidu        | Qwant        |            |            | Ghostery      | | ||||||
| | Greppr     | Imgur        |            |            |            | Yep           | | | Greppr     | Pinterest    | Baidu        |            |            | Yep           | | ||||||
| | Crowdview  | FindThatMeme |            |            |            | Marginalia    | | | Crowdview  | 500px        | Coc Coc      |            |            | Marginalia    | | ||||||
| | Mwmbl      |              |            |            |            | YouTube       | | | Mwmbl      | VSCO         |              |            |            | YouTube       | | ||||||
| | Mojeek     |              |            |            |            | Soundcloud    | | | Mojeek     | Imgur        |              |            |            | Soundcloud    | | ||||||
| | Solofield  |              |            |            |            |               | | | Baidu      | FindThatMeme |              |            |            |               | | ||||||
|  | | Coc Coc    |              |              |            |            |               | | ||||||
| | Marginalia |              |              |            |            |               | | | Marginalia |              |              |            |            |               | | ||||||
| | wiby       |              |              |            |            |               | | | wiby       |              |              |            |            |               | | ||||||
| | Curlie     |              |              |            |            |               | | | Curlie     |              |              |            |            |               | | ||||||
| @@ -52,7 +55,7 @@ tl;dr the best way to actually browse for shit. | |||||||
| Refer to the <a href="https://git.lolcat.ca/lolcat/4get/src/branch/master/docs/">documentation index</a>. I recommend following the <a href="https://git.lolcat.ca/lolcat/4get/src/branch/master/docs/apache2.md">apache2 guide</a>. | Refer to the <a href="https://git.lolcat.ca/lolcat/4get/src/branch/master/docs/">documentation index</a>. I recommend following the <a href="https://git.lolcat.ca/lolcat/4get/src/branch/master/docs/apache2.md">apache2 guide</a>. | ||||||
|  |  | ||||||
| ## Contact | ## Contact | ||||||
| Shit breaks all the time but I repair it all the time too... Email me here: <b>will (at) lolcat.ca</b> or create an issue. | Shit breaks all the time but I repair it all the time too. Email me here: <b>will (at) lolcat.ca</b> or create an issue. | ||||||
|  |  | ||||||
| ## License | ## License | ||||||
| AGPL | AGPL | ||||||
|   | |||||||
							
								
								
									
										19
									
								
								api.txt
									
									
									
									
									
								
							
							
						
						
									
										19
									
								
								api.txt
									
									
									
									
									
								
							| @@ -1,9 +1,16 @@ | |||||||
|                         __ __             __ |                    44 | ||||||
|                        / // / ____ ____  / /_ |                  4444444      44    | ||||||
|                       / // /_/ __ `/ _ \/ __/ |                  44444444   44444       444 | ||||||
|                      /__  __/ /_/ /  __/ /_  |                  44444444  444444    444444444 | ||||||
|                        /_/  \__, /\___/\__/ |                   44444   44444444  444444444 | ||||||
|                            /____/          |                          444444444   4444444 | ||||||
|  |                         4444444444    444444 | ||||||
|  |                       4444444444444 | ||||||
|  |                     444444444444444444 | ||||||
|  |                        444444444444444 | ||||||
|  |                           44444444 | ||||||
|  |                           4444 | ||||||
|  |                            44 | ||||||
|                   |                   | ||||||
|            + Welcome to the 4get API documentation + |            + Welcome to the 4get API documentation + | ||||||
|  |  | ||||||
|   | |||||||
							
								
								
									
										8
									
								
								data/api_keys/google_api.txt
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										8
									
								
								data/api_keys/google_api.txt
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,8 @@ | |||||||
|  | # Specify API keys for the Google API in the following format: | ||||||
|  | # <key> | ||||||
|  | # | ||||||
|  | # Generate keys here: | ||||||
|  | # https://developers.google.com/custom-search/v1/overview | ||||||
|  | # Make sure to use a different Google account for each key, cause I'm | ||||||
|  | # pretty sure the ratelimit is on a per-account basis :P | ||||||
|  | # | ||||||
| @@ -43,7 +43,7 @@ class config{ | |||||||
| 	 | 	 | ||||||
| 	// If this regex expression matches on the user agent, it blocks the request | 	// If this regex expression matches on the user agent, it blocks the request | ||||||
| 	// Not useful at all against a targetted attack | 	// Not useful at all against a targetted attack | ||||||
| 	const HEADER_REGEX = '/bot|wget|curl|python-requests|scrapy|go-http-client|ruby|yahoo|spider|qwant/i'; | 	const HEADER_REGEX = '/bot|wget|curl|python-requests|scrapy|go-http-client|ruby|yahoo|spider|qwant|meta/i'; | ||||||
| 	 | 	 | ||||||
| 	// Block clients who present any of the following headers in their request (SPECIFY IN !!lowercase!!) | 	// Block clients who present any of the following headers in their request (SPECIFY IN !!lowercase!!) | ||||||
| 	// Eg: ["x-forwarded-for", "x-via", "forwarded-for", "via"]; | 	// Eg: ["x-forwarded-for", "x-via", "forwarded-for", "via"]; | ||||||
| @@ -100,7 +100,6 @@ class config{ | |||||||
| 		"https://4get.sijh.net", | 		"https://4get.sijh.net", | ||||||
| 		"https://4get.hbubli.cc", | 		"https://4get.hbubli.cc", | ||||||
| 		"https://4get.plunked.party", | 		"https://4get.plunked.party", | ||||||
| 		"https://4get.seitan-ayoub.lol", |  | ||||||
| 		"https://4get.etenie.pl", | 		"https://4get.etenie.pl", | ||||||
| 		"https://4get.lunar.icu", | 		"https://4get.lunar.icu", | ||||||
| 		"https://4get.dcs0.hu", | 		"https://4get.dcs0.hu", | ||||||
| @@ -119,7 +118,7 @@ class config{ | |||||||
| 	 | 	 | ||||||
| 	// Default user agent to use for scraper requests. Sometimes ignored to get specific webpages | 	// Default user agent to use for scraper requests. Sometimes ignored to get specific webpages | ||||||
| 	// Changing this might break things. | 	// Changing this might break things. | ||||||
| 	const USER_AGENT = "Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:131.0) Gecko/20100101 Firefox/131.0"; | 	const USER_AGENT = "Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:142.0) Gecko/20100101 Firefox/142.0"; | ||||||
| 	 | 	 | ||||||
| 	// Proxy pool assignments for each scraper | 	// Proxy pool assignments for each scraper | ||||||
| 	// false = Use server's raw IP | 	// false = Use server's raw IP | ||||||
| @@ -129,9 +128,14 @@ class config{ | |||||||
| 	const PROXY_BRAVE = false; | 	const PROXY_BRAVE = false; | ||||||
| 	const PROXY_FB = false; // facebook | 	const PROXY_FB = false; // facebook | ||||||
| 	const PROXY_GOOGLE = false; | 	const PROXY_GOOGLE = false; | ||||||
|  | 	const PROXY_GOOGLE_API = false; | ||||||
| 	const PROXY_GOOGLE_CSE = false; | 	const PROXY_GOOGLE_CSE = false; | ||||||
|  | 	const PROXY_MULLVAD_GOOGLE = false; | ||||||
|  | 	const PROXY_MULLVAD_BRAVE = false; | ||||||
| 	const PROXY_STARTPAGE = false; | 	const PROXY_STARTPAGE = false; | ||||||
| 	const PROXY_QWANT = false; | 	const PROXY_QWANT = false; | ||||||
|  | 	const PROXY_BAIDU = false; | ||||||
|  | 	const PROXY_COCCOC = false; | ||||||
| 	const PROXY_GHOSTERY = false; | 	const PROXY_GHOSTERY = false; | ||||||
| 	const PROXY_MARGINALIA = false; | 	const PROXY_MARGINALIA = false; | ||||||
| 	const PROXY_MOJEEK = false; | 	const PROXY_MOJEEK = false; | ||||||
| @@ -141,8 +145,16 @@ class config{ | |||||||
| 	const PROXY_WIBY = false; | 	const PROXY_WIBY = false; | ||||||
| 	const PROXY_CURLIE = false; | 	const PROXY_CURLIE = false; | ||||||
| 	const PROXY_YT = false; // youtube | 	const PROXY_YT = false; // youtube | ||||||
|  | 	const PROXY_ARCHIVEORG = false; | ||||||
|  | 	const PROXY_SEPIASEARCH = false; | ||||||
|  | 	const PROXY_ODYSEE = false; | ||||||
|  | 	const PROXY_VIMEO = false; | ||||||
| 	const PROXY_YEP = false; | 	const PROXY_YEP = false; | ||||||
| 	const PROXY_PINTEREST = false; | 	const PROXY_PINTEREST = false; | ||||||
|  | 	const PROXY_SANKAKUCOMPLEX = false; | ||||||
|  | 	const PROXY_FLICKR = false; | ||||||
|  | 	const PROXY_FIVEHPX = false; | ||||||
|  | 	const PROXY_VSCO = false; | ||||||
| 	const PROXY_SEZNAM = false; | 	const PROXY_SEZNAM = false; | ||||||
| 	const PROXY_NAVER = false; | 	const PROXY_NAVER = false; | ||||||
| 	const PROXY_GREPPR = false; | 	const PROXY_GREPPR = false; | ||||||
| @@ -150,6 +162,7 @@ class config{ | |||||||
| 	const PROXY_MWMBL = false; | 	const PROXY_MWMBL = false; | ||||||
| 	const PROXY_FTM = false; // findthatmeme | 	const PROXY_FTM = false; // findthatmeme | ||||||
| 	const PROXY_IMGUR = false; | 	const PROXY_IMGUR = false; | ||||||
|  | 	const PROXY_CARA = false; | ||||||
| 	const PROXY_YANDEX_W = false; // yandex web | 	const PROXY_YANDEX_W = false; // yandex web | ||||||
| 	const PROXY_YANDEX_I = false; // yandex images | 	const PROXY_YANDEX_I = false; // yandex images | ||||||
| 	const PROXY_YANDEX_V = false; // yandex videos | 	const PROXY_YANDEX_V = false; // yandex videos | ||||||
| @@ -158,7 +171,7 @@ class config{ | |||||||
| 	// Scraper-specific parameters | 	// Scraper-specific parameters | ||||||
| 	// | 	// | ||||||
| 	 | 	 | ||||||
| 	// GOOGLE CSE | 	// GOOGLE CSE & GOOGLE API | ||||||
| 	const GOOGLE_CX_ENDPOINT = "d4e68b99b876541f0"; | 	const GOOGLE_CX_ENDPOINT = "d4e68b99b876541f0"; | ||||||
| 	 | 	 | ||||||
| 	// MARGINALIA | 	// MARGINALIA | ||||||
|   | |||||||
| @@ -6,14 +6,15 @@ services: | |||||||
|     image: luuul/4get:latest |     image: luuul/4get:latest | ||||||
|     restart: unless-stopped |     restart: unless-stopped | ||||||
|     environment: |     environment: | ||||||
|  |       - FOURGET_PROTO=http | ||||||
|       - FOURGET_SERVER_NAME=4get.ca |       - FOURGET_SERVER_NAME=4get.ca | ||||||
|  |       - FOURGET_INSTANCES=https://4get.ca | ||||||
|  |  | ||||||
|     ports: |     ports: | ||||||
|       - "80:80" |       - "80:80" | ||||||
|       - "443:443" |       - "443:443" | ||||||
|  |  | ||||||
|     volumes: |     # volumes: | ||||||
|       - /etc/letsencrypt/live/domain.tld:/etc/4get/certs |     # - /etc/letsencrypt/live/domain.tld:/etc/4get/certs # mount ssl | ||||||
|       # mount custom banners and captcha |     # - ./banners:/var/www/html/4get/banner # mount custom banners | ||||||
|       - ./banners:/var/www/html/4get/banner |     # - ./captcha:/var/www/html/4get/data/captcha # mount captcha images | ||||||
|       - ./captcha:/var/www/html/4get/data/captcha |  | ||||||
|   | |||||||
							
								
								
									
										1
									
								
								docker/apache/http/conf.d/ssl.conf
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										1
									
								
								docker/apache/http/conf.d/ssl.conf
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1 @@ | |||||||
|  | # intentionally blank | ||||||
| @@ -8,18 +8,27 @@ FOURGET_PROTO="${FOURGET_PROTO#\"}" | |||||||
| # make lowercase | # make lowercase | ||||||
| FOURGET_PROTO=`echo $FOURGET_PROTO | awk '{print tolower($0)}'` | FOURGET_PROTO=`echo $FOURGET_PROTO | awk '{print tolower($0)}'` | ||||||
|  |  | ||||||
|  | FOURGET_SRC='/var/www/html/4get' | ||||||
|  |  | ||||||
|  | mkdir -p /etc/apache2 | ||||||
|  |  | ||||||
| if [ "$FOURGET_PROTO" = "https" ]; then | if [ "$FOURGET_PROTO" = "https" ]; then | ||||||
|         echo "Using https configuration" |         echo "Using https configuration" | ||||||
|         cp /etc/apache2/https.conf /etc/apache2/httpd.conf |         cp -r ${FOURGET_SRC}/docker/apache/https/httpd.conf /etc/apache2 | ||||||
|  |         cp -r ${FOURGET_SRC}/docker/apache/https/conf.d/* /etc/apache2/conf.d | ||||||
|  |  | ||||||
| else | else | ||||||
|         echo "Using http configuration" |         echo "Using http configuration" | ||||||
|         cp /etc/apache2/http.conf /etc/apache2/httpd.conf |         cp -r ${FOURGET_SRC}/docker/apache/http/httpd.conf /etc/apache2 | ||||||
|  |         cp -r ${FOURGET_SRC}/docker/apache/http/conf.d/* /etc/apache2/conf.d | ||||||
| fi | fi | ||||||
|  |  | ||||||
| php ./docker/gen_config.php | php ./docker/gen_config.php | ||||||
|  |  | ||||||
|  | if [ "$@" = "start" ]; then | ||||||
| echo "4get is running" |         echo "4get is running" | ||||||
| exec httpd -DFOREGROUND |         exec httpd -DFOREGROUND | ||||||
|  | else  | ||||||
|  |         exec "$@" | ||||||
|  | fi | ||||||
|  |  | ||||||
|   | |||||||
| @@ -7,27 +7,35 @@ Then, install the following dependencies: | |||||||
| ```sh | ```sh | ||||||
| apt update | apt update | ||||||
| apt upgrade | apt upgrade | ||||||
| apt install php-mbstring apache2 certbot php-imagick imagemagick php-curl curl php-apcu git libapache2-mod-php | apt install php-mbstring apache2 certbot php-imagick imagemagick php-curl curl php-apcu git libapache2-mod-fcgid php-fpm | ||||||
| ``` | ``` | ||||||
|  |  | ||||||
| Enable the required modules: | Enable the required modules: | ||||||
| ```sh | ```sh | ||||||
|  | a2dismod mpm_prefork | ||||||
|  | a2enmod mpm_event | ||||||
| a2enmod ssl | a2enmod ssl | ||||||
| a2enmod rewrite | a2enmod rewrite | ||||||
|  | a2enmod proxy_fcgi setenvif actions alias | ||||||
|  | a2enmod http2 | ||||||
|  | a2enmod headers | ||||||
|  | a2enmod proxy | ||||||
| ``` | ``` | ||||||
|  |  | ||||||
| And enable these optional ones, which might be useful to you later on. The `proxy` module is useful for setting up reverse proxies to services like gitea, and `headers` is useful to tweak global header values: | Tune the performance of php-fpm. You will need to edit this file according to your server specs and number of users. Edit the file at `/etc/php/8.4/pool.d/www.conf`: | ||||||
| ```sh | ```sh | ||||||
| a2enmod proxy | pm = static | ||||||
| a2enmod headers | pm.max_children = 50 | ||||||
| ``` | ``` | ||||||
|  |  | ||||||
|  | These values are what I currently use on 4get.ca, but for personal use, you can set `pm` to `ondemand` and `pm.max_children` to `20` (if you want those thumbnails to load fast!) | ||||||
|  |  | ||||||
| Now, restart apache2: | Now, restart apache2: | ||||||
| ```sh | ```sh | ||||||
| service apache2 restart | service apache2 restart | ||||||
| ``` | ``` | ||||||
|  |  | ||||||
| Just for good measure, please check if your webserver is running. Access it through HTTP, not HTTPS. You should see the apache2 default landing page. | Just for good measure, please check if your webserver is running. Access it through HTTP, not HTTPS. You should see the apache2 default landing page. Just a note, http2 won't work just yet since you don't have SSL yet. | ||||||
|  |  | ||||||
| ## 000-default.conf | ## 000-default.conf | ||||||
| Now, edit the following file: `/etc/apache2/sites-available/000-default.conf`, remove everything and carefully add each rule specified here, while making sure to replace my domains with your own: | Now, edit the following file: `/etc/apache2/sites-available/000-default.conf`, remove everything and carefully add each rule specified here, while making sure to replace my domains with your own: | ||||||
| @@ -74,12 +82,27 @@ Now, edit the following file: `/etc/apache2/sites-available/000-default.conf`, r | |||||||
|  |  | ||||||
| 	DocumentRoot /var/www/4get | 	DocumentRoot /var/www/4get | ||||||
| 	 | 	 | ||||||
|  | 	<FilesMatch \.php$> | ||||||
|  | 		SetHandler "proxy:unix:/run/php/php8.1-fpm.sock|fcgi://localhost/" | ||||||
|  | 	</FilesMatch> | ||||||
|  | 	 | ||||||
| 	Options -MultiViews | 	Options -MultiViews | ||||||
| 	RewriteEngine On | 	RewriteEngine On | ||||||
| 	RewriteCond %{REQUEST_FILENAME} !-d | 	RewriteCond %{REQUEST_FILENAME} !-d | ||||||
| 	RewriteCond %{REQUEST_FILENAME} !-f | 	RewriteCond %{REQUEST_FILENAME} !-f | ||||||
| 	RewriteRule ^([^\.]+)$ $1.php [NC,L] | 	RewriteRule ^([^\.]+)$ $1.php [NC,L] | ||||||
| 	 | 	 | ||||||
|  | 	<Directory /var/www/4get> | ||||||
|  | 		Options -MultiViews | ||||||
|  | 		AllowOverride All | ||||||
|  | 		Require all granted | ||||||
|  | 		 | ||||||
|  | 		RewriteEngine On | ||||||
|  | 		RewriteCond %{REQUEST_FILENAME} !-d | ||||||
|  | 		RewriteCond %{REQUEST_FILENAME} !-f | ||||||
|  | 		RewriteRule ^([^\.]+)$ $1.php [NC,L] | ||||||
|  | 	</Directory> | ||||||
|  | 	 | ||||||
| 	# deny access to private resources | 	# deny access to private resources | ||||||
| 	<Directory /var/www/4get/data/> | 	<Directory /var/www/4get/data/> | ||||||
| 		Order Deny,allow | 		Order Deny,allow | ||||||
| @@ -116,6 +139,7 @@ Make sure to replace `4get.ca` with your own domain under the `SSLCertificate*` | |||||||
| 	ServerAdmin will@lolcat.ca | 	ServerAdmin will@lolcat.ca | ||||||
| 	DocumentRoot /var/www/4get | 	DocumentRoot /var/www/4get | ||||||
| 	 | 	 | ||||||
|  | 	Protocols h2 http/1.1 | ||||||
| 	SSLEngine On | 	SSLEngine On | ||||||
| 	SSLOptions +StdEnvVars | 	SSLOptions +StdEnvVars | ||||||
| 	 | 	 | ||||||
| @@ -128,6 +152,10 @@ Make sure to replace `4get.ca` with your own domain under the `SSLCertificate*` | |||||||
| 	AddOutputFilterByType DEFLATE text/plain | 	AddOutputFilterByType DEFLATE text/plain | ||||||
| 	AddOutputFilterByType DEFLATE text/css | 	AddOutputFilterByType DEFLATE text/css | ||||||
| 	 | 	 | ||||||
|  | 	<FilesMatch \.php$> | ||||||
|  | 		SetHandler "proxy:unix:/run/php/php8.1-fpm.sock|fcgi://localhost/" | ||||||
|  | 	</FilesMatch> | ||||||
|  | 	 | ||||||
| 	SSLCertificateFile /etc/letsencrypt/live/4get.ca/fullchain.pem | 	SSLCertificateFile /etc/letsencrypt/live/4get.ca/fullchain.pem | ||||||
| 	SSLCertificateKeyFile /etc/letsencrypt/live/4get.ca/privkey.pem | 	SSLCertificateKeyFile /etc/letsencrypt/live/4get.ca/privkey.pem | ||||||
| 	SSLCertificateChainFile /etc/letsencrypt/live/4get.ca/chain.pem | 	SSLCertificateChainFile /etc/letsencrypt/live/4get.ca/chain.pem | ||||||
|   | |||||||
| @@ -9,34 +9,47 @@ Welcome! This guide assumes that you have a working 4get instance. This will hel | |||||||
| 4. The captcha font is located in `data/fonts/captcha.ttf` | 4. The captcha font is located in `data/fonts/captcha.ttf` | ||||||
|  |  | ||||||
| # Cloudflare bypass (TLS check) | # Cloudflare bypass (TLS check) | ||||||
| **Note: this only allows you to bypass the browser integrity checks. Captchas & javascript challenges will not be bypassed.** | >These instructions have been updated to work with Debian 13 Trixie. | ||||||
|  |  | ||||||
| Configuring this lets you fetch images sitting behind Cloudflare and allows you to scrape the **Yep** & the **Mwmbl** search engines. Please be aware that APT will fight against you and will re-install the openSSL-version of curl constantly when updating. | **Note: this only allows you to bypass the browser integrity checks. Captchas & javascript challenges will not be bypassed by this program!** | ||||||
|  |  | ||||||
| First, follow these instructions. Only install the Firefox modules: | Configuring this lets you fetch images sitting behind Cloudflare and allows you to scrape the **Yep** search engine. | ||||||
|  |  | ||||||
| https://github.com/lwthiker/curl-impersonate/blob/main/INSTALL.md#native-build | To come up with this set of instructions, I used [this guide](https://github.com/lwthiker/curl-impersonate/blob/main/INSTALL.md#native-build) as a reference, but trust me you probably want to stick to what's written on this page. | ||||||
|  |  | ||||||
| Once you did this, you should be able to run the following inside your terminal: |  | ||||||
|  |  | ||||||
|  | First, compile curl-impersonate (the firefox flavor). | ||||||
| ```sh | ```sh | ||||||
| $ curl_ff117 --version | git clone https://github.com/lwthiker/curl-impersonate/ | ||||||
| curl 8.1.1 (x86_64-pc-linux-gnu) libcurl/8.1.1 NSS/3.92 zlib/1.2.13 brotli/1.0.9 zstd/1.5.4 libidn2/2.3.3 nghttp2/1.56.0 | cd curl-impersonate | ||||||
| Release-Date: 2023-05-23 | sudo apt install build-essential pkg-config cmake ninja-build curl autoconf automake libtool python3-pip libnss3 libnss3-dev | ||||||
| Protocols: dict file ftp ftps gopher gophers http https imap imaps mqtt pop3 pop3s rtsp smb smbs smtp smtps telnet tftp ws wss | mkdir build | ||||||
| Features: alt-svc AsynchDNS brotli HSTS HTTP2 HTTPS-proxy IDN IPv6 Largefile libz NTLM NTLM_WB SSL threadsafe UnixSockets zstd | cd build | ||||||
| ``` | ../configure | ||||||
| Now, after compiling, you should have a `libcurl-impersonate-ff.so` sitting somewhere. Mine (on my debian install) is located at `/usr/local/lib/libcurl-impersonate-ff.so`. | make firefox-build | ||||||
|  | sudo make firefox-install | ||||||
| Find the `libcurl.so.4` file used by your current installation of curl. For me, this file is located at `/usr/lib/x86_64-linux-gnu/libcurl.so.4` | sudo ldconfig | ||||||
|  |  | ||||||
| Now comes the sketchy part: replace `libcurl.so.4` with `libcurl-impersonate-ff.so`. You can do this in the following way: |  | ||||||
| ```sh |  | ||||||
| sudo rm /usr/lib/x86_64-linux-gnu/libcurl.so.4 |  | ||||||
| sudo cp /usr/local/lib/libcurl-impersonate-ff.so /usr/lib/x86_64-linux-gnu/libcurl.so.4 |  | ||||||
| ``` | ``` | ||||||
|  |  | ||||||
| Make sure to restart your webserver and/or PHP daemon, otherwise it will keep using the old library. You should now be able to bypass Cloudflare's shitty checks!! | Now, after compiling, you should have a `libcurl-impersonate-ff.so` sitting somewhere. Mine is located at `/usr/local/lib/libcurl-impersonate-ff.so`. Patch your PHP install so that it loads the right library: | ||||||
|  |  | ||||||
|  | ```sh | ||||||
|  | sudo systemctl edit php8.4-fpm.service | ||||||
|  | ``` | ||||||
|  |  | ||||||
|  | ^This will open a text editor. Add the following shit in there, in between those 2 comments I pasted for ya just for reference: | ||||||
|  |  | ||||||
|  | ```sh | ||||||
|  | ### Editing /etc/systemd/system/php8.4-fpm.service.d/override.conf | ||||||
|  | ### Anything between here and the comment below will become the contents of the> | ||||||
|  |  | ||||||
|  | [Service] | ||||||
|  | Environment="LD_PRELOAD=/usr/local/lib/libcurl-impersonate-ff.so" | ||||||
|  | Environment="CURL_IMPERSONATE=firefox117" | ||||||
|  |  | ||||||
|  | ### Edits below this comment will be discarded | ||||||
|  | ``` | ||||||
|  |  | ||||||
|  | Restart php8.4-fpm. (`sudo service php8.4-fpm restart`). To test things out, try making a search on "Yep", they check for SSL. If you get results (or a timeout, this piece of shit engine is slow as fuck) that means it works! | ||||||
|  |  | ||||||
| # Robots.txt | # Robots.txt | ||||||
| Make sure you configure this right to optimize your search engine presence! Head over to `/robots.txt` and change the 4get.ca domain to your own domain. | Make sure you configure this right to optimize your search engine presence! Head over to `/robots.txt` and change the 4get.ca domain to your own domain. | ||||||
|   | |||||||
| @@ -15,7 +15,12 @@ class favicon{ | |||||||
| 		 | 		 | ||||||
| 		header("Content-Type: image/png"); | 		header("Content-Type: image/png"); | ||||||
| 		 | 		 | ||||||
| 		if(substr_count($url, "/") !== 2){ | 		if( | ||||||
|  | 			preg_match( | ||||||
|  | 				'/^https?:\/\/[A-Za-z0-9.-]+$/', | ||||||
|  | 				$url | ||||||
|  | 			) === 0 | ||||||
|  | 		){ | ||||||
| 			 | 			 | ||||||
| 			header("X-Error: Only provide the protocol and domain"); | 			header("X-Error: Only provide the protocol and domain"); | ||||||
| 			$this->defaulticon(); | 			$this->defaulticon(); | ||||||
|   | |||||||
							
								
								
									
										100
									
								
								lib/anubis.php
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										100
									
								
								lib/anubis.php
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,100 @@ | |||||||
|  | <?php | ||||||
|  |  | ||||||
|  | // | ||||||
|  | // Reference | ||||||
|  | // https://github.com/TecharoHQ/anubis/blob/ecc716940e34ebe7249974f2789a99a2c7115e4e/web/js/proof-of-work.mjs | ||||||
|  | // | ||||||
|  |  | ||||||
|  | class anubis{ | ||||||
|  | 	 | ||||||
|  | 	public function __construct(){ | ||||||
|  | 		 | ||||||
|  | 		include_once "fuckhtml.php"; | ||||||
|  | 		$this->fuckhtml = new fuckhtml(); | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	public function scrape($html){ | ||||||
|  | 		 | ||||||
|  | 		$this->fuckhtml->load($html); | ||||||
|  | 		 | ||||||
|  | 		$script = | ||||||
|  | 			$this->fuckhtml | ||||||
|  | 			->getElementById( | ||||||
|  | 				"anubis_challenge", | ||||||
|  | 				"script" | ||||||
|  | 			); | ||||||
|  | 		 | ||||||
|  | 		if($script === false){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("Failed to scrape anubis challenge data"); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		$script = | ||||||
|  | 			json_decode( | ||||||
|  | 				$this->fuckhtml | ||||||
|  | 				->getTextContent( | ||||||
|  | 					$script | ||||||
|  | 				), | ||||||
|  | 				true | ||||||
|  | 			); | ||||||
|  | 		 | ||||||
|  | 		if($script === null){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("Failed to decode anubis challenge data"); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		if( | ||||||
|  | 			!isset($script["challenge"]) || | ||||||
|  | 			!isset($script["rules"]["difficulty"]) || | ||||||
|  | 			!is_int($script["rules"]["difficulty"]) || | ||||||
|  | 			!is_string($script["challenge"]) | ||||||
|  | 		){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("Found invalid challenge data"); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		return $this->rape($script["challenge"], $script["rules"]["difficulty"]); | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	private function is_valid_hash($hash, $difficulty){ | ||||||
|  | 		 | ||||||
|  | 		for ($i=0; $i<$difficulty; $i++) { | ||||||
|  | 			 | ||||||
|  | 			$index = (int)floor($i / 2); | ||||||
|  | 			$nibble = $i % 2; | ||||||
|  | 			 | ||||||
|  | 			$byte = ord($hash[$index]); | ||||||
|  | 			$nibble = ($byte >> ($nibble === 0 ? 4 : 0)) & 0x0f; | ||||||
|  | 			 | ||||||
|  | 			if($nibble !== 0){ | ||||||
|  | 				return false; | ||||||
|  | 			} | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		return true; | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	public function rape($data, $difficulty = 5){ | ||||||
|  | 		 | ||||||
|  | 		$nonce = 0; | ||||||
|  | 		 | ||||||
|  | 		while(true){ | ||||||
|  | 			 | ||||||
|  | 			$hash_binary = hash("sha256", $data . $nonce, true); | ||||||
|  | 			 | ||||||
|  | 			if($this->is_valid_hash($hash_binary, $difficulty)){ | ||||||
|  | 				 | ||||||
|  | 				$hash_hex = bin2hex($hash_binary); | ||||||
|  | 				 | ||||||
|  | 				return [ | ||||||
|  | 					"response" => $hash_hex, | ||||||
|  | 					//"data" => $data, | ||||||
|  | 					//"difficulty" => $difficulty, | ||||||
|  | 					"nonce" => $nonce | ||||||
|  | 				]; | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			$nonce++; | ||||||
|  | 		} | ||||||
|  | 	} | ||||||
|  | } | ||||||
| @@ -9,7 +9,7 @@ class backend{ | |||||||
| 	/* | 	/* | ||||||
| 		Proxy stuff | 		Proxy stuff | ||||||
| 	*/ | 	*/ | ||||||
| 	public function get_ip(){ | 	public function get_ip($proxy_index_raw = null){ | ||||||
| 		 | 		 | ||||||
| 		$pool = constant("config::PROXY_" . strtoupper($this->scraper)); | 		$pool = constant("config::PROXY_" . strtoupper($this->scraper)); | ||||||
| 		if($pool === false){ | 		if($pool === false){ | ||||||
| @@ -19,7 +19,10 @@ class backend{ | |||||||
| 		} | 		} | ||||||
| 		 | 		 | ||||||
| 		// indent | 		// indent | ||||||
|  | 		if($proxy_index_raw === null){ | ||||||
|  | 			 | ||||||
| 			$proxy_index_raw = apcu_inc("p." . $this->scraper); | 			$proxy_index_raw = apcu_inc("p." . $this->scraper); | ||||||
|  | 		} | ||||||
| 		 | 		 | ||||||
| 		$proxylist = file_get_contents("data/proxies/" . $pool . ".txt"); | 		$proxylist = file_get_contents("data/proxies/" . $pool . ".txt"); | ||||||
| 		$proxylist = explode("\n", $proxylist); | 		$proxylist = explode("\n", $proxylist); | ||||||
| @@ -32,6 +35,12 @@ class backend{ | |||||||
| 		 | 		 | ||||||
| 		$proxylist = array_values($proxylist); | 		$proxylist = array_values($proxylist); | ||||||
| 		 | 		 | ||||||
|  | 		if(count($proxylist) === 0){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("A proxy list was specified but it's empty!"); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		//echo $proxylist[$proxy_index_raw % count($proxylist)]; | ||||||
| 		return $proxylist[$proxy_index_raw % count($proxylist)]; | 		return $proxylist[$proxy_index_raw % count($proxylist)]; | ||||||
| 	} | 	} | ||||||
| 	 | 	 | ||||||
| @@ -75,6 +84,7 @@ class backend{ | |||||||
| 				break; | 				break; | ||||||
| 			 | 			 | ||||||
| 			case "socks5_hostname": | 			case "socks5_hostname": | ||||||
|  | 			case "socks5h": | ||||||
| 			case "socks5a": | 			case "socks5a": | ||||||
| 				curl_setopt($curlproc, CURLOPT_PROXYTYPE, CURLPROXY_SOCKS5_HOSTNAME); | 				curl_setopt($curlproc, CURLOPT_PROXYTYPE, CURLPROXY_SOCKS5_HOSTNAME); | ||||||
| 				curl_setopt($curlproc, CURLOPT_PROXY, $address . ":" . $port); | 				curl_setopt($curlproc, CURLOPT_PROXY, $address . ":" . $port); | ||||||
| @@ -87,6 +97,30 @@ class backend{ | |||||||
| 		} | 		} | ||||||
| 	} | 	} | ||||||
| 	 | 	 | ||||||
|  | 	// API key rotation | ||||||
|  | 	public function get_key(){ | ||||||
|  | 		 | ||||||
|  | 		$keys = file_get_contents("data/api_keys/" . $this->scraper . ".txt"); | ||||||
|  | 		$keys = explode("\n", $keys); | ||||||
|  | 		 | ||||||
|  | 		$keys = array_filter($keys, function($entry){ | ||||||
|  | 			$entry = ltrim($entry); | ||||||
|  | 			return strlen($entry) > 0 && substr($entry, 0, 1) != "#"; | ||||||
|  | 		}); | ||||||
|  | 		 | ||||||
|  | 		$keys = array_values($keys); | ||||||
|  | 		 | ||||||
|  | 		if(count($keys) === 0){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("Please specify API keys in data/api_keys/" . $this->scraper . ".txt"); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		$increment = apcu_inc("s." . $this->scraper) % count($keys); | ||||||
|  | 		return [ | ||||||
|  | 			"key" => $keys[$increment], | ||||||
|  | 			"increment" => $increment | ||||||
|  | 		]; | ||||||
|  | 	} | ||||||
| 	 | 	 | ||||||
| 	 | 	 | ||||||
| 	/* | 	/* | ||||||
|   | |||||||
| @@ -1,144 +0,0 @@ | |||||||
| <?php |  | ||||||
|  |  | ||||||
| // https://www.bing.com/search?q=url%3Ahttps%3A%2F%2Flolcat.ca |  | ||||||
| // https://cc.bingj.com/cache.aspx?q=url%3ahttps%3a%2f%2flolcat.ca&d=4769685974291356&mkt=en-CA&setlang=en-US&w=tEsWuE7HW3Z5AIPQMVkDH4WaotS4LrK- |  | ||||||
| // <div class="b_attribution" u="0N|5119|4769685974291356|tEsWuE7HW3Z5AIPQMVkDH4WaotS4LrK-" tabindex="0"> |  | ||||||
|  |  | ||||||
| new bingcache(); |  | ||||||
|  |  | ||||||
| class bingcache{ |  | ||||||
| 	 |  | ||||||
| 	public function __construct(){ |  | ||||||
| 		 |  | ||||||
| 		if( |  | ||||||
| 			!isset($_GET["s"]) || |  | ||||||
| 			$this->validate_url($_GET["s"]) === false |  | ||||||
| 		){ |  | ||||||
| 			 |  | ||||||
| 			var_dump($this->validate_url($_GET["s"])); |  | ||||||
| 			$this->do404("Please provide a valid URL."); |  | ||||||
| 		} |  | ||||||
| 		 |  | ||||||
| 		$url = $_GET["s"]; |  | ||||||
| 		 |  | ||||||
| 		$curlproc = curl_init(); |  | ||||||
| 		 |  | ||||||
| 		curl_setopt( |  | ||||||
| 			$curlproc, |  | ||||||
| 			CURLOPT_URL, |  | ||||||
| 			"https://www.bing.com/search?q=url%3A" . |  | ||||||
| 			urlencode($url) |  | ||||||
| 		); |  | ||||||
| 		 |  | ||||||
| 		curl_setopt($curlproc, CURLOPT_ENCODING, ""); // default encoding |  | ||||||
| 		curl_setopt( |  | ||||||
| 			$curlproc, |  | ||||||
| 			CURLOPT_HTTPHEADER, |  | ||||||
| 			["User-Agent: Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:107.0) Gecko/20100101 Firefox/107.0", |  | ||||||
| 			"Accept: text/html,application/xhtml+xml,application/xml;q=0.9,image/avif,image/webp,*/*;q=0.8", |  | ||||||
| 			"Accept-Language: en-US,en;q=0.5", |  | ||||||
| 			"Accept-Encoding: gzip", |  | ||||||
| 			"DNT: 1", |  | ||||||
| 			"Connection: keep-alive", |  | ||||||
| 			"Upgrade-Insecure-Requests: 1", |  | ||||||
| 			"Sec-Fetch-Dest: document", |  | ||||||
| 			"Sec-Fetch-Mode: navigate", |  | ||||||
| 			"Sec-Fetch-Site: none", |  | ||||||
| 			"Sec-Fetch-User: ?1"] |  | ||||||
| 		); |  | ||||||
| 		 |  | ||||||
| 		curl_setopt($curlproc, CURLOPT_RETURNTRANSFER, true); |  | ||||||
| 		curl_setopt($curlproc, CURLOPT_SSL_VERIFYHOST, 2); |  | ||||||
| 		curl_setopt($curlproc, CURLOPT_SSL_VERIFYPEER, true); |  | ||||||
| 		curl_setopt($curlproc, CURLOPT_CONNECTTIMEOUT, 5); |  | ||||||
| 		 |  | ||||||
| 		$data = curl_exec($curlproc); |  | ||||||
| 		 |  | ||||||
| 		if(curl_errno($curlproc)){ |  | ||||||
| 			 |  | ||||||
| 			$this->do404("Failed to connect to bing servers. Please try again later."); |  | ||||||
| 		} |  | ||||||
| 		 |  | ||||||
| 		curl_close($curlproc); |  | ||||||
| 		 |  | ||||||
| 		preg_match( |  | ||||||
| 			'/<div class="b_attribution" u="(.*)" tabindex="0">/', |  | ||||||
| 			$data, |  | ||||||
| 			$keys |  | ||||||
| 		); |  | ||||||
| 		 |  | ||||||
| 		print_r($keys); |  | ||||||
| 		 |  | ||||||
| 		if(count($keys) === 0){ |  | ||||||
| 			 |  | ||||||
| 			$this->do404("Bing has not archived this URL."); |  | ||||||
| 		} |  | ||||||
| 		 |  | ||||||
| 		$keys = explode("|", $keys[1]); |  | ||||||
| 		$count = count($keys); |  | ||||||
| 		 |  | ||||||
| 		//header("Location: https://cc.bingj.com/cache.aspx?d=" . $keys[$count - 2] . "&w=" . $keys[$count - 1]); |  | ||||||
| 		echo("Location: https://cc.bingj.com/cache.aspx?d=" . $keys[$count - 2] . "&w=" . $keys[$count - 1]); |  | ||||||
| 	} |  | ||||||
| 	 |  | ||||||
| 	public function do404($text){ |  | ||||||
| 				 |  | ||||||
| 		include "lib/frontend.php"; |  | ||||||
| 		$frontend = new frontend(); |  | ||||||
| 		 |  | ||||||
| 		echo |  | ||||||
| 			$frontend->load( |  | ||||||
| 				"error.html", |  | ||||||
| 				[ |  | ||||||
| 					"title" => "Shit", |  | ||||||
| 					"text" => $text |  | ||||||
| 				] |  | ||||||
| 			); |  | ||||||
| 		 |  | ||||||
| 		die(); |  | ||||||
| 	} |  | ||||||
| 	 |  | ||||||
| 	public function validate_url($url){ |  | ||||||
| 		 |  | ||||||
| 		$url_parts = parse_url($url); |  | ||||||
| 		 |  | ||||||
| 		// check if required parts are there |  | ||||||
| 		if( |  | ||||||
| 			!isset($url_parts["scheme"]) || |  | ||||||
| 			!( |  | ||||||
| 				$url_parts["scheme"] == "http" || |  | ||||||
| 				$url_parts["scheme"] == "https" |  | ||||||
| 			) || |  | ||||||
| 			!isset($url_parts["host"]) |  | ||||||
| 		){ |  | ||||||
| 			return false; |  | ||||||
| 		} |  | ||||||
| 		 |  | ||||||
| 		if( |  | ||||||
| 			// if its not an RFC-valid URL |  | ||||||
| 			!filter_var($url, FILTER_VALIDATE_URL) |  | ||||||
| 		){ |  | ||||||
| 			return false; |  | ||||||
| 		} |  | ||||||
| 		 |  | ||||||
| 		$ip =  |  | ||||||
| 			str_replace( |  | ||||||
| 				["[", "]"], // handle ipv6 |  | ||||||
| 				"", |  | ||||||
| 				$url_parts["host"] |  | ||||||
| 			); |  | ||||||
| 		 |  | ||||||
| 		// if its not an IP |  | ||||||
| 		if(!filter_var($ip, FILTER_VALIDATE_IP)){ |  | ||||||
| 			 |  | ||||||
| 			// resolve domain's IP |  | ||||||
| 			$ip = gethostbyname($url_parts["host"] . "."); |  | ||||||
| 		} |  | ||||||
| 		 |  | ||||||
| 		// check if its localhost |  | ||||||
| 		return filter_var( |  | ||||||
| 			$ip, |  | ||||||
| 			FILTER_VALIDATE_IP, FILTER_FLAG_NO_PRIV_RANGE | FILTER_FLAG_NO_RES_RANGE |  | ||||||
| 		); |  | ||||||
| 	} |  | ||||||
| } |  | ||||||
| @@ -403,27 +403,28 @@ class frontend{ | |||||||
| 		$text = | 		$text = | ||||||
| 			trim( | 			trim( | ||||||
| 				preg_replace( | 				preg_replace( | ||||||
| 					'/<\/span>$/', | 					'/<code [^>]+>/', | ||||||
| 					"", // remove stray ending span because of the <?php stuff | 					"", | ||||||
| 					str_replace( | 					str_replace( | ||||||
| 						[ | 						[ | ||||||
| 							'<br />', | 							"<br />", | ||||||
| 							' ' | 							" ", | ||||||
| 						], | 							"<pre>", | ||||||
| 						[ | 							"</pre>", | ||||||
| 							"\n", // replace <br> with newlines |  | ||||||
| 							" " // replace html entity to space |  | ||||||
| 						], |  | ||||||
| 						str_replace( |  | ||||||
| 							[ |  | ||||||
| 								// leading <?php garbage |  | ||||||
| 								"<span style=\"color: c-default\">\n<?php ", |  | ||||||
| 								"<code>", |  | ||||||
| 							"</code>" | 							"</code>" | ||||||
| 						], | 						], | ||||||
|  | 						[ | ||||||
|  | 							"\n", | ||||||
|  | 							" ", | ||||||
| 							"", | 							"", | ||||||
| 							highlight_string("<?php " . $text, true) | 							"", | ||||||
| 						) | 							"" | ||||||
|  | 						], | ||||||
|  | 						explode( | ||||||
|  | 							"<?php", | ||||||
|  | 							highlight_string("<?php " . $text, true), | ||||||
|  | 							2 | ||||||
|  | 						)[1] | ||||||
| 					) | 					) | ||||||
| 				) | 				) | ||||||
| 			); | 			); | ||||||
| @@ -838,10 +839,10 @@ class frontend{ | |||||||
| 		} | 		} | ||||||
| 		 | 		 | ||||||
| 		$payload .= | 		$payload .= | ||||||
| 				'<a href="https://webcache.googleusercontent.com/search?q=cache:' . $urlencode . '" class="list" target="_BLANK"><img src="/favicon?s=https://google.com" alt="go">Google cache</a>' . |  | ||||||
| 				'<a href="https://web.archive.org/web/' . $urlencode . '" class="list" target="_BLANK"><img src="/favicon?s=https://archive.org" alt="ar">Archive.org</a>' . | 				'<a href="https://web.archive.org/web/' . $urlencode . '" class="list" target="_BLANK"><img src="/favicon?s=https://archive.org" alt="ar">Archive.org</a>' . | ||||||
| 				'<a href="https://archive.ph/newest/' . htmlspecialchars($link) . '" class="list" target="_BLANK"><img src="/favicon?s=https://archive.is" alt="ar">Archive.is</a>' . | 				'<a href="https://archive.ph/newest/' . htmlspecialchars($link) . '" class="list" target="_BLANK"><img src="/favicon?s=https://archive.is" alt="ar">Archive.is</a>' . | ||||||
| 				'<a href="https://ghostarchive.org/search?term=' . $urlencode . '" class="list" target="_BLANK"><img src="/favicon?s=https://ghostarchive.org" alt="gh">Ghostarchive</a>' . | 				'<a href="https://ghostarchive.org/search?term=' . $urlencode . '" class="list" target="_BLANK"><img src="/favicon?s=https://ghostarchive.org" alt="gh">Ghostarchive</a>' . | ||||||
|  | 				'<a href="https://arquivo.pt/wayback/' . htmlspecialchars($link) . '" class="list" target="_BLANK"><img src="/favicon?s=https://arquivo.pt" alt="ar">Arquivo.pt</a>' . | ||||||
| 				'<a href="https://www.bing.com/search?q=url%3A' . $urlencode . '" class="list" target="_BLANK"><img src="/favicon?s=https://bing.com" alt="bi">Bing cache</a>' . | 				'<a href="https://www.bing.com/search?q=url%3A' . $urlencode . '" class="list" target="_BLANK"><img src="/favicon?s=https://bing.com" alt="bi">Bing cache</a>' . | ||||||
| 				'<a href="https://megalodon.jp/?url=' . $urlencode . '" class="list" target="_BLANK"><img src="/favicon?s=https://megalodon.jp" alt="me">Megalodon</a>' . | 				'<a href="https://megalodon.jp/?url=' . $urlencode . '" class="list" target="_BLANK"><img src="/favicon?s=https://megalodon.jp" alt="me">Megalodon</a>' . | ||||||
| 			'</div>'; | 			'</div>'; | ||||||
| @@ -936,10 +937,14 @@ class frontend{ | |||||||
| 					"display" => "Scraper", | 					"display" => "Scraper", | ||||||
| 					"option" => [ | 					"option" => [ | ||||||
| 						"ddg" => "DuckDuckGo", | 						"ddg" => "DuckDuckGo", | ||||||
|  | 						//"yahoo" => "Yahoo!", | ||||||
| 						"brave" => "Brave", | 						"brave" => "Brave", | ||||||
|  | 						"mullvad_brave" => "Mullvad (Brave)", | ||||||
| 						"yandex" => "Yandex", | 						"yandex" => "Yandex", | ||||||
| 						"google" => "Google", | 						"google" => "Google", | ||||||
|  | 						"google_api" => "Google API", | ||||||
| 						"google_cse" => "Google CSE", | 						"google_cse" => "Google CSE", | ||||||
|  | 						"mullvad_google" => "Mullvad (Google)", | ||||||
| 						"startpage" => "Startpage", | 						"startpage" => "Startpage", | ||||||
| 						"qwant" => "Qwant", | 						"qwant" => "Qwant", | ||||||
| 						"ghostery" => "Ghostery", | 						"ghostery" => "Ghostery", | ||||||
| @@ -948,6 +953,8 @@ class frontend{ | |||||||
| 						"crowdview" => "Crowdview", | 						"crowdview" => "Crowdview", | ||||||
| 						"mwmbl" => "Mwmbl", | 						"mwmbl" => "Mwmbl", | ||||||
| 						"mojeek" => "Mojeek", | 						"mojeek" => "Mojeek", | ||||||
|  | 						"baidu" => "Baidu", | ||||||
|  | 						"coccoc" => "Cốc Cốc", | ||||||
| 						"solofield" => "Solofield", | 						"solofield" => "Solofield", | ||||||
| 						"marginalia" => "Marginalia", | 						"marginalia" => "Marginalia", | ||||||
| 						"wiby" => "wiby", | 						"wiby" => "wiby", | ||||||
| @@ -968,10 +975,16 @@ class frontend{ | |||||||
| 						"startpage" => "Startpage", | 						"startpage" => "Startpage", | ||||||
| 						"qwant" => "Qwant", | 						"qwant" => "Qwant", | ||||||
| 						"yep" => "Yep", | 						"yep" => "Yep", | ||||||
|  | 						"baidu" => "Baidu", | ||||||
| 						"solofield" => "Solofield", | 						"solofield" => "Solofield", | ||||||
| 						//"pinterest" => "Pinterest", | 						"pinterest" => "Pinterest", | ||||||
|  | 						"cara" => "Cara", | ||||||
|  | 						"flickr" => "Flickr", | ||||||
|  | 						"fivehpx" => "500px", | ||||||
|  | 						"vsco" => "VSCO", | ||||||
| 						"imgur" => "Imgur", | 						"imgur" => "Imgur", | ||||||
| 						"ftm" => "FindThatMeme" | 						"ftm" => "FindThatMeme", | ||||||
|  | 						//"sankakucomplex" => "SankakuComplex" | ||||||
| 					] | 					] | ||||||
| 				]; | 				]; | ||||||
| 				break; | 				break; | ||||||
| @@ -981,6 +994,10 @@ class frontend{ | |||||||
| 					"display" => "Scraper", | 					"display" => "Scraper", | ||||||
| 					"option" => [ | 					"option" => [ | ||||||
| 						"yt" => "YouTube", | 						"yt" => "YouTube", | ||||||
|  | 						//"archiveorg" => "Archive.org", | ||||||
|  | 						"vimeo" => "Vimeo", | ||||||
|  | 						//"odysee" => "Odysee", | ||||||
|  | 						"sepiasearch" => "Sepia Search", | ||||||
| 						//"fb" => "Facebook videos", | 						//"fb" => "Facebook videos", | ||||||
| 						"ddg" => "DuckDuckGo", | 						"ddg" => "DuckDuckGo", | ||||||
| 						"brave" => "Brave", | 						"brave" => "Brave", | ||||||
| @@ -988,6 +1005,8 @@ class frontend{ | |||||||
| 						"google" => "Google", | 						"google" => "Google", | ||||||
| 						"startpage" => "Startpage", | 						"startpage" => "Startpage", | ||||||
| 						"qwant" => "Qwant", | 						"qwant" => "Qwant", | ||||||
|  | 						"baidu" => "Baidu", | ||||||
|  | 						"coccoc" => "Cốc Cốc", | ||||||
| 						"solofield" => "Solofield" | 						"solofield" => "Solofield" | ||||||
| 					] | 					] | ||||||
| 				]; | 				]; | ||||||
| @@ -1003,7 +1022,8 @@ class frontend{ | |||||||
| 						"startpage" => "Startpage", | 						"startpage" => "Startpage", | ||||||
| 						"qwant" => "Qwant", | 						"qwant" => "Qwant", | ||||||
| 						"yep" => "Yep", | 						"yep" => "Yep", | ||||||
| 						"mojeek" => "Mojeek" | 						"mojeek" => "Mojeek", | ||||||
|  | 						"baidu" => "Baidu" | ||||||
| 					] | 					] | ||||||
| 				]; | 				]; | ||||||
| 				break; | 				break; | ||||||
| @@ -1328,6 +1348,7 @@ class frontend{ | |||||||
| 			return htmlspecialchars($image); | 			return htmlspecialchars($image); | ||||||
| 		} | 		} | ||||||
| 		 | 		 | ||||||
|  | 		//return "https://4get.ca/proxy?i=" . urlencode($image) . "&s=" . $format; | ||||||
| 		return "/proxy?i=" . urlencode($image) . "&s=" . $format; | 		return "/proxy?i=" . urlencode($image) . "&s=" . $format; | ||||||
| 	} | 	} | ||||||
| 	 | 	 | ||||||
|   | |||||||
							
								
								
									
										110
									
								
								lib/fuckhtml.php
									
									
									
									
									
								
							
							
						
						
									
										110
									
								
								lib/fuckhtml.php
									
									
									
									
									
								
							| @@ -240,12 +240,13 @@ class fuckhtml{ | |||||||
| 	public function getElementsByFuzzyAttributeValue(string $name, string $value, $collection = null){ | 	public function getElementsByFuzzyAttributeValue(string $name, string $value, $collection = null){ | ||||||
| 		 | 		 | ||||||
| 		$elems = $this->getElementsByAttributeName($name, $collection); | 		$elems = $this->getElementsByAttributeName($name, $collection); | ||||||
|  | 		 | ||||||
| 		$value = | 		$value = | ||||||
| 			explode( | 			explode( | ||||||
| 				" ", | 				" ", | ||||||
| 				trim( | 				trim( | ||||||
| 					preg_replace( | 					preg_replace( | ||||||
| 						'/ +/', | 						'/\s+/', | ||||||
| 						" ", | 						" ", | ||||||
| 						$value | 						$value | ||||||
| 					) | 					) | ||||||
| @@ -258,7 +259,18 @@ class fuckhtml{ | |||||||
| 			 | 			 | ||||||
| 			foreach($elem["attributes"] as $attrib_name => $attrib_value){ | 			foreach($elem["attributes"] as $attrib_name => $attrib_value){ | ||||||
| 				 | 				 | ||||||
| 				$attrib_value = explode(" ", $attrib_value); | 				$attrib_value = | ||||||
|  | 					explode( | ||||||
|  | 						" ", | ||||||
|  | 						trim( | ||||||
|  | 							preg_replace( | ||||||
|  | 								'/\s+/', | ||||||
|  | 								" ", | ||||||
|  | 								$attrib_value | ||||||
|  | 							) | ||||||
|  | 						) | ||||||
|  | 					); | ||||||
|  | 				 | ||||||
| 				$ac = count($attrib_value); | 				$ac = count($attrib_value); | ||||||
| 				$nc = count($value); | 				$nc = count($value); | ||||||
| 				$cr = 0; | 				$cr = 0; | ||||||
| @@ -526,4 +538,98 @@ class fuckhtml{ | |||||||
| 				$string | 				$string | ||||||
| 			); | 			); | ||||||
| 	} | 	} | ||||||
|  | 	 | ||||||
|  | 	public function extract_json($json){ | ||||||
|  | 		 | ||||||
|  | 		$len = strlen($json); | ||||||
|  | 		$array_level = 0; | ||||||
|  | 		$object_level = 0; | ||||||
|  | 		$in_quote = null; | ||||||
|  | 		$start = null; | ||||||
|  | 		 | ||||||
|  | 		for($i=0; $i<$len; $i++){ | ||||||
|  | 			 | ||||||
|  | 			switch($json[$i]){ | ||||||
|  | 				 | ||||||
|  | 				case "\"": | ||||||
|  | 				case "'": | ||||||
|  | 					if( | ||||||
|  | 						$i !== 0 && // only check if a quote could be there | ||||||
|  | 						( | ||||||
|  | 							( | ||||||
|  | 								$json[$i - 1] === "\\" && | ||||||
|  | 								( | ||||||
|  | 									$i === 2 || | ||||||
|  | 									$json[$i - 2] === "\\" | ||||||
|  | 								) | ||||||
|  | 							) || | ||||||
|  | 							$json[$i - 1] !== "\\" | ||||||
|  | 						) | ||||||
|  | 					){ | ||||||
|  | 						// found a non-escaped quote | ||||||
|  | 						 | ||||||
|  | 						if($in_quote === null){ | ||||||
|  | 							 | ||||||
|  | 							// open quote | ||||||
|  | 							$in_quote = $json[$i]; | ||||||
|  | 							 | ||||||
|  | 						}elseif($in_quote === $json[$i]){ | ||||||
|  | 							 | ||||||
|  | 							// close quote | ||||||
|  | 							$in_quote = null; | ||||||
|  | 						} | ||||||
|  | 					} | ||||||
|  | 					break; | ||||||
|  | 				 | ||||||
|  | 				case "[": | ||||||
|  | 					if($in_quote === null){ | ||||||
|  | 						 | ||||||
|  | 						$array_level++; | ||||||
|  | 						if($start === null){ | ||||||
|  | 							 | ||||||
|  | 							$start = $i; | ||||||
|  | 						} | ||||||
|  | 					} | ||||||
|  | 					break; | ||||||
|  | 				 | ||||||
|  | 				case "]": | ||||||
|  | 					if($in_quote === null){ | ||||||
|  | 						 | ||||||
|  | 						$array_level--; | ||||||
|  | 					} | ||||||
|  | 					break; | ||||||
|  | 				 | ||||||
|  | 				case "{": | ||||||
|  | 					if($in_quote === null){ | ||||||
|  | 						 | ||||||
|  | 						$object_level++; | ||||||
|  | 						if($start === null){ | ||||||
|  | 							 | ||||||
|  | 							$start = $i; | ||||||
|  | 						} | ||||||
|  | 					} | ||||||
|  | 					break; | ||||||
|  | 				 | ||||||
|  | 				case "}": | ||||||
|  | 					if($in_quote === null){ | ||||||
|  | 						 | ||||||
|  | 						$object_level--; | ||||||
|  | 					} | ||||||
|  | 					break; | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			if( | ||||||
|  | 				$array_level === 0 && | ||||||
|  | 				$object_level === 0 && | ||||||
|  | 				$start !== null | ||||||
|  | 			){ | ||||||
|  | 				 | ||||||
|  | 				return substr($json, $start, $i - $start + 1); | ||||||
|  | 				break; | ||||||
|  | 			} | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		// fallback | ||||||
|  | 		return "[]"; | ||||||
|  | 	} | ||||||
| } | } | ||||||
|   | |||||||
							
								
								
									
										42
									
								
								proxy.php
									
									
									
									
									
								
							
							
						
						
									
										42
									
								
								proxy.php
									
									
									
									
									
								
							| @@ -34,22 +34,46 @@ try{ | |||||||
| 		) | 		) | ||||||
| 	){ | 	){ | ||||||
| 		 | 		 | ||||||
| 		if( | 		if(!isset($image["path"])){ | ||||||
| 			!isset($image["query"]) || |  | ||||||
| 			!isset($image["path"]) || |  | ||||||
| 			$image["path"] != "/th" |  | ||||||
| 		){ |  | ||||||
| 			 | 			 | ||||||
| 			header("X-Error: Invalid bing image path"); | 			header("X-Error: Missing bing image path"); | ||||||
| 			$proxy->do404(); | 			$proxy->do404(); | ||||||
| 			die(); | 			die(); | ||||||
| 		} | 		} | ||||||
| 		 | 		 | ||||||
|  | 		// | ||||||
|  | 		// get image ID | ||||||
|  | 		// formations: | ||||||
|  | 		// https://tse2.mm.bing.net/th/id/OIP.3yLBkUPn8EXA1wlhWP2BHwHaE3 | ||||||
|  | 		// https://tse2.mm.bing.net/th?id=OIP.3yLBkUPn8EXA1wlhWP2BHwHaE3 | ||||||
|  | 		// | ||||||
|  | 		$id = null; | ||||||
|  | 		if(isset($image["query"])){ | ||||||
|  | 			 | ||||||
| 			parse_str($image["query"], $str); | 			parse_str($image["query"], $str); | ||||||
| 			 | 			 | ||||||
| 		if(!isset($str["id"])){ | 			if(isset($str["id"])){ | ||||||
| 				 | 				 | ||||||
| 			header("X-Error: Missing bing ID"); | 				$id = $str["id"]; | ||||||
|  | 			} | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		if($id === null){ | ||||||
|  | 			 | ||||||
|  | 			$id = explode("/th/id/", $image["path"], 2); | ||||||
|  | 			 | ||||||
|  | 			if(count($id) !== 2){ | ||||||
|  | 				 | ||||||
|  | 				// malformed | ||||||
|  | 				return $url; | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			$id = $id[1]; | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		if(is_array($id)){ | ||||||
|  | 			 | ||||||
|  | 			header("X-Error: Missing bing id parameter"); | ||||||
| 			$proxy->do404(); | 			$proxy->do404(); | ||||||
| 			die(); | 			die(); | ||||||
| 		} | 		} | ||||||
| @@ -63,7 +87,7 @@ try{ | |||||||
| 			case "cover": $req = "&w=207&h=270&p=0&qlt=90"; break; | 			case "cover": $req = "&w=207&h=270&p=0&qlt=90"; break; | ||||||
| 		} | 		} | ||||||
| 		 | 		 | ||||||
| 		$proxy->stream_linear_image("https://" . $image["host"] . "/th?id=" . urlencode($str["id"]) . $req, "https://www.bing.com"); | 		$proxy->stream_linear_image("https://" . $image["host"] . "/th?id=" . rawurlencode($id) . $req, "https://www.bing.com"); | ||||||
| 		die(); | 		die(); | ||||||
| 	} | 	} | ||||||
| 	 | 	 | ||||||
|   | |||||||
							
								
								
									
										2229
									
								
								scraper/baidu.php
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										2229
									
								
								scraper/baidu.php
									
									
									
									
									
										Normal file
									
								
							
										
											
												File diff suppressed because it is too large
												Load Diff
											
										
									
								
							| @@ -210,6 +210,63 @@ class brave{ | |||||||
| 		return $data; | 		return $data; | ||||||
| 	} | 	} | ||||||
| 	 | 	 | ||||||
|  | 	private function get_js(){ | ||||||
|  | 		 | ||||||
|  | 		$script_disc = | ||||||
|  | 			$this->fuckhtml | ||||||
|  | 			->getElementsByTagName( | ||||||
|  | 				"script" | ||||||
|  | 			); | ||||||
|  | 		 | ||||||
|  | 		$data = null; | ||||||
|  | 		foreach($script_disc as &$discs){ | ||||||
|  | 			 | ||||||
|  | 			if( | ||||||
|  | 				preg_match( | ||||||
|  | 					'/kit\.start\(/', | ||||||
|  | 					$discs["innerHTML"] | ||||||
|  | 				) | ||||||
|  | 			){ | ||||||
|  | 				 | ||||||
|  | 				$data = | ||||||
|  | 					explode( | ||||||
|  | 						"data:", | ||||||
|  | 						$discs["innerHTML"], | ||||||
|  | 						2 | ||||||
|  | 					); | ||||||
|  | 				 | ||||||
|  | 				if(count($data) !== 2){ | ||||||
|  | 					 | ||||||
|  | 					throw new Exception("Failed to split up data field"); | ||||||
|  | 				} | ||||||
|  | 				 | ||||||
|  | 				$data = $data[1]; | ||||||
|  | 				break; | ||||||
|  | 			} | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		if($data === null){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("Could not grep JavaScript object"); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		$data = | ||||||
|  | 			$this->fuckhtml | ||||||
|  | 			->parseJsObject( | ||||||
|  | 				$this->fuckhtml | ||||||
|  | 				->extract_json( | ||||||
|  | 					$data | ||||||
|  | 				) | ||||||
|  | 			); | ||||||
|  | 		 | ||||||
|  | 		if($data === null){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("Failed to decode JavaScript object"); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		return $data; | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
| 	public function web($get){ | 	public function web($get){ | ||||||
| 		 | 		 | ||||||
| 		if($get["npt"]){ | 		if($get["npt"]){ | ||||||
| @@ -295,7 +352,6 @@ class brave{ | |||||||
| 		$html = fread($handle, filesize("scraper/brave.html")); | 		$html = fread($handle, filesize("scraper/brave.html")); | ||||||
| 		fclose($handle);*/ | 		fclose($handle);*/ | ||||||
| 		 | 		 | ||||||
| 		 |  | ||||||
| 		try{ | 		try{ | ||||||
| 			$html = | 			$html = | ||||||
| 				$this->get( | 				$this->get( | ||||||
| @@ -346,7 +402,7 @@ class brave{ | |||||||
| 			 | 			 | ||||||
| 			$nextpage = | 			$nextpage = | ||||||
| 				$this->fuckhtml | 				$this->fuckhtml | ||||||
| 				->getElementsByClassName("btn", "a"); | 				->getElementsByClassName("button", "a"); | ||||||
| 			 | 			 | ||||||
| 			if(count($nextpage) !== 0){ | 			if(count($nextpage) !== 0){ | ||||||
| 				 | 				 | ||||||
| @@ -382,55 +438,9 @@ class brave{ | |||||||
| 			} | 			} | ||||||
| 		} | 		} | ||||||
| 		 | 		 | ||||||
|  | 		// do some magic | ||||||
| 		$this->fuckhtml->load($html); | 		$this->fuckhtml->load($html); | ||||||
| 		 | 		$data = $this->get_js(); | ||||||
| 		$script_disc = |  | ||||||
| 			$this->fuckhtml |  | ||||||
| 			->getElementsByTagName( |  | ||||||
| 				"script" |  | ||||||
| 			); |  | ||||||
| 		 |  | ||||||
| 		$grep = []; |  | ||||||
| 		foreach($script_disc as $discs){ |  | ||||||
| 			 |  | ||||||
| 			preg_match( |  | ||||||
| 				'/const data ?= ?(\[{.*}]);/', |  | ||||||
| 				$discs["innerHTML"], |  | ||||||
| 				$grep |  | ||||||
| 			); |  | ||||||
| 			 |  | ||||||
| 			if(isset($grep[1])){ |  | ||||||
| 				 |  | ||||||
| 				break; |  | ||||||
| 			} |  | ||||||
| 		} |  | ||||||
| 		 |  | ||||||
| 		if(!isset($grep[1])){ |  | ||||||
| 			 |  | ||||||
| 			throw new Exception("Could not grep JavaScript object"); |  | ||||||
| 		} |  | ||||||
| 		 |  | ||||||
| 		$data = |  | ||||||
| 			rtrim( |  | ||||||
| 				preg_replace( |  | ||||||
| 					'/\(Array\(0\)\)\).*$/', |  | ||||||
| 					"", |  | ||||||
| 					$grep[1] |  | ||||||
| 				), |  | ||||||
| 				" ]" |  | ||||||
| 			) . "]"; |  | ||||||
| 		 |  | ||||||
| 		$data = |  | ||||||
| 			$this->fuckhtml |  | ||||||
| 			->parseJsObject( |  | ||||||
| 				$data |  | ||||||
| 			); |  | ||||||
| 		unset($grep); |  | ||||||
| 		 |  | ||||||
| 		if($data === null){ |  | ||||||
| 			 |  | ||||||
| 			throw new Exception("Failed to decode JavaScript object"); |  | ||||||
| 		} |  | ||||||
| 		 | 		 | ||||||
| 		if( | 		if( | ||||||
| 			isset($data[2]["data"]["title"]) && | 			isset($data[2]["data"]["title"]) && | ||||||
| @@ -1179,23 +1189,8 @@ class brave{ | |||||||
| 				$proxy | 				$proxy | ||||||
| 			); | 			); | ||||||
| 		 | 		 | ||||||
| 		preg_match( | 		$this->fuckhtml->load($html); | ||||||
| 			'/const data ?= ?(\[{.*}]);/', | 		$json = $this->get_js(); | ||||||
| 			$html, |  | ||||||
| 			$json |  | ||||||
| 		); |  | ||||||
| 		 |  | ||||||
| 		if(!isset($json[1])){ |  | ||||||
| 			 |  | ||||||
| 			throw new Exception("Failed to grep javascript object"); |  | ||||||
| 		} |  | ||||||
| 		 |  | ||||||
| 		$json = $this->fuckhtml->parseJsObject($json[1], true); |  | ||||||
| 		 |  | ||||||
| 		if($json === null){ |  | ||||||
| 			 |  | ||||||
| 			throw new Exception("Failed to parse javascript object"); |  | ||||||
| 		} |  | ||||||
| 		 | 		 | ||||||
| 		foreach( | 		foreach( | ||||||
| 			$json[1]["data"]["body"]["response"]["news"]["results"] | 			$json[1]["data"]["body"]["response"]["news"]["results"] | ||||||
| @@ -1277,22 +1272,8 @@ class brave{ | |||||||
| 		$html = fread($handle, filesize("scraper/brave-image.html")); | 		$html = fread($handle, filesize("scraper/brave-image.html")); | ||||||
| 		fclose($handle);*/ | 		fclose($handle);*/ | ||||||
| 		 | 		 | ||||||
| 		preg_match( | 		$this->fuckhtml->load($html); | ||||||
| 			'/const data = (\[{.*}\]);/', | 		$json = $this->get_js(); | ||||||
| 			$html, |  | ||||||
| 			$json |  | ||||||
| 		); |  | ||||||
| 		 |  | ||||||
| 		if(!isset($json[1])){ |  | ||||||
| 			 |  | ||||||
| 			throw new Exception("Failed to get data object"); |  | ||||||
| 		} |  | ||||||
| 		 |  | ||||||
| 		$json = |  | ||||||
| 			$this->fuckhtml |  | ||||||
| 			->parseJsObject( |  | ||||||
| 				$json[1] |  | ||||||
| 			); |  | ||||||
| 		 | 		 | ||||||
| 		foreach( | 		foreach( | ||||||
| 			$json[1] | 			$json[1] | ||||||
| @@ -1308,13 +1289,13 @@ class brave{ | |||||||
| 				"source" => [ | 				"source" => [ | ||||||
| 					[ | 					[ | ||||||
| 						"url" => $result["properties"]["url"], | 						"url" => $result["properties"]["url"], | ||||||
| 						"width" => null, | 						"width" => (int)$result["properties"]["width"], | ||||||
| 						"height" => null | 						"height" => (int)$result["properties"]["height"] | ||||||
| 					], | 					], | ||||||
| 					[ | 					[ | ||||||
| 						"url" => $result["thumbnail"]["src"], | 						"url" => $result["thumbnail"]["src"], | ||||||
| 						"width" => null, | 						"width" => (int)$result["thumbnail"]["width"], | ||||||
| 						"height" => null | 						"height" => (int)$result["thumbnail"]["height"] | ||||||
| 					] | 					] | ||||||
| 				], | 				], | ||||||
| 				"url" => $result["url"] | 				"url" => $result["url"] | ||||||
| @@ -1422,22 +1403,8 @@ class brave{ | |||||||
| 		$html = fread($handle, filesize("scraper/brave-video.html")); | 		$html = fread($handle, filesize("scraper/brave-video.html")); | ||||||
| 		fclose($handle);*/ | 		fclose($handle);*/ | ||||||
| 		 | 		 | ||||||
| 		preg_match( | 		$this->fuckhtml->load($html); | ||||||
| 			'/const data = (\[{.*}\]);/', | 		$json = $this->get_js(); | ||||||
| 			$html, |  | ||||||
| 			$json |  | ||||||
| 		); |  | ||||||
| 		 |  | ||||||
| 		if(!isset($json[1])){ |  | ||||||
| 			 |  | ||||||
| 			throw new Exception("Failed to get data object"); |  | ||||||
| 		} |  | ||||||
| 		 |  | ||||||
| 		$json = |  | ||||||
| 			$this->fuckhtml |  | ||||||
| 			->parseJsObject( |  | ||||||
| 				$json[1] |  | ||||||
| 			); |  | ||||||
| 		 | 		 | ||||||
| 		foreach( | 		foreach( | ||||||
| 			$json | 			$json | ||||||
| @@ -1809,7 +1776,21 @@ class brave{ | |||||||
| 		 | 		 | ||||||
| 		$nextpage = | 		$nextpage = | ||||||
| 			$this->fuckhtml | 			$this->fuckhtml | ||||||
| 			->getElementsByClassName("btn", "a"); | 			->getElementById( | ||||||
|  | 				"pagination", | ||||||
|  | 				"div" | ||||||
|  | 			); | ||||||
|  | 		 | ||||||
|  | 		if($nextpage){ | ||||||
|  | 			 | ||||||
|  | 			$this->fuckhtml->load($nextpage); | ||||||
|  | 			 | ||||||
|  | 			$nextpage = | ||||||
|  | 				$this->fuckhtml | ||||||
|  | 				->getElementsByClassName( | ||||||
|  | 					"button", | ||||||
|  | 					"a" | ||||||
|  | 				); | ||||||
| 			 | 			 | ||||||
| 			if(count($nextpage) !== 0){ | 			if(count($nextpage) !== 0){ | ||||||
| 				 | 				 | ||||||
| @@ -1847,6 +1828,7 @@ class brave{ | |||||||
| 						); | 						); | ||||||
| 				} | 				} | ||||||
| 			} | 			} | ||||||
|  | 		} | ||||||
| 		 | 		 | ||||||
| 		return null; | 		return null; | ||||||
| 	} | 	} | ||||||
|   | |||||||
							
								
								
									
										847
									
								
								scraper/cara.php
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										847
									
								
								scraper/cara.php
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,847 @@ | |||||||
|  | <?php | ||||||
|  |  | ||||||
|  | class cara{ | ||||||
|  | 	 | ||||||
|  | 	public function __construct(){ | ||||||
|  | 		 | ||||||
|  | 		include "lib/backend.php"; | ||||||
|  | 		$this->backend = new backend("cara"); | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	public function getfilters($page){ | ||||||
|  | 		 | ||||||
|  | 		return [ | ||||||
|  | 			"sort" => [ | ||||||
|  | 				"display" => "Sort by", | ||||||
|  | 				"option" => [ | ||||||
|  | 					"Top" => "Top", | ||||||
|  | 					"MostRecent" => "Most Recent" | ||||||
|  | 				] | ||||||
|  | 			], | ||||||
|  | 			"type" => [ | ||||||
|  | 				"display" => "Post type", | ||||||
|  | 				"option" => [ | ||||||
|  | 					"any" => "Any type", | ||||||
|  | 					"portfolio" => "Portfolio", // {"posts":["portfolio"]} | ||||||
|  | 					"timeline" => "Timeline" // {"posts":["timeline"]} | ||||||
|  | 				] | ||||||
|  | 			], | ||||||
|  | 			"fields" => [ | ||||||
|  | 				"display" => "Field/Medium", | ||||||
|  | 				"option" => [ | ||||||
|  | 					"any" => "Any field", | ||||||
|  | 					"2D" => "2D Work", | ||||||
|  | 					"3D" => "3D Work", | ||||||
|  | 					"3DPrinting" => "3D Printing", | ||||||
|  | 					"Acrylic" => "Acrylic", | ||||||
|  | 					"AlcoholMarkers" => "Alcohol Markers", | ||||||
|  | 					"Animation" => "Animation", | ||||||
|  | 					"Chalk" => "Chalk", | ||||||
|  | 					"Charcoal" => "Charcoal", | ||||||
|  | 					"Colored pencil" => "Colored pencil", | ||||||
|  | 					"Conte" => "Conte", | ||||||
|  | 					"Crayon" => "Crayon", | ||||||
|  | 					"Digital" => "Digital", | ||||||
|  | 					"Gouache" => "Gouache", | ||||||
|  | 					"Ink" => "Ink", | ||||||
|  | 					"MixedMedia" => "Mixed-Media", | ||||||
|  | 					"Oil" => "Oil", | ||||||
|  | 					"Oil-based Markers" => "Oil-based Markers", | ||||||
|  | 					"Other" => "Other", | ||||||
|  | 					"Pastels" => "Pastels", | ||||||
|  | 					"Photography" => "Photography", | ||||||
|  | 					"Sculpture" => "Sculpture", | ||||||
|  | 					"Sketches" => "Sketches", | ||||||
|  | 					"Tattoos" => "Tattoos", | ||||||
|  | 					"Traditional" => "Traditional", | ||||||
|  | 					"VFX" => "VFX", | ||||||
|  | 					"Watercolor" => "Watercolor" | ||||||
|  | 				] | ||||||
|  | 			], | ||||||
|  | 			"category" => [ | ||||||
|  | 				"display" => "Category", | ||||||
|  | 				"option" => [ | ||||||
|  | 					"any" => "Any category", | ||||||
|  | 					"3DScanning" => "3D Scanning", | ||||||
|  | 					"Abstract" => "Abstract", | ||||||
|  | 					"Adoptable" => "Adoptable", | ||||||
|  | 					"Anatomy" => "Anatomy", | ||||||
|  | 					"Animals" => "Animals", | ||||||
|  | 					"Anime" => "Anime", | ||||||
|  | 					"App" => "App", | ||||||
|  | 					"ArchitecturalConcepts" => "Architectural Concepts", | ||||||
|  | 					"ArchitecturalVisualization" => "Architectural Visualization", | ||||||
|  | 					"AugmentedReality" => "Augmented Reality", | ||||||
|  | 					"Automotive" => "Automotive", | ||||||
|  | 					"BoardGameArt" => "Board Game Art", | ||||||
|  | 					"BookIllustration" => "Book Illustration", | ||||||
|  | 					"CardGameArt" => "Card Game Art", | ||||||
|  | 					"CeramicsPottery" => "Ceramics/Pottery", | ||||||
|  | 					"CharacterAnimation" => "Character Animation", | ||||||
|  | 					"CharacterDesign" => "Character Design", | ||||||
|  | 					"CharacterModeling" => "Character Modeling", | ||||||
|  | 					"ChildrensArt" => "Children's Illustration", | ||||||
|  | 					"Collectibles" => "Collectibles", | ||||||
|  | 					"ColoringPage" => "Coloring Page", | ||||||
|  | 					"ComicArt" => "Comic Art", | ||||||
|  | 					"ConceptArt" => "Concept Art", | ||||||
|  | 					"Cosplay" => "Cosplay", | ||||||
|  | 					"CostumeDesign" => "Costume Design", | ||||||
|  | 					"CoverArt" => "Cover Art", | ||||||
|  | 					"Creatures" => "Creatures", | ||||||
|  | 					"Diorama" => "Diorama", | ||||||
|  | 					"EditorialIllustration" => "Editorial Illustration", | ||||||
|  | 					"EmbroiderySewing" => "Embroidery/Sewing", | ||||||
|  | 					"EnvironmentalConceptArt" => "Environmental Concept Art", | ||||||
|  | 					"EnvironmentalConceptDesign" => "Environmental Concept Design", | ||||||
|  | 					"FanArt" => "Fan Art", | ||||||
|  | 					"Fantasy" => "Fantasy", | ||||||
|  | 					"Fashion" => "Fashion", | ||||||
|  | 					"FashionStyling" => "Fashion Styling", | ||||||
|  | 					"FiberArts" => "Fiber Arts", | ||||||
|  | 					"Furry" => "Furry", | ||||||
|  | 					"GameArt" => "Game Art", | ||||||
|  | 					"GameplayDesign" => "Gameplay Design", | ||||||
|  | 					"GamesEnvironmentArt" => "Games Environment Art", | ||||||
|  | 					"Gem" => "Gem", | ||||||
|  | 					"GraphicDesign" => "Graphic Design", | ||||||
|  | 					"Handicraft" => "Handicraft", | ||||||
|  | 					"HairStyling" => "Hair Styling", | ||||||
|  | 					"HardSurface" => "Hard Surface", | ||||||
|  | 					"Horror" => "Horror", | ||||||
|  | 					"Illustration" => "Illustration", | ||||||
|  | 					"IllustrationVisualization" => "Illustration Visualization", | ||||||
|  | 					"IndustrialDesign" => "Industrial Design", | ||||||
|  | 					"Jewelry" => "Jewelry", | ||||||
|  | 					"KnittingCrochet" => "Knitting/Crochet", | ||||||
|  | 					"Landscape" => "Landscape", | ||||||
|  | 					"LevelDesign" => "Level Design", | ||||||
|  | 					"Lighting" => "Lighting", | ||||||
|  | 					"Makeup" => "Makeup", | ||||||
|  | 					"Manga" => "Manga", | ||||||
|  | 					"MapsCartography" => "Maps/Cartography", | ||||||
|  | 					"MattePainting" => "Matte Painting", | ||||||
|  | 					"Materials" => "Materials", | ||||||
|  | 					"MechanicalDesign" => "Mechanical Design", | ||||||
|  | 					"Medical" => "Medical", | ||||||
|  | 					"Mecha" => "Mecha", | ||||||
|  | 					"MiniatureArt" => "Miniature Art", | ||||||
|  | 					"MotionGraphics" => "Motion Graphics", | ||||||
|  | 					"FrescoMurals" => "Fresco/Murals", | ||||||
|  | 					"Natural" => "Natural", | ||||||
|  | 					"Original Character" => "Original Character", | ||||||
|  | 					"Overlay" => "Overlay", | ||||||
|  | 					"PleinAir" => "Plein Air", | ||||||
|  | 					"Photogrammetry" => "Photogrammetry", | ||||||
|  | 					"PixelArt" => "Pixel Art", | ||||||
|  | 					"Portraits" => "Portraits", | ||||||
|  | 					"Props" => "Props", | ||||||
|  | 					"ProductDesign" => "Product Design", | ||||||
|  | 					"PublicDomain" => "Public Domain or Royalty Free", | ||||||
|  | 					"Real-Time3DEnvironmentArt" => "Real-Time 3D Environment Art", | ||||||
|  | 					"Realism" => "Realism", | ||||||
|  | 					"ScienceFiction" => "Science Fiction", | ||||||
|  | 					"ScientificVisualization" => "Scientific Visualization", | ||||||
|  | 					"Scripts" => "Scripts", | ||||||
|  | 					"StillLife" => "Still Life", | ||||||
|  | 					"Storyboards" => "Storyboards", | ||||||
|  | 					"Stylized" => "Stylized", | ||||||
|  | 					"Surreal" => "Surreal", | ||||||
|  | 					"TechnicalArt" => "Technical Art", | ||||||
|  | 					"Textures" => "Textures", | ||||||
|  | 					"Tools" => "Tools", | ||||||
|  | 					"Toys" => "Toys", | ||||||
|  | 					"ToyPackaging" => "Toy Packaging", | ||||||
|  | 					"Tutorials" => "Tutorials", | ||||||
|  | 					"UIArt" => "User Interface (UI) Art", | ||||||
|  | 					"UrbanSketch" => "Urban Sketch", | ||||||
|  | 					"VFXforAnimation" => "VFX for Animation", | ||||||
|  | 					"VFXforFilm" => "VFX for Film", | ||||||
|  | 					"VFXforGames" => "VFX for Games", | ||||||
|  | 					"VFXforRealTime" => "VFX for Real-Time", | ||||||
|  | 					"VFXforTV" => "VFX for TV", | ||||||
|  | 					"Vehicles" => "Vehicles", | ||||||
|  | 					"VirtualReality" => "Virtual Reality", | ||||||
|  | 					"VisualDevelopment" => "Visual Development", | ||||||
|  | 					"VoxelArt" => "Voxel Art", | ||||||
|  | 					"Vtubers" => "Vtubers", | ||||||
|  | 					"WIP" => "WIP (Work in Progress)", | ||||||
|  | 					"Web" => "Web", | ||||||
|  | 					"Weapons" => "Weapons", | ||||||
|  | 					"Wildlife" => "Wildlife", | ||||||
|  | 					"Woodcutting" => "Woodcutting" | ||||||
|  | 				] | ||||||
|  | 			], | ||||||
|  | 			"software" => [ | ||||||
|  | 				"display" => "Software", | ||||||
|  | 				"option" => [ | ||||||
|  | 					"any" => "Any software", | ||||||
|  | 					"123D" => "123D", | ||||||
|  | 					"123DCatch" => "123D Catch", | ||||||
|  | 					"3DBee" => "3DBee", | ||||||
|  | 					"3DCoat" => "3DCoat", | ||||||
|  | 					"3DCoatPrint" => "3DCoatPrint", | ||||||
|  | 					"3DCoatTextura" => "3DCoatTextura", | ||||||
|  | 					"3DEqualizer" => "3DEqualizer", | ||||||
|  | 					"3DFZephyr" => "3DF Zephyr", | ||||||
|  | 					"3Delight" => "3Delight", | ||||||
|  | 					"3dpeople" => "3dpeople", | ||||||
|  | 					"3dsMax" => "3ds Max", | ||||||
|  | 					"3DSPaint" => "3DS Paint", | ||||||
|  | 					"ACDSeeCanvas" => "ACDSee Canvas", | ||||||
|  | 					"AbletonLive" => "Ableton Live", | ||||||
|  | 					"Acrobat" => "Acrobat", | ||||||
|  | 					"AdobeDraw" => "Adobe Draw", | ||||||
|  | 					"AdobeFlash" => "Adobe Flash", | ||||||
|  | 					"AdobeFresco" => "Adobe Fresco", | ||||||
|  | 					"AdobeSubstance3Dassets" => "Adobe Substance 3D assets", | ||||||
|  | 					"AdobeXD" => "Adobe XD", | ||||||
|  | 					"AffinityDesigner" => "Affinity Designer", | ||||||
|  | 					"AffinityPhoto" => "Affinity Photo", | ||||||
|  | 					"AfterEffects" => "After Effects", | ||||||
|  | 					"Akeytsu" => "Akeytsu", | ||||||
|  | 					"Alchemy" => "Alchemy", | ||||||
|  | 					"AliasDesign" => "Alias Design", | ||||||
|  | 					"AlightMotion" => "Alight Motion", | ||||||
|  | 					"Amadine" => "Amadine", | ||||||
|  | 					"Amberlight" => "Amberlight", | ||||||
|  | 					"Animate" => "Animate", | ||||||
|  | 					"AnimationMaster" => "Animation:Master", | ||||||
|  | 					"AnimeStudio" => "Anime Studio", | ||||||
|  | 					"Apophysis" => "Apophysis", | ||||||
|  | 					"ArchiCAD" => "ArchiCAD", | ||||||
|  | 					"Arion" => "Arion", | ||||||
|  | 					"ArionFX" => "ArionFX", | ||||||
|  | 					"Arnold" => "Arnold", | ||||||
|  | 					"ArtEngine" => "ArtEngine", | ||||||
|  | 					"ArtFlow" => "ArtFlow", | ||||||
|  | 					"ArtRage" => "ArtRage", | ||||||
|  | 					"ArtstudioPro" => "Artstudio Pro", | ||||||
|  | 					"Artweaver" => "Artweaver", | ||||||
|  | 					"Aseprite" => "Aseprite", | ||||||
|  | 					"Audition" => "Audition", | ||||||
|  | 					"AutoCAD" => "AutoCAD", | ||||||
|  | 					"AutodeskSketchBook" => "Autodesk SketchBook", | ||||||
|  | 					"AvidMediaComposer" => "Avid Media Composer", | ||||||
|  | 					"AzPainter" => "AzPainter", | ||||||
|  | 					"babylonjs" => "babylon.js", | ||||||
|  | 					"BalsamiqMockup" => "Balsamiq Mockup", | ||||||
|  | 					"Bforartists" => "Bforartists", | ||||||
|  | 					"BlackInk" => "Black Ink", | ||||||
|  | 					"BlackmagicDesignFusion" => "Blackmagic Design Fusion", | ||||||
|  | 					"Blender" => "Blender", | ||||||
|  | 					"Blender DeepPaint" => "Blender DeepPaint", | ||||||
|  | 					"BlenderGreasePencil" => "Blender Grease Pencil", | ||||||
|  | 					"Blockbench" => "Blockbench", | ||||||
|  | 					"BodyPaint" => "BodyPaint", | ||||||
|  | 					"Boxcutter" => "Boxcutter", | ||||||
|  | 					"BraidMaker" => "Braid Maker", | ||||||
|  | 					"BrickLinkStudio" => "BrickLink Studio", | ||||||
|  | 					"Bridge" => "Bridge", | ||||||
|  | 					"Brushifyio" => "Brushify.io", | ||||||
|  | 					"C" => "C", | ||||||
|  | 					"C#" => "C#", | ||||||
|  | 					"C++" => "C++", | ||||||
|  | 					"CACANi" => "CACANi", | ||||||
|  | 					"CLIPSTUDIOPAINT" => "CLIP STUDIO PAINT", | ||||||
|  | 					"CLO" => "CLO", | ||||||
|  | 					"CRYENGINE" => "CRYENGINE", | ||||||
|  | 					"Callipeg" => "Callipeg", | ||||||
|  | 					"Canva" => "Canva", | ||||||
|  | 					"CaptureOne" => "Capture One", | ||||||
|  | 					"CartoonAnimator" => "Cartoon Animator", | ||||||
|  | 					"Carveco" => "Carveco", | ||||||
|  | 					"Cavalry" => "Cavalry", | ||||||
|  | 					"Chaotica" => "Chaotica", | ||||||
|  | 					"CharacterAnimator" => "Character Animator", | ||||||
|  | 					"CharacterCreator" => "Character Creator", | ||||||
|  | 					"Cinema4D" => "Cinema 4D", | ||||||
|  | 					"ClarisseiFX" => "Clarisse iFX", | ||||||
|  | 					"Coiffure" => "Coiffure", | ||||||
|  | 					"ColorsLive" => "Colors Live", | ||||||
|  | 					"Combustion" => "Combustion", | ||||||
|  | 					"Construct2" => "Construct 2", | ||||||
|  | 					"Core" => "Core", | ||||||
|  | 					"CorelPainter" => "Corel Painter", | ||||||
|  | 					"CorelDRAWGraphicsSuite" => "CorelDRAW Graphics Suite", | ||||||
|  | 					"CoronaRenderer" => "Corona Renderer", | ||||||
|  | 					"ProMotionNG" => "Cosmigo Pro Motion NG", | ||||||
|  | 					"CrazyBump" => "CrazyBump", | ||||||
|  | 					"Crocotile3D" => "Crocotile 3D", | ||||||
|  | 					"Curvy3D" => "Curvy 3D", | ||||||
|  | 					"Cycles4D" => "Cycles 4D", | ||||||
|  | 					"Darkroom" => "Darkroom", | ||||||
|  | 					"DAZStudio" => "DAZ Studio", | ||||||
|  | 					"DDO" => "DDO", | ||||||
|  | 					"DECIMA" => "DECIMA", | ||||||
|  | 					"Darktable" => "Darktable", | ||||||
|  | 					"DaVinciResolve" => "DaVinci Resolve", | ||||||
|  | 					"Dimension" => "Dimension", | ||||||
|  | 					"DragonBones" => "DragonBones", | ||||||
|  | 					"Dragonframe" => "Dragonframe", | ||||||
|  | 					"Drawpile" => "Drawpile", | ||||||
|  | 					"Dreams" => "Dreams", | ||||||
|  | 					"Dreamweaver" => "Dreamweaver", | ||||||
|  | 					"DxOPhotoLab" => "DxO PhotoLab", | ||||||
|  | 					"ECycles" => "E-Cycles", | ||||||
|  | 					"EmberGen" => "EmberGen", | ||||||
|  | 					"Encore" => "Encore", | ||||||
|  | 					"Expresii" => "Expresii", | ||||||
|  | 					"FStorm" => "FStorm", | ||||||
|  | 					"FadeIn" => "FadeIn", | ||||||
|  | 					"Feather3D" => "Feather 3D", | ||||||
|  | 					"FiberShop" => "FiberShop", | ||||||
|  | 					"Figma" => "Figma", | ||||||
|  | 					"FilmoraWondershare" => "Filmora Wondershare", | ||||||
|  | 					"FilterForge" => "Filter Forge", | ||||||
|  | 					"FinalCutPro" => "Final Cut Pro", | ||||||
|  | 					"FinalDraft" => "Final Draft", | ||||||
|  | 					"finalRender" => "finalRender", | ||||||
|  | 					"FireAlpaca" => "FireAlpaca", | ||||||
|  | 					"Fireworks" => "Fireworks", | ||||||
|  | 					"FlamePainter" => "Flame Painter", | ||||||
|  | 					"Flash" => "Flash", | ||||||
|  | 					"FlipaClip" => "FlipaClip", | ||||||
|  | 					"FlipnoteStudio" => "Flipnote Studio", | ||||||
|  | 					"Fluent" => "Fluent", | ||||||
|  | 					"ForestPack" => "Forest Pack", | ||||||
|  | 					"FormZ" => "Form-Z", | ||||||
|  | 					"Fractorium" => "Fractorium", | ||||||
|  | 					"FreeCAD" => "FreeCAD", | ||||||
|  | 					"FreeHand" => "FreeHand", | ||||||
|  | 					"Forger" => "Forger", | ||||||
|  | 					"FrostbiteEngine" => "Frostbite Engine", | ||||||
|  | 					"fSpy" => "fSpy", | ||||||
|  | 					"FumeFX" => "FumeFX", | ||||||
|  | 					"Fusion360" => "Fusion 360", | ||||||
|  | 					"GIMP" => "GIMP", | ||||||
|  | 					"GSCurveTools" => "GS CurveTools", | ||||||
|  | 					"GSToolbox" => "GS Toolbox", | ||||||
|  | 					"Gaea" => "Gaea", | ||||||
|  | 					"GameTextures" => "Game Textures", | ||||||
|  | 					"GameMakerStudio" => "GameMaker: Studio", | ||||||
|  | 					"GarageFarmNET" => "GarageFarm.NET", | ||||||
|  | 					"GeoGlyph" => "GeoGlyph", | ||||||
|  | 					"GigapixelAl" => "Gigapixel Al", | ||||||
|  | 					"Glaxnimate" => "Glaxnimate", | ||||||
|  | 					"GnomePaint" => "Gnome Paint", | ||||||
|  | 					"Godot" => "Godot", | ||||||
|  | 					"Goxel" => "Goxel", | ||||||
|  | 					"Graphite" => "Graphite", | ||||||
|  | 					"Graswald" => "Graswald", | ||||||
|  | 					"GravitySketch" => "Gravity Sketch", | ||||||
|  | 					"GuerillaRender" => "GuerillaRender", | ||||||
|  | 					"HDRLightStudio" => "HDR Light Studio", | ||||||
|  | 					"HairStrandDesigner" => "Hair Strand Designer", | ||||||
|  | 					"HairTGHairFur" => "HairTG - Hair & Fur", | ||||||
|  | 					"HairTGSurfaceFeatherEdition" => "HairTG - Surface, Feather Edition", | ||||||
|  | 					"HairTGSurfaceHairEdition" => "HairTG - Surface, Hair Edition", | ||||||
|  | 					"Handplane" => "Handplane", | ||||||
|  | 					"Hansoft" => "Hansoft", | ||||||
|  | 					"HardOps" => "Hard Ops", | ||||||
|  | 					"HardMesh" => "HardMesh", | ||||||
|  | 					"Harmony" => "Harmony", | ||||||
|  | 					"HeavypaintWebbypaint" => "Heavypaint/Webbypaint", | ||||||
|  | 					"HelloPaint" => "HelloPaint", | ||||||
|  | 					"HeliconFocus" => "Helicon Focus", | ||||||
|  | 					"Hexels" => "Hexels", | ||||||
|  | 					"HiPaint" => "HiPaint", | ||||||
|  | 					"Houdini" => "Houdini", | ||||||
|  | 					"HydraRenderer" => "Hydra Renderer", | ||||||
|  | 					"iArtbook" => "iArtbook", | ||||||
|  | 					"IbisPaint" => "ibisPaint", | ||||||
|  | 					"Ideas" => "Ideas", | ||||||
|  | 					"IllustStudio" => "Illust Studio", | ||||||
|  | 					"Illustrator" => "Illustrator", | ||||||
|  | 					"IllustratorDraw" => "Illustrator Draw", | ||||||
|  | 					"InDesign" => "InDesign", | ||||||
|  | 					"Inochi2D" => "Inochi2D", | ||||||
|  | 					"InVision" => "InVision", | ||||||
|  | 					"InVisionCraft" => "InVision Craft", | ||||||
|  | 					"InfinitePainter" => "Infinite Painter", | ||||||
|  | 					"Inkscape" => "Inkscape", | ||||||
|  | 					"Inspirit" => "Inspirit", | ||||||
|  | 					"InstaLOD" => "InstaLOD", | ||||||
|  | 					"InstaMAT" => "InstaMAT", | ||||||
|  | 					"InstantLightRealtimePBR" => "Instant Light Realtime PBR", | ||||||
|  | 					"InstantMeshes" => "Instant Meshes", | ||||||
|  | 					"InstantTerra" => "Instant Terra", | ||||||
|  | 					"Inventor" => "Inventor", | ||||||
|  | 					"Iray" => "Iray", | ||||||
|  | 					"JWildfire" => "JWildfire", | ||||||
|  | 					"Java" => "Java", | ||||||
|  | 					"Jira" => "Jira", | ||||||
|  | 					"JumpPaint" => "Jump Paint by MediBang", | ||||||
|  | 					"JSPaint" => "JS Paint", | ||||||
|  | 					"Katana" => "Katana", | ||||||
|  | 					"Keyshot" => "Keyshot", | ||||||
|  | 					"KidPix" => "Kid Pix", | ||||||
|  | 					"KitBash3D" => "KitBash3D", | ||||||
|  | 					"Knald" => "Knald", | ||||||
|  | 					"Kodon" => "Kodon", | ||||||
|  | 					"KolourPaint" => "KolourPaint", | ||||||
|  | 					"Krakatoa" => "Krakatoa", | ||||||
|  | 					"KRESKA" => "KRESKA", | ||||||
|  | 					"Krita" => "Krita", | ||||||
|  | 					"LensStudio" => "Lens Studio", | ||||||
|  | 					"LibreSprite" => "LibreSprite", | ||||||
|  | 					"LightWave3D" => "LightWave 3D", | ||||||
|  | 					"Lightroom" => "Lightroom", | ||||||
|  | 					"Linearity" => "Linearity", | ||||||
|  | 					"LiquiGen" => "LiquiGen", | ||||||
|  | 					"Live2DCubism" => "Live2D Cubism", | ||||||
|  | 					"LookatmyHair" => "Look at my Hair", | ||||||
|  | 					"Lotpixel" => "Lotpixel", | ||||||
|  | 					"Lumion" => "Lumion", | ||||||
|  | 					"LuxRender" => "LuxRender", | ||||||
|  | 					"MacPaint" => "MacPaint", | ||||||
|  | 					"MagicaCSG" => "MagicaCSG", | ||||||
|  | 					"MagicaVoxel" => "MagicaVoxel", | ||||||
|  | 					"Magma" => "Magma", | ||||||
|  | 					"MakeHuman" => "MakeHuman", | ||||||
|  | 					"Malmal" => "Malmal", | ||||||
|  | 					"Mandelbulb3D" => "Mandelbulb 3D", | ||||||
|  | 					"Mandelbulber" => "Mandelbulber", | ||||||
|  | 					"MangaStudio" => "Manga Studio", | ||||||
|  | 					"Mari" => "Mari", | ||||||
|  | 					"MarmosetToolbag" => "Marmoset Toolbag", | ||||||
|  | 					"MarvelousDesigner" => "Marvelous Designer", | ||||||
|  | 					"MasterpieceStudioPro" => "Masterpiece Studio Pro", | ||||||
|  | 					"MasterpieceVR" => "MasterpieceVR", | ||||||
|  | 					"Maverick" => "Maverick", | ||||||
|  | 					"MaxwellRender" => "Maxwell Render", | ||||||
|  | 					"Maya" => "Maya", | ||||||
|  | 					"MediBangPaint" => "MediBang Paint", | ||||||
|  | 					"MediumbyAdobe" => "Medium by Adobe", | ||||||
|  | 					"Megascans" => "Megascans", | ||||||
|  | 					"mentalray" => "mental ray", | ||||||
|  | 					"MeshLab" => "MeshLab", | ||||||
|  | 					"Meshroom" => "Meshroom", | ||||||
|  | 					"MetaHumanCreator" => "MetaHuman Creator", | ||||||
|  | 					"Metashape" => "Metashape", | ||||||
|  | 					"MightyBake" => "MightyBake", | ||||||
|  | 					"MikuMikuDance" => "MikuMikuDance", | ||||||
|  | 					"Minecraft" => "Minecraft", | ||||||
|  | 					"Mischief" => "Mischief", | ||||||
|  | 					"Mixamo" => "Mixamo", | ||||||
|  | 					"Mixer" => "Mixer", | ||||||
|  | 					"MoI3D" => "MoI3D", | ||||||
|  | 					"Mocha" => "Mocha", | ||||||
|  | 					"Modo" => "Modo", | ||||||
|  | 					"Moho" => "Moho", | ||||||
|  | 					"MotionBuilder" => "MotionBuilder", | ||||||
|  | 					"Mudbox" => "Mudbox", | ||||||
|  | 					"Muse" => "Muse", | ||||||
|  | 					"MSPaint" => "MS Paint", | ||||||
|  | 					"MyPaint" => "MyPaint", | ||||||
|  | 					"NDO" => "NDO", | ||||||
|  | 					"NX" => "NX", | ||||||
|  | 					"NdotCAD" => "NdotCAD", | ||||||
|  | 					"NintendoNotes" => "Nintendo Notes", | ||||||
|  | 					"NomadSculpt" => "Nomad Sculpt", | ||||||
|  | 					"Notability" => "Notability", | ||||||
|  | 					"Nuke" => "Nuke", | ||||||
|  | 					"Nvil" => "Nvil", | ||||||
|  | 					"OctaneRender" => "Octane Render", | ||||||
|  | 					"Omniverse" => "Omniverse", | ||||||
|  | 					"OmniverseCreate" => "Omniverse Create", | ||||||
|  | 					"ON1PhotoRAW" => "ON1 Photo RAW", | ||||||
|  | 					"Open3DEngine" => "Open 3D Engine", | ||||||
|  | 					"OpenCanvas" => "OpenCanvas", | ||||||
|  | 					"OpenGL" => "OpenGL", | ||||||
|  | 					"OpenToonz" => "OpenToonz", | ||||||
|  | 					"Ornatrix" => "Ornatrix", | ||||||
|  | 					"OsciRender" => "Osci-Render", | ||||||
|  | 					"OurPaint" => "Our Paint", | ||||||
|  | 					"PBRMAX" => "PBRMAX", | ||||||
|  | 					"PFTrack" => "PFTrack", | ||||||
|  | 					"PTGui" => "PTGui", | ||||||
|  | 					"Paintbrush" => "Paintbrush", | ||||||
|  | 					"PaintNET" => "Paint.NET", | ||||||
|  | 					"PaintShopPro" => "PaintShop Pro", | ||||||
|  | 					"PaintToolSAI" => "Paint Tool SAI", | ||||||
|  | 					"PaintstormStudio" => "Paintstorm Studio", | ||||||
|  | 					"Paper" => "Paper", | ||||||
|  | 					"Pencil2D" => "Pencil2D", | ||||||
|  | 					"Penpot" => "Penpot", | ||||||
|  | 					"PhoenixFD" => "Phoenix FD", | ||||||
|  | 					"Phonto" => "Phonto", | ||||||
|  | 					"PhotoLab2" => "PhotoLab 2", | ||||||
|  | 					"Photopea" => "Photopea", | ||||||
|  | 					"Photoscan" => "Photoscan", | ||||||
|  | 					"Photoshop" => "Photoshop", | ||||||
|  | 					"PhotoshopElements" => "Photoshop Elements", | ||||||
|  | 					"PicoCAD" => "picoCAD", | ||||||
|  | 					"PicoCAD2" => "picoCAD 2", | ||||||
|  | 					"Pinta" => "Pinta", | ||||||
|  | 					"Piskel" => "Piskel", | ||||||
|  | 					"Pixilart" => "Pixilart", | ||||||
|  | 					"Pixelitor" => "Pixelitor", | ||||||
|  | 					"Pixelmator" => "Pixelmator", | ||||||
|  | 					"Pixelorama" => "Pixelorama", | ||||||
|  | 					"PixivSketch" => "pixiv Sketch", | ||||||
|  | 					"Pixquare" => "Pixquare", | ||||||
|  | 					"PlantCatalog" => "PlantCatalog", | ||||||
|  | 					"PlantFactory" => "PlantFactory", | ||||||
|  | 					"Plasticity" => "Plasticity", | ||||||
|  | 					"PNGtuberPlus" => "PNGtuber Plus", | ||||||
|  | 					"Poliigon" => "Poliigon", | ||||||
|  | 					"Polybrush" => "Polybrush", | ||||||
|  | 					"PopcornFx" => "PopcornFx", | ||||||
|  | 					"Poser" => "Poser", | ||||||
|  | 					"Premiere" => "Premiere", | ||||||
|  | 					"PremiereElements" => "Premiere Elements", | ||||||
|  | 					"PresagisCreator" => "Presagis Creator", | ||||||
|  | 					"ProTools" => "Pro Tools", | ||||||
|  | 					"Procreate" => "Procreate", | ||||||
|  | 					"ProcreateDreams" => "Procreate Dreams", | ||||||
|  | 					"Producer" => "Producer", | ||||||
|  | 					"PrometheanAI" => "Promethean AI", | ||||||
|  | 					"PureRef" => "PureRef", | ||||||
|  | 					"Python" => "Python", | ||||||
|  | 					"PyxelEdit" => "PyxelEdit", | ||||||
|  | 					"QuadRemesher" => "Quad Remesher", | ||||||
|  | 					"QuarkXPress" => "QuarkXPress", | ||||||
|  | 					"Qubicle" => "Qubicle", | ||||||
|  | 					"Quill" => "Quill", | ||||||
|  | 					"QuixelBridge" => "Quixel Bridge", | ||||||
|  | 					"QuixelMegascans" => "Quixel Megascans", | ||||||
|  | 					"QuixelMixer" => "Quixel Mixer", | ||||||
|  | 					"QuixelSuite" => "Quixel Suite", | ||||||
|  | 					"R3DSWrap" => "R3DS Wrap", | ||||||
|  | 					"R3DSZWRAP" => "R3DS ZWRAP", | ||||||
|  | 					"RDTextures" => "RD-Textures", | ||||||
|  | 					"RailClone" => "RailClone", | ||||||
|  | 					"RealFlow" => "RealFlow", | ||||||
|  | 					"RealisticPaintStudio" => "Realistic Paint Studio", | ||||||
|  | 					"RealityCapture" => "RealityCapture", | ||||||
|  | 					"RealityScan" => "RealityScan", | ||||||
|  | 					"RealtimeBoard" => "Realtime Board", | ||||||
|  | 					"Rebelle" => "Rebelle", | ||||||
|  | 					"Redshift" => "Redshift", | ||||||
|  | 					"RenderMan" => "RenderMan", | ||||||
|  | 					"RenderNetwork" => "Render Network", | ||||||
|  | 					"Revit" => "Revit", | ||||||
|  | 					"Rhino" => "Rhino", | ||||||
|  | 					"Rhinoceros" => "Rhinoceros", | ||||||
|  | 					"RizomUV" => "RizomUV", | ||||||
|  | 					"RoughAnimator" => "Rough Animator", | ||||||
|  | 					"SamsungNotes" => "Samsung Notes", | ||||||
|  | 					"SamsungPENUP" => "Samsung PENUP", | ||||||
|  | 					"ScansLibrary" => "ScansLibrary", | ||||||
|  | 					"Scrivener" => "Scrivener", | ||||||
|  | 					"Sculpt+" => "Sculpt+", | ||||||
|  | 					"Sculptris" => "Sculptris", | ||||||
|  | 					"ShaveandaHaircut" => "Shave and a Haircut", | ||||||
|  | 					"ShiVa3D" => "ShiVa3D", | ||||||
|  | 					"Shotgun" => "Shotgun", | ||||||
|  | 					"Silo" => "Silo", | ||||||
|  | 					"Silugen" => "Silugen", | ||||||
|  | 					"Sketch" => "Sketch", | ||||||
|  | 					"SketchApp" => "Sketch App", | ||||||
|  | 					"SketchBookPro" => "SketchBook Pro", | ||||||
|  | 					"SketchClub" => "SketchClub", | ||||||
|  | 					"SketchUp" => "SketchUp", | ||||||
|  | 					"Sketchable" => "Sketchable", | ||||||
|  | 					"Sketchfab" => "Sketchfab", | ||||||
|  | 					"Skyshop" => "Skyshop", | ||||||
|  | 					"Snapseed" => "Snapseed", | ||||||
|  | 					"Snowdrop" => "Snowdrop", | ||||||
|  | 					"Softimage" => "Softimage", | ||||||
|  | 					"SolidWorks" => "SolidWorks", | ||||||
|  | 					"SonySketch" => "Sony Sketch", | ||||||
|  | 					"Soundbooth" => "Soundbooth", | ||||||
|  | 					"Source2" => "Source 2", | ||||||
|  | 					"SourceControl" => "Source Control", | ||||||
|  | 					"SourceFilmmaker" => "Source Filmmaker", | ||||||
|  | 					"SpeedTree" => "SpeedTree", | ||||||
|  | 					"Speedgrade" => "Speedgrade", | ||||||
|  | 					"SpeedyPainter" => "SpeedyPainter", | ||||||
|  | 					"Spine2D" => "Spine 2D", | ||||||
|  | 					"Spriter" => "Spriter", | ||||||
|  | 					"Stingray" => "Stingray", | ||||||
|  | 					"Storyboarder" => "Storyboarder", | ||||||
|  | 					"StoryboardPro" => "Storyboard Pro", | ||||||
|  | 					"SublimeText" => "Sublime Text", | ||||||
|  | 					"Substance3DDesigner" => "Substance 3D Designer", | ||||||
|  | 					"Substance3DModeler" => "Substance 3D Modeler", | ||||||
|  | 					"Substance3DPainter" => "Substance 3D Painter", | ||||||
|  | 					"Substance3DSampler" => "Substance 3D Sampler", | ||||||
|  | 					"Substance3DStager" => "Substance 3D Stager", | ||||||
|  | 					"SubstanceB2M" => "Substance B2M", | ||||||
|  | 					"SweetHome3D" => "Sweet Home 3D", | ||||||
|  | 					"SynthEyes" => "SynthEyes", | ||||||
|  | 					"TTools" => "TTools", | ||||||
|  | 					"TVPaint" => "TVPaint", | ||||||
|  | 					"TVPaintAnimation" => "TVPaint Animation", | ||||||
|  | 					"TayasuiSketches" => "Tayasui Sketches", | ||||||
|  | 					"TayasuiSketchesMobileApp" => "Tayasui Sketches Mobile App", | ||||||
|  | 					"TayasuiSketchesPro" => "Tayasui Sketches Pro", | ||||||
|  | 					"Terragen" => "Terragen", | ||||||
|  | 					"Texturescom" => "Textures.com", | ||||||
|  | 					"Texturingxyz" => "Texturingxyz", | ||||||
|  | 					"TeyaConceptor" => "Teya Conceptor", | ||||||
|  | 					"TheGrove3D" => "The Grove 3D", | ||||||
|  | 					"TheaRender" => "Thea Render", | ||||||
|  | 					"Threejs" => "Three.js", | ||||||
|  | 					"Tiled" => "Tiled", | ||||||
|  | 					"TiltBrush" => "Tilt Brush", | ||||||
|  | 					"Tooll3" => "Tooll3", | ||||||
|  | 					"ToonBoomHarmony" => "Toon Boom Harmony", | ||||||
|  | 					"ToonBoomStudio" => "Toon Boom Studio", | ||||||
|  | 					"ToonSquid" => "ToonSquid", | ||||||
|  | 					"TopoGun" => "TopoGun", | ||||||
|  | 					"TuxPaint" => "Tux Paint", | ||||||
|  | 					"Tvori" => "Tvori", | ||||||
|  | 					"Twinmotion" => "Twinmotion", | ||||||
|  | 					"UNIGINEEngine" => "UNIGINE Engine", | ||||||
|  | 					"UVLayout" => "UVLayout", | ||||||
|  | 					"UltraFractal" => "Ultra Fractal", | ||||||
|  | 					"uMake" => "uMake", | ||||||
|  | 					"Unfold3D" => "Unfold 3D", | ||||||
|  | 					"Unity" => "Unity", | ||||||
|  | 					"UnrealEngine" => "Unreal Engine", | ||||||
|  | 					"Vengi" => "vengi", | ||||||
|  | 					"VRay" => "V-Ray", | ||||||
|  | 					"VRED" => "VRED", | ||||||
|  | 					"VTubeStudio" => "VTube Studio", | ||||||
|  | 					"Vectary" => "Vectary", | ||||||
|  | 					"VectorayGen" => "VectorayGen", | ||||||
|  | 					"Vectorworks" => "Vectorworks", | ||||||
|  | 					"VegasPro" => "Vegas Pro", | ||||||
|  | 					"VisualDesigner3D" => "Visual Designer 3D", | ||||||
|  | 					"VisualStudio" => "Visual Studio", | ||||||
|  | 					"VRoidStudio" => "VRoid Studio", | ||||||
|  | 					"Vue" => "Vue", | ||||||
|  | 					"Vuforia" => "Vuforia", | ||||||
|  | 					"WebGL" => "WebGL", | ||||||
|  | 					"WhiteboardFox" => "Whiteboard Fox", | ||||||
|  | 					"WickEditor" => "Wick Editor", | ||||||
|  | 					"Wings3D" => "Wings 3D", | ||||||
|  | 					"Word" => "Word", | ||||||
|  | 					"WorldCreator" => "World Creator", | ||||||
|  | 					"WorldMachine" => "World Machine", | ||||||
|  | 					"XParticles" => "X-Particles", | ||||||
|  | 					"Xfrog" => "Xfrog", | ||||||
|  | 					"Xgen" => "Xgen", | ||||||
|  | 					"xNormal" => "xNormal", | ||||||
|  | 					"xTex" => "xTex", | ||||||
|  | 					"XoliulShader" => "Xoliul Shader", | ||||||
|  | 					"Yafaray" => "Yafaray", | ||||||
|  | 					"Yeti" => "Yeti", | ||||||
|  | 					"ZBrush" => "ZBrush", | ||||||
|  | 					"ZBrushCore" => "ZBrushCore", | ||||||
|  | 					"ZenBrush" => "Zen Brush" | ||||||
|  | 				] | ||||||
|  | 			] | ||||||
|  | 		]; | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	private function get($proxy, $url, $get = [], $search){ | ||||||
|  | 		 | ||||||
|  | 		$curlproc = curl_init(); | ||||||
|  | 		 | ||||||
|  | 		if($get !== []){ | ||||||
|  | 			$get = http_build_query($get); | ||||||
|  | 			$url .= "?" . $get; | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_URL, $url); | ||||||
|  | 		 | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_ENCODING, ""); // default encoding | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_HTTPHEADER, | ||||||
|  | 			["User-Agent: " . config::USER_AGENT, | ||||||
|  | 			"Accept: application/json, text/plain, */*", | ||||||
|  | 			"Accept-Language: en-US,en;q=0.5", | ||||||
|  | 			"Accept-Encoding: gzip, deflate, br, zstd", | ||||||
|  | 			//"sentry-trace: 72b0318a7141fe18cbacbd905572eddf-a60de161b66b1e6f-1 | ||||||
|  | 			//"baggage: sentry-environment=vercel-production,sentry-release=251ff5179b4de94974f36d9b8659a487bbb8a819,sentry-public_key=2b87af2b44c84643a011838ad097735f,sentry-trace_id=72b0318a7141fe18cbacbd905572eddf,sentry-transaction=GET%20%2Fsearch,sentry-sampled=true,sentry-sample_rand=0.09967130764937493,sentry-sample_rate=0.5", | ||||||
|  | 			"DNT: 1", | ||||||
|  | 			"Sec-GPC: 1", | ||||||
|  | 			"Connection: keep-alive", | ||||||
|  | 			//"Referer: https://cara.app/search?q=jak+and+daxter&type=&sortBy=Top&filters=%7B%7D", | ||||||
|  | 			"Referer: https://cara.app/search?q=" . urlencode($search), | ||||||
|  | 			//"Cookie: __Host-next-auth.csrf-token=b752c4296375bccb7b480ff010e1e916c65c35c311a4a57ac6cd871468730578%7C4d3783cfb72a98f390e534abd149806432b6cf8d50555a52d00e99216a516911; __Secure-next-auth.callback-url=https%3A%2F%2Fcara.app; crumb=BV0HDt87G5+fOWE0ZDQ5MWM0ZTQ3YTZmMzM4MGU5MGNjNDNmMzY2", | ||||||
|  | 			"Sec-Fetch-Dest: empty", | ||||||
|  | 			"Sec-Fetch-Mode: cors", | ||||||
|  | 			"Sec-Fetch-Site: same-origin", | ||||||
|  | 			"TE: trailers"] | ||||||
|  | 		); | ||||||
|  | 		 | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_RETURNTRANSFER, true); | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_SSL_VERIFYHOST, 2); | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_SSL_VERIFYPEER, true); | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_CONNECTTIMEOUT, 30); | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_TIMEOUT, 30); | ||||||
|  |  | ||||||
|  | 		$this->backend->assign_proxy($curlproc, $proxy); | ||||||
|  | 		 | ||||||
|  | 		$data = curl_exec($curlproc); | ||||||
|  | 		 | ||||||
|  | 		if(curl_errno($curlproc)){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception(curl_error($curlproc)); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		curl_close($curlproc); | ||||||
|  | 		return $data; | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	public function image($get){ | ||||||
|  | 		 | ||||||
|  | 		if($get["npt"]){ | ||||||
|  | 			 | ||||||
|  | 			[$npt, $proxy] = | ||||||
|  | 				$this->backend->get( | ||||||
|  | 					$get["npt"], | ||||||
|  | 					"images" | ||||||
|  | 				); | ||||||
|  | 			 | ||||||
|  | 			$npt = json_decode($npt, true); | ||||||
|  | 		}else{ | ||||||
|  | 			 | ||||||
|  | 			$search = $get["s"]; | ||||||
|  | 			if(strlen($search) === 0){ | ||||||
|  | 				 | ||||||
|  | 				throw new Exception("Search term is empty!"); | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			$proxy = $this->backend->get_ip(); | ||||||
|  | 						 | ||||||
|  | 			$npt = [ | ||||||
|  | 				"q" => $get["s"], | ||||||
|  | 				"sortBy" => $get["sort"], | ||||||
|  | 				"take" => 24, | ||||||
|  | 				"skip" => 0, | ||||||
|  | 				"filters" => [] | ||||||
|  | 			]; | ||||||
|  | 			 | ||||||
|  | 			// parse filters | ||||||
|  | 			if($get["type"] != "any"){ | ||||||
|  | 				 | ||||||
|  | 				$npt["filters"]["posts"] = [$get["type"]]; | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			if($get["fields"] != "any"){ | ||||||
|  | 				 | ||||||
|  | 				$npt["filters"]["fields"] = [$get["fields"]]; | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			if($get["category"] != "any"){ | ||||||
|  | 				 | ||||||
|  | 				$npt["filters"]["categories"] = [$get["category"]]; | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			if($get["software"] != "any"){ | ||||||
|  | 				 | ||||||
|  | 				$npt["filters"]["softwares"] = [$get["software"]]; | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			if($npt["filters"] == []){ | ||||||
|  | 				 | ||||||
|  | 				$npt["filters"] = "{}"; | ||||||
|  | 			}else{ | ||||||
|  | 				 | ||||||
|  | 				$npt["filters"] = json_encode($npt["filters"]); | ||||||
|  | 			} | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		$out = [ | ||||||
|  | 			"status" => "ok", | ||||||
|  | 			"npt" => null, | ||||||
|  | 			"image" => [] | ||||||
|  | 		]; | ||||||
|  | 		 | ||||||
|  | 		// https://cara.app/api/search/portfolio-posts?q=jak+and+daxter&sortBy=Top&take=24&skip=0&filters=%7B%7D | ||||||
|  | 		try{ | ||||||
|  | 			$json = | ||||||
|  | 				$this->get( | ||||||
|  | 					$proxy, | ||||||
|  | 					"https://cara.app/api/search/posts", | ||||||
|  | 					$npt, | ||||||
|  | 					$npt["q"] | ||||||
|  | 				); | ||||||
|  | 			 | ||||||
|  | 		}catch(Exception $error){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("Failed to fetch JSON"); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		$json = json_decode($json, true); | ||||||
|  | 		 | ||||||
|  | 		if($json === null){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("Failed to decode JSON"); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		$imagecount = 0; | ||||||
|  | 		foreach($json as $image){ | ||||||
|  | 			 | ||||||
|  | 			if(count($image["images"]) === 0){ | ||||||
|  | 				 | ||||||
|  | 				// sometimes the api returns no images for an object | ||||||
|  | 				$imagecount++; | ||||||
|  | 				continue; | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			$cover = null; | ||||||
|  | 			$sources = []; | ||||||
|  | 			 | ||||||
|  | 			foreach($image["images"] as $source){ | ||||||
|  | 				 | ||||||
|  | 				if($source["isCoverImg"]){ | ||||||
|  | 					 | ||||||
|  | 					$cover = [ | ||||||
|  | 						"url" => "https://images.cara.app/" . $this->fix_url($source["src"]), | ||||||
|  | 						"width" => 500, | ||||||
|  | 						"height" => 500 | ||||||
|  | 					]; | ||||||
|  | 				}else{ | ||||||
|  | 					 | ||||||
|  | 					$sources[] = [ | ||||||
|  | 						"url" => "https://images.cara.app/" . $this->fix_url($source["src"]), | ||||||
|  | 						"width" => null, | ||||||
|  | 						"height" => null | ||||||
|  | 					]; | ||||||
|  | 				} | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			if($cover !== null){ | ||||||
|  | 				 | ||||||
|  | 				$sources[] = $cover; | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			$out["image"][] = [ | ||||||
|  | 				"title" => str_replace("\n", " ", $image["content"]), | ||||||
|  | 				"source" => $sources, | ||||||
|  | 				"url" => "https://cara.app/post/" . $image["id"] | ||||||
|  | 			]; | ||||||
|  | 			 | ||||||
|  | 			$imagecount++; | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		if($imagecount === 24){ | ||||||
|  | 			 | ||||||
|  | 			$npt["skip"] += 24; | ||||||
|  | 			 | ||||||
|  | 			$out["npt"] = | ||||||
|  | 				$this->backend->store( | ||||||
|  | 					json_encode($npt), | ||||||
|  | 					"images", | ||||||
|  | 					$proxy | ||||||
|  | 				); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		return $out; | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	private function fix_url($url){ | ||||||
|  | 		 | ||||||
|  | 		return | ||||||
|  | 			str_replace( | ||||||
|  | 				[" "], | ||||||
|  | 				["%20"], | ||||||
|  | 				$url | ||||||
|  | 			); | ||||||
|  | 	} | ||||||
|  | } | ||||||
							
								
								
									
										680
									
								
								scraper/coccoc.php
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										680
									
								
								scraper/coccoc.php
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,680 @@ | |||||||
|  | <?php | ||||||
|  |  | ||||||
|  | class coccoc{ | ||||||
|  | 	 | ||||||
|  | 	public function __construct(){ | ||||||
|  | 		 | ||||||
|  | 		include "lib/backend.php"; | ||||||
|  | 		$this->backend = new backend("coccoc"); | ||||||
|  | 		 | ||||||
|  | 		include "lib/fuckhtml.php"; | ||||||
|  | 		$this->fuckhtml = new fuckhtml(); | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	 | ||||||
|  | 	private function get($proxy, $url, $get = []){ | ||||||
|  | 		 | ||||||
|  | 		$curlproc = curl_init(); | ||||||
|  | 		 | ||||||
|  | 		if($get !== []){ | ||||||
|  | 			$get = http_build_query($get); | ||||||
|  | 			$url .= "?" . $get; | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_URL, $url); | ||||||
|  | 		 | ||||||
|  | 		// http2 bypass | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_HTTP_VERSION, CURL_HTTP_VERSION_2_0); | ||||||
|  | 		 | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_HTTPHEADER, [ | ||||||
|  | 			"Accept: text/html,application/xhtml+xml,application/xml;q=0.9,*/*;q=0.8", | ||||||
|  | 			"Accept-Language: en-US,en;q=0.5", | ||||||
|  | 			"Accept-Encoding: gzip, deflate, br, zstd", | ||||||
|  | 			"DNT: 1", | ||||||
|  | 			"Sec-GPC: 1", | ||||||
|  | 			"Connection: keep-alive", | ||||||
|  | 			//"Cookie: _contentAB_15040_vi=V-06_01; split_test_search=new_search; uid=L_bauXyZBY1B; vid=uCVQJQSTgb9QGT3o; ls=1753742684; serp_version=29223843/7621a70; savedS=direct", | ||||||
|  | 			"Upgrade-Insecure-Requests: 1", | ||||||
|  | 			"Sec-Fetch-Dest: document", | ||||||
|  | 			"Sec-Fetch-Mode: navigate", | ||||||
|  | 			"Sec-Fetch-Site: cross-site", | ||||||
|  | 			"Priority: u=0, i" | ||||||
|  | 		]); | ||||||
|  | 		 | ||||||
|  | 		$this->backend->assign_proxy($curlproc, $proxy); | ||||||
|  | 		 | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_ENCODING, ""); // default encoding | ||||||
|  | 		 | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_RETURNTRANSFER, true); | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_SSL_VERIFYHOST, 2); | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_SSL_VERIFYPEER, true); | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_CONNECTTIMEOUT, 30); | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_TIMEOUT, 30); | ||||||
|  | 		 | ||||||
|  | 		$data = curl_exec($curlproc); | ||||||
|  | 		 | ||||||
|  | 		if(curl_errno($curlproc)){ | ||||||
|  | 			throw new Exception(curl_error($curlproc)); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		curl_close($curlproc); | ||||||
|  | 		return $data; | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	public function getfilters($pagetype){ | ||||||
|  | 		 | ||||||
|  | 		return [ | ||||||
|  | 			"nsfw" => [ | ||||||
|  | 				"display" => "NSFW", | ||||||
|  | 				"option" => [ | ||||||
|  | 					"yes" => "Yes", // nsfw by default???? | ||||||
|  | 					"no" => "No" // &safe=1 | ||||||
|  | 				] | ||||||
|  | 			], | ||||||
|  | 			"time" => [ | ||||||
|  | 				"display" => "Time posted", | ||||||
|  | 				"option" => [ | ||||||
|  | 					"any" => "Any time", | ||||||
|  | 					"1w" => "1 week ago", | ||||||
|  | 					"2w" => "2 weeks ago", | ||||||
|  | 					"1m" => "1 month ago", | ||||||
|  | 					"3m" => "3 months ago", | ||||||
|  | 					"6m" => "6 months ago", | ||||||
|  | 					"1Y" => "1 year ago" | ||||||
|  | 				] | ||||||
|  | 			], | ||||||
|  | 			"filter" => [ | ||||||
|  | 				"display" => "Remove duplicates", | ||||||
|  | 				"option" => [ | ||||||
|  | 					"no" => "No", | ||||||
|  | 					"yes" => "Yes" // &filter=0 | ||||||
|  | 				] | ||||||
|  | 			] | ||||||
|  | 		]; | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	public function web($get){ | ||||||
|  | 		 | ||||||
|  | 		if($get["npt"]){ | ||||||
|  | 			 | ||||||
|  | 			[$query, $proxy] = | ||||||
|  | 				$this->backend->get( | ||||||
|  | 					$get["npt"], | ||||||
|  | 					"web" | ||||||
|  | 				); | ||||||
|  | 			 | ||||||
|  | 			$query = json_decode($query, true); | ||||||
|  | 		}else{ | ||||||
|  | 			 | ||||||
|  | 			$proxy = $this->backend->get_ip(); | ||||||
|  | 			 | ||||||
|  | 			$query = [ | ||||||
|  | 				"query" => $get["s"] | ||||||
|  | 			]; | ||||||
|  | 			 | ||||||
|  | 			// add filters | ||||||
|  | 			if($get["nsfw"] == "no"){ | ||||||
|  | 				 | ||||||
|  | 				$query["safe"] = 1; | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			if($get["time"] != "any"){ | ||||||
|  | 				 | ||||||
|  | 				$query["tbs"] = $get["time"]; | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			if($get["filter"] == "yes"){ | ||||||
|  | 				 | ||||||
|  | 				$query["filter"] = 0; | ||||||
|  | 			} | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		try{ | ||||||
|  | 			 | ||||||
|  | 			$html = | ||||||
|  | 				$this->get( | ||||||
|  | 					$proxy, | ||||||
|  | 					"https://coccoc.com/search", | ||||||
|  | 					$query | ||||||
|  | 				); | ||||||
|  | 		}catch(Exception $error){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("Failed to get search page"); | ||||||
|  | 		} | ||||||
|  | 		//$html = file_get_contents("scraper/coccoc.html"); | ||||||
|  | 		 | ||||||
|  | 		 | ||||||
|  | 		$html = explode("window.composerResponse", $html, 2); | ||||||
|  | 		 | ||||||
|  | 		if(count($html) !== 2){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("Failed to grep window.composerResponse"); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		$html = | ||||||
|  | 			json_decode( | ||||||
|  | 				$this->fuckhtml | ||||||
|  | 				->extract_json( | ||||||
|  | 					ltrim($html[1], " =") | ||||||
|  | 				), | ||||||
|  | 				true | ||||||
|  | 			); | ||||||
|  | 		 | ||||||
|  | 		if($html === null){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("Failed to decode JSON"); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		if( | ||||||
|  | 			isset($html["captcha"]) && | ||||||
|  | 			(int)$html["captcha"] === 1 | ||||||
|  | 		){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("Coc Coc returned a Captcha"); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		if(!isset($html["search"]["search_results"])){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("Coc Coc did not return a search_results object"); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		$out = [ | ||||||
|  | 			"status" => "ok", | ||||||
|  | 			"spelling" => [ | ||||||
|  | 				"type" => "no_correction", | ||||||
|  | 				"using" => null, | ||||||
|  | 				"correction" => null | ||||||
|  | 			], | ||||||
|  | 			"npt" => null, | ||||||
|  | 			"answer" => [], | ||||||
|  | 			"web" => [], | ||||||
|  | 			"image" => [], | ||||||
|  | 			"video" => [], | ||||||
|  | 			"news" => [], | ||||||
|  | 			"related" => [] | ||||||
|  | 		]; | ||||||
|  | 		 | ||||||
|  | 		// word correction | ||||||
|  | 		foreach($html["top"] as $element){ | ||||||
|  | 			 | ||||||
|  | 			if(isset($element["spellChecker"][0]["query"])){ | ||||||
|  | 				 | ||||||
|  | 				$out["spelling"] = [ | ||||||
|  | 					"type" => "not_many", | ||||||
|  | 					"using" => $html["search"]["query"], | ||||||
|  | 					"correction" => $element["spellChecker"][0]["query"] | ||||||
|  | 				]; | ||||||
|  | 			} | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		foreach($html["search"]["search_results"] as $result){ | ||||||
|  | 			 | ||||||
|  | 			if(isset($result["type"])){ | ||||||
|  | 				 | ||||||
|  | 				switch($result["type"]){ | ||||||
|  | 					 | ||||||
|  | 					// | ||||||
|  | 					// Related searches | ||||||
|  | 					// | ||||||
|  | 					case "related_queries": | ||||||
|  | 						$out["related"] = $result["queries"]; | ||||||
|  | 						continue 2; | ||||||
|  | 					 | ||||||
|  | 					// | ||||||
|  | 					// Videos | ||||||
|  | 					// | ||||||
|  | 					case "video_hits": | ||||||
|  | 						foreach($result["results"] as $video){ | ||||||
|  | 							 | ||||||
|  | 							if( | ||||||
|  | 								isset($video["image_url"]) && | ||||||
|  | 								!empty($video["image_url"]) | ||||||
|  | 							){ | ||||||
|  | 								 | ||||||
|  | 								$thumb = [ | ||||||
|  | 									"ratio" => "16:9", | ||||||
|  | 									"url" => $video["image_url"] | ||||||
|  | 								]; | ||||||
|  | 							}else{ | ||||||
|  | 								 | ||||||
|  | 								$thumb = [ | ||||||
|  | 									"ratio" => null, | ||||||
|  | 									"url" => null | ||||||
|  | 								]; | ||||||
|  | 							} | ||||||
|  | 							 | ||||||
|  | 							$out["video"][] = [ | ||||||
|  | 								"title" => | ||||||
|  | 									$this->titledots( | ||||||
|  | 										$this->fuckhtml | ||||||
|  | 										->getTextContent( | ||||||
|  | 											$video["title"] | ||||||
|  | 										) | ||||||
|  | 									), | ||||||
|  | 								"description" => null, | ||||||
|  | 								"author" => [ | ||||||
|  | 									"name" => $video["uploader"], | ||||||
|  | 									"url" => null, | ||||||
|  | 									"avatar" => null | ||||||
|  | 								], | ||||||
|  | 								"date" => (int)$video["date"], | ||||||
|  | 								"duration" => (int)$video["duration"], | ||||||
|  | 								"views" => null, | ||||||
|  | 								"thumb" => $thumb, | ||||||
|  | 								"url" => $video["url"] | ||||||
|  | 							]; | ||||||
|  | 						} | ||||||
|  | 						continue 2; | ||||||
|  | 				} | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			if( | ||||||
|  | 				!isset($result["title"]) || | ||||||
|  | 				!isset($result["url"]) | ||||||
|  | 			){ | ||||||
|  | 				 | ||||||
|  | 				// should not happen | ||||||
|  | 				continue; | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			if(isset($result["rich"]["data"]["image_url"])){ | ||||||
|  | 				 | ||||||
|  | 				$thumb = [ | ||||||
|  | 					"url" => $result["rich"]["data"]["image_url"], | ||||||
|  | 					"ratio" => "16:9" | ||||||
|  | 				]; | ||||||
|  | 			}else{ | ||||||
|  | 				 | ||||||
|  | 				$thumb = [ | ||||||
|  | 					"url" => null, | ||||||
|  | 					"ratio" => null | ||||||
|  | 				]; | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			$sublinks = []; | ||||||
|  | 			 | ||||||
|  | 			if(isset($result["rich"]["data"]["linked_docs"])){ | ||||||
|  | 				 | ||||||
|  | 				foreach($result["rich"]["data"]["linked_docs"] as $sub){ | ||||||
|  | 					 | ||||||
|  | 					$sublinks[] = [ | ||||||
|  | 						"title" => | ||||||
|  | 							$this->titledots( | ||||||
|  | 								$this->fuckhtml | ||||||
|  | 								->getTextContent( | ||||||
|  | 									$sub["title"] | ||||||
|  | 								) | ||||||
|  | 							), | ||||||
|  | 						"description" => | ||||||
|  | 							$this->titledots( | ||||||
|  | 								$this->fuckhtml | ||||||
|  | 								->getTextContent( | ||||||
|  | 									$sub["content"] | ||||||
|  | 								) | ||||||
|  | 							), | ||||||
|  | 						"date" => null, | ||||||
|  | 						"url" => $sub["url"] | ||||||
|  | 					]; | ||||||
|  | 				} | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			// get date | ||||||
|  | 			if(isset($result["date"])){ | ||||||
|  | 				 | ||||||
|  | 				$date = (int)$result["date"]; | ||||||
|  | 			}else{ | ||||||
|  | 				 | ||||||
|  | 				$date = null; | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			// probe for metadata | ||||||
|  | 			$table = []; | ||||||
|  | 			 | ||||||
|  | 			if(isset($result["rich"]["data"]["rating"])){ | ||||||
|  | 				 | ||||||
|  | 				$table["Rating"] = $result["rich"]["data"]["rating"]; | ||||||
|  | 				 | ||||||
|  | 				if(isset($result["rich"]["data"]["num_rating"])){ | ||||||
|  | 					 | ||||||
|  | 					$table["Rating"] .= " (" . number_format($result["rich"]["data"]["num_rating"]) . " ratings)"; | ||||||
|  | 				} | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			if(isset($result["rich"]["data"]["views"])){ | ||||||
|  | 				 | ||||||
|  | 				$table["Views"] = number_format($result["rich"]["data"]["views"]); | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			if(isset($result["rich"]["data"]["duration"])){ | ||||||
|  | 				 | ||||||
|  | 				$table["Duration"] = $this->int2hms($result["rich"]["data"]["duration"]); | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			if(isset($result["rich"]["data"]["channel_name"])){ | ||||||
|  | 				 | ||||||
|  | 				$table["Author"] = $result["rich"]["data"]["channel_name"]; | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			if(isset($result["rich"]["data"]["video_quality"])){ | ||||||
|  | 				 | ||||||
|  | 				$table["Quality"] = $result["rich"]["data"]["video_quality"]; | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			if(isset($result["rich"]["data"]["category"])){ | ||||||
|  | 				 | ||||||
|  | 				$table["Category"] = $result["rich"]["data"]["category"]; | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			$out["web"][] = [ | ||||||
|  | 				"title" => | ||||||
|  | 					$this->titledots( | ||||||
|  | 						$this->fuckhtml | ||||||
|  | 						->getTextContent( | ||||||
|  | 							$result["title"] | ||||||
|  | 						) | ||||||
|  | 					), | ||||||
|  | 				"description" => | ||||||
|  | 					$this->titledots( | ||||||
|  | 						$this->fuckhtml | ||||||
|  | 						->getTextContent( | ||||||
|  | 							$result["content"] | ||||||
|  | 						) | ||||||
|  | 					), | ||||||
|  | 				"url" => $result["url"], | ||||||
|  | 				"date" => $date, | ||||||
|  | 				"type" => "web", | ||||||
|  | 				"thumb" => $thumb, | ||||||
|  | 				"sublink" => $sublinks, | ||||||
|  | 				"table" => $table | ||||||
|  | 			]; | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		// | ||||||
|  | 		// Get wikipedia head | ||||||
|  | 		// | ||||||
|  | 		if(isset($html["right"])){ | ||||||
|  | 			 | ||||||
|  | 			foreach($html["right"] as $wiki){ | ||||||
|  | 				 | ||||||
|  | 				$description = []; | ||||||
|  | 				 | ||||||
|  | 				if(isset($wiki["short_intro"])){ | ||||||
|  | 					 | ||||||
|  | 					$description[] = | ||||||
|  | 						[ | ||||||
|  | 							"type" => "quote", | ||||||
|  | 							"value" => $wiki["short_intro"], | ||||||
|  | 						]; | ||||||
|  | 				} | ||||||
|  | 				 | ||||||
|  | 				if(isset($wiki["intro"])){ | ||||||
|  | 					 | ||||||
|  | 					$description[] = | ||||||
|  | 						[ | ||||||
|  | 							"type" => "text", | ||||||
|  | 							"value" => $wiki["intro"], | ||||||
|  | 						]; | ||||||
|  | 				} | ||||||
|  | 				 | ||||||
|  | 				// get table elements | ||||||
|  | 				$table = []; | ||||||
|  | 				 | ||||||
|  | 				if(isset($wiki["fields"])){ | ||||||
|  | 					 | ||||||
|  | 					foreach($wiki["fields"] as $element){ | ||||||
|  | 						 | ||||||
|  | 						$table[$element["title"]] = implode(", ", $element["value"]); | ||||||
|  | 					} | ||||||
|  | 				} | ||||||
|  | 				 | ||||||
|  | 				// get sublinks | ||||||
|  | 				$sublinks = []; | ||||||
|  | 				 | ||||||
|  | 				if(isset($wiki["website"])){ | ||||||
|  | 					 | ||||||
|  | 					if( | ||||||
|  | 						preg_match( | ||||||
|  | 							'/^http/', | ||||||
|  | 							$wiki["website"] | ||||||
|  | 						) === 0 | ||||||
|  | 					){ | ||||||
|  | 						 | ||||||
|  | 						$sublinks["Website"] = "https://" . $wiki["website"]; | ||||||
|  | 					}else{ | ||||||
|  | 						 | ||||||
|  | 						$sublinks["Website"] = $wiki["website"]; | ||||||
|  | 					} | ||||||
|  | 				} | ||||||
|  | 				 | ||||||
|  | 				foreach($wiki["profiles"] as $sitename => $url){ | ||||||
|  | 					 | ||||||
|  | 					$sitename = explode("_", $sitename); | ||||||
|  | 					$sitename = ucfirst($sitename[count($sitename) - 1]); | ||||||
|  | 					 | ||||||
|  | 					$sublinks[$sitename] = $url; | ||||||
|  | 				} | ||||||
|  | 				 | ||||||
|  | 				$out["answer"][] = [ | ||||||
|  | 					"title" => | ||||||
|  | 						$this->titledots( | ||||||
|  | 							$wiki["title"] | ||||||
|  | 						), | ||||||
|  | 					"description" => $description, | ||||||
|  | 					"url" => null, | ||||||
|  | 					"thumb" => isset($wiki["image"]["contentUrl"]) ? $wiki["image"]["contentUrl"] : null, | ||||||
|  | 					"table" => $table, | ||||||
|  | 					"sublink" => $sublinks | ||||||
|  | 				]; | ||||||
|  | 			} | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		// get next page | ||||||
|  | 		if((int)$html["search"]["page"] < (int)$html["search"]["max_page"]){ | ||||||
|  | 			 | ||||||
|  | 			// https://coccoc.com/composer?_=1754021153532&p=0&q=zbabduiqwhduwqhdnwq&reqid=bwcAs00q&s=direct&apiV=1 | ||||||
|  | 			// ^json endpoint, but we can just do &page=2 lol | ||||||
|  | 			 | ||||||
|  | 			if(!isset($query["page"])){ | ||||||
|  | 				 | ||||||
|  | 				$query["page"] = 2; | ||||||
|  | 			}else{ | ||||||
|  | 				 | ||||||
|  | 				$query["page"]++; | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			$out["npt"] = | ||||||
|  | 				$this->backend | ||||||
|  | 				->store( | ||||||
|  | 					json_encode($query), | ||||||
|  | 					"web", | ||||||
|  | 					$proxy | ||||||
|  | 				); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		return $out; | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	public function video($get){ | ||||||
|  | 		 | ||||||
|  | 		//$html = file_get_contents("scraper/coccoc.html"); | ||||||
|  | 		if($get["npt"]){ | ||||||
|  | 			 | ||||||
|  | 			[$query, $proxy] = | ||||||
|  | 				$this->backend->get( | ||||||
|  | 					$get["npt"], | ||||||
|  | 					"videos" | ||||||
|  | 				); | ||||||
|  | 			 | ||||||
|  | 			$query = json_decode($query, true); | ||||||
|  | 		}else{ | ||||||
|  | 			 | ||||||
|  | 			$proxy = $this->backend->get_ip(); | ||||||
|  | 			 | ||||||
|  | 			$query = [ | ||||||
|  | 				"query" => $get["s"], | ||||||
|  | 				"tbm" => "vid" | ||||||
|  | 			]; | ||||||
|  | 			 | ||||||
|  | 			// add filters | ||||||
|  | 			if($get["nsfw"] == "no"){ | ||||||
|  | 				 | ||||||
|  | 				$query["safe"] = 1; | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			if($get["time"] != "any"){ | ||||||
|  | 				 | ||||||
|  | 				$query["tbs"] = $get["time"]; | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			if($get["filter"] == "yes"){ | ||||||
|  | 				 | ||||||
|  | 				$query["filter"] = 0; | ||||||
|  | 			} | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		try{ | ||||||
|  | 			 | ||||||
|  | 			$html = | ||||||
|  | 				$this->get( | ||||||
|  | 					$proxy, | ||||||
|  | 					"https://coccoc.com/search", | ||||||
|  | 					$query | ||||||
|  | 				); | ||||||
|  | 		}catch(Exception $error){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("Failed to get search page"); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		$html = explode("window.composerResponse", $html, 2); | ||||||
|  | 		 | ||||||
|  | 		if(count($html) !== 2){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("Failed to grep window.composerResponse"); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		$html = | ||||||
|  | 			json_decode( | ||||||
|  | 				$this->fuckhtml | ||||||
|  | 				->extract_json( | ||||||
|  | 					ltrim($html[1], " =") | ||||||
|  | 				), | ||||||
|  | 				true | ||||||
|  | 			); | ||||||
|  | 		 | ||||||
|  | 		if($html === null){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("Failed to decode JSON"); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		$out = [ | ||||||
|  | 			"status" => "ok", | ||||||
|  | 			"npt" => null, | ||||||
|  | 			"video" => [], | ||||||
|  | 			"author" => [], | ||||||
|  | 			"livestream" => [], | ||||||
|  | 			"playlist" => [], | ||||||
|  | 			"reel" => [] | ||||||
|  | 		]; | ||||||
|  | 		 | ||||||
|  | 		if(!isset($html["search_video"]["search_results"])){ | ||||||
|  | 			 | ||||||
|  | 			if(isset($html["search_video"]["error"]["title"])){ | ||||||
|  | 				 | ||||||
|  | 				if($html["search_video"]["error"]["title"] == "Không tìm thấy kết quả nào"){ | ||||||
|  | 					 | ||||||
|  | 					return $out; | ||||||
|  | 				} | ||||||
|  | 				 | ||||||
|  | 				throw new Exception("Coc Coc returned an error: " . $html["search_video"]["error"]["title"]); | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("Coc Coc did not supply a search_results object"); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		foreach($html["search_video"]["search_results"] as $video){ | ||||||
|  | 			 | ||||||
|  | 			if(isset($video["rich"]["data"]["image_url"])){ | ||||||
|  | 				 | ||||||
|  | 				$thumb = [ | ||||||
|  | 					"ratio" => "16:9", | ||||||
|  | 					"url" => $video["rich"]["data"]["image_url"] | ||||||
|  | 				]; | ||||||
|  | 			}else{ | ||||||
|  | 				 | ||||||
|  | 				$thumb = [ | ||||||
|  | 					"ratio" => null, | ||||||
|  | 					"url" => null | ||||||
|  | 				]; | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			$out["video"][] = [ | ||||||
|  | 				"title" => | ||||||
|  | 					$this->titledots( | ||||||
|  | 						$this->fuckhtml | ||||||
|  | 						->getTextContent( | ||||||
|  | 							$video["title"] | ||||||
|  | 						) | ||||||
|  | 					), | ||||||
|  | 				"description" => | ||||||
|  | 					$this->titledots( | ||||||
|  | 						$this->fuckhtml | ||||||
|  | 						->getTextContent( | ||||||
|  | 							$video["content"] | ||||||
|  | 						) | ||||||
|  | 					), | ||||||
|  | 				"author" => [ | ||||||
|  | 					"name" =>  | ||||||
|  | 						isset($video["rich"]["data"]["channel_name"]) ? | ||||||
|  | 							$video["rich"]["data"]["channel_name"] : null, | ||||||
|  | 					"url" => null, | ||||||
|  | 					"avatar" => null | ||||||
|  | 				], | ||||||
|  | 				"date" => | ||||||
|  | 					isset($video["date"]) ? | ||||||
|  | 						$video["date"] : null, | ||||||
|  | 				"duration" => | ||||||
|  | 					isset($video["rich"]["data"]["duration"]) ? | ||||||
|  | 						(int)$video["rich"]["data"]["duration"] : null, | ||||||
|  | 				"views" => null, | ||||||
|  | 				"thumb" => $thumb, | ||||||
|  | 				"url" => $video["url"] | ||||||
|  | 			]; | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		// get next page | ||||||
|  | 		if((int)$html["search_video"]["page"] < (int)$html["search_video"]["max_page"]){ | ||||||
|  | 			 | ||||||
|  | 			if(!isset($query["page"])){ | ||||||
|  | 				 | ||||||
|  | 				$query["page"] = 2; | ||||||
|  | 			}else{ | ||||||
|  | 				 | ||||||
|  | 				$query["page"]++; | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			$out["npt"] = | ||||||
|  | 				$this->backend | ||||||
|  | 				->store( | ||||||
|  | 					json_encode($query), | ||||||
|  | 					"videos", | ||||||
|  | 					$proxy | ||||||
|  | 				); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		return $out; | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	private function titledots($title){ | ||||||
|  | 		 | ||||||
|  | 		return trim($title, " .\t\n\r\0\x0B…"); | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	private function int2hms($seconds){ | ||||||
|  | 		 | ||||||
|  | 		$hours = floor($seconds / 3600); | ||||||
|  | 		$minutes = floor(($seconds % 3600) / 60); | ||||||
|  | 		$seconds = $seconds % 60; | ||||||
|  | 		 | ||||||
|  | 		return sprintf("%02d:%02d:%02d", $hours, $minutes, $seconds); | ||||||
|  | 	} | ||||||
|  | } | ||||||
							
								
								
									
										3677
									
								
								scraper/ddg.php
									
									
									
									
									
								
							
							
						
						
									
										3677
									
								
								scraper/ddg.php
									
									
									
									
									
								
							
										
											
												File diff suppressed because it is too large
												Load Diff
											
										
									
								
							
							
								
								
									
										262
									
								
								scraper/fivehpx.php
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										262
									
								
								scraper/fivehpx.php
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,262 @@ | |||||||
|  | <?php | ||||||
|  |  | ||||||
|  | class fivehpx{ | ||||||
|  | 	 | ||||||
|  | 	public function __construct(){ | ||||||
|  | 		 | ||||||
|  | 		include "lib/backend.php"; | ||||||
|  | 		$this->backend = new backend("fivehpx"); | ||||||
|  | 		 | ||||||
|  | 		include "lib/fuckhtml.php"; | ||||||
|  | 		$this->fuckhtml = new fuckhtml(); | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	public function getfilters($page){ | ||||||
|  | 		 | ||||||
|  | 		return [ | ||||||
|  | 			"sort" => [ | ||||||
|  | 				"display" => "Sort", | ||||||
|  | 				"option" => [ | ||||||
|  | 					"relevance" => "Relevance", | ||||||
|  | 					"pulse" => "Pulse", | ||||||
|  | 					"newest" => "Newest" | ||||||
|  | 				] | ||||||
|  | 			] | ||||||
|  | 		]; | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	private function get($proxy, $url, $get = [], $post_data = null){ | ||||||
|  | 		 | ||||||
|  | 		$curlproc = curl_init(); | ||||||
|  | 		 | ||||||
|  | 		if($get !== []){ | ||||||
|  | 			$get = http_build_query($get); | ||||||
|  | 			$url .= "?" . $get; | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_URL, $url); | ||||||
|  | 		 | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_ENCODING, ""); // default encoding | ||||||
|  | 		 | ||||||
|  | 		if($post_data === null){ | ||||||
|  | 			 | ||||||
|  | 			curl_setopt($curlproc, CURLOPT_HTTPHEADER, | ||||||
|  | 				["User-Agent: " . config::USER_AGENT, | ||||||
|  | 				"Accept: text/html,application/xhtml+xml,application/xml;q=0.9,image/avif,image/webp,*/*;q=0.8", | ||||||
|  | 				"Accept-Language: en-US,en;q=0.5", | ||||||
|  | 				"Accept-Encoding: gzip", | ||||||
|  | 				"DNT: 1", | ||||||
|  | 				"Sec-GPC: 1", | ||||||
|  | 				"Connection: keep-alive", | ||||||
|  | 				"Upgrade-Insecure-Requests: 1", | ||||||
|  | 				"Sec-Fetch-Dest: document", | ||||||
|  | 				"Sec-Fetch-Mode: navigate", | ||||||
|  | 				"Sec-Fetch-Site: same-origin", | ||||||
|  | 				"Sec-Fetch-User: ?1", | ||||||
|  | 				"Priority: u=0, i", | ||||||
|  | 				"TE: trailers"] | ||||||
|  | 			); | ||||||
|  | 		}else{ | ||||||
|  | 			 | ||||||
|  | 			curl_setopt($curlproc, CURLOPT_HTTPHEADER, | ||||||
|  | 				["User-Agent: " . config::USER_AGENT, | ||||||
|  | 				"Accept: */*", | ||||||
|  | 				"Accept-Language: en-US,en;q=0.5", | ||||||
|  | 				"Accept-Encoding: gzip", | ||||||
|  | 				"Referer: https://500px.com/", | ||||||
|  | 				"content-type: application/json", | ||||||
|  | 				//"x-csrf-token: undefined", | ||||||
|  | 				"x-500px-source: Search", | ||||||
|  | 				"Content-Length: " . strlen($post_data), | ||||||
|  | 				"Origin: https://500px.com", | ||||||
|  | 				"DNT: 1", | ||||||
|  | 				"Sec-GPC: 1", | ||||||
|  | 				"Connection: keep-alive", | ||||||
|  | 				// "Cookie: _pin_unauth, _fbp, _sharedID, _sharedID_cst", | ||||||
|  | 				"Sec-Fetch-Dest: empty", | ||||||
|  | 				"Sec-Fetch-Mode: cors", | ||||||
|  | 				"Sec-Fetch-Site: same-site", | ||||||
|  | 				"Priority: u=4", | ||||||
|  | 				"TE: trailers"] | ||||||
|  | 			); | ||||||
|  | 						 | ||||||
|  | 			// set post data | ||||||
|  | 			curl_setopt($curlproc, CURLOPT_POST, true); | ||||||
|  | 			curl_setopt($curlproc, CURLOPT_POSTFIELDS, $post_data); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_RETURNTRANSFER, true); | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_SSL_VERIFYHOST, 2); | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_SSL_VERIFYPEER, true); | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_CONNECTTIMEOUT, 30); | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_TIMEOUT, 30); | ||||||
|  | 		 | ||||||
|  | 		// http2 bypass | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_HTTP_VERSION, CURL_HTTP_VERSION_2_0); | ||||||
|  | 		 | ||||||
|  | 		$this->backend->assign_proxy($curlproc, $proxy); | ||||||
|  | 		 | ||||||
|  | 		$data = curl_exec($curlproc); | ||||||
|  | 		 | ||||||
|  | 		if(curl_errno($curlproc)){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception(curl_error($curlproc)); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		curl_close($curlproc); | ||||||
|  | 		return $data; | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	public function image($get){ | ||||||
|  | 		 | ||||||
|  | 		if($get["npt"]){ | ||||||
|  | 			 | ||||||
|  | 			[$pagination, $proxy] = | ||||||
|  | 				$this->backend->get( | ||||||
|  | 					$get["npt"], "images" | ||||||
|  | 				); | ||||||
|  | 			 | ||||||
|  | 			$pagination = json_decode($pagination, true); | ||||||
|  | 			$search = $pagination["search"]; | ||||||
|  | 			 | ||||||
|  | 		}else{ | ||||||
|  | 			 | ||||||
|  | 			$search = $get["s"]; | ||||||
|  | 			if(strlen($search) === 0){ | ||||||
|  | 				 | ||||||
|  | 				throw new Exception("Search term is empty!"); | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			$proxy = $this->backend->get_ip(); | ||||||
|  | 			$pagination = [ | ||||||
|  | 				"sort" => strtoupper($get["sort"]), | ||||||
|  | 				"search" => $search, | ||||||
|  | 				"filters" => [], | ||||||
|  | 				"nlp" => false, | ||||||
|  | 			]; | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		try{ | ||||||
|  | 			 | ||||||
|  | 			$json = | ||||||
|  | 				$this->get( | ||||||
|  | 					$proxy, | ||||||
|  | 					"https://api.500px.com/graphql", | ||||||
|  | 					[], | ||||||
|  | 					json_encode([ | ||||||
|  | 						"operationName" => "PhotoSearchPaginationContainerQuery", | ||||||
|  | 						"variables" => $pagination, | ||||||
|  | 						"query" => | ||||||
|  | 							'query PhotoSearchPaginationContainerQuery(' . | ||||||
|  | 							(isset($pagination["cursor"]) ? '$cursor: String, ' : "") . | ||||||
|  | 							'$sort: PhotoSort, $search: String!, $filters: [PhotoSearchFilter!], $nlp: Boolean) {  ...PhotoSearchPaginationContainer_query_1vzAZD} fragment PhotoSearchPaginationContainer_query_1vzAZD on Query { photoSearch(sort: $sort, first: 100, ' . | ||||||
|  | 							(isset($pagination["cursor"]) ? 'after: $cursor, ' : "") . | ||||||
|  | 							'search: $search, filters: $filters, nlp: $nlp) { edges { node { id legacyId canonicalPath name description width height images(sizes: [33, 36]) { size url id } } } totalCount pageInfo { endCursor hasNextPage } }}' | ||||||
|  | 					]) | ||||||
|  | 				); | ||||||
|  | 		}catch(Exception $error){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("Failed to fetch graphQL object"); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		$json = json_decode($json, true); | ||||||
|  | 		 | ||||||
|  | 		if($json === null){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("Failed to decode graphQL object"); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		if(isset($json["errors"][0]["message"])){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("500px returned an API error: " . $json["errors"][0]["message"]); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		if(!isset($json["data"]["photoSearch"]["edges"])){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("No edges returned by API"); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		$out = [ | ||||||
|  | 			"status" => "ok", | ||||||
|  | 			"npt" => null, | ||||||
|  | 			"image" => [] | ||||||
|  | 		]; | ||||||
|  | 		 | ||||||
|  | 		foreach($json["data"]["photoSearch"]["edges"] as $image){ | ||||||
|  | 			 | ||||||
|  | 			$image = $image["node"]; | ||||||
|  | 			$title = | ||||||
|  | 				trim( | ||||||
|  | 					$this->fuckhtml | ||||||
|  | 					->getTextContent( | ||||||
|  | 						$image["name"] | ||||||
|  | 					) . ": " . | ||||||
|  | 					$this->fuckhtml | ||||||
|  | 					->getTextContent( | ||||||
|  | 						$image["description"] | ||||||
|  | 					) | ||||||
|  | 					, " :" | ||||||
|  | 				); | ||||||
|  | 			 | ||||||
|  | 			$small = $this->image_ratio(600, $image["width"], $image["height"]); | ||||||
|  | 			$large = $this->image_ratio(2048, $image["width"], $image["height"]); | ||||||
|  | 			 | ||||||
|  | 			$out["image"][] = [ | ||||||
|  | 				"title" => $title, | ||||||
|  | 				"source" => [ | ||||||
|  | 					[ | ||||||
|  | 						"url" => $image["images"][1]["url"], | ||||||
|  | 						"width" => $large[0], | ||||||
|  | 						"height" => $large[1] | ||||||
|  | 					], | ||||||
|  | 					[ | ||||||
|  | 						"url" => $image["images"][0]["url"], | ||||||
|  | 						"width" => $small[0], | ||||||
|  | 						"height" => $small[1] | ||||||
|  | 					] | ||||||
|  | 				], | ||||||
|  | 				"url" => "https://500px.com" . $image["canonicalPath"] | ||||||
|  | 			]; | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		// get NPT token | ||||||
|  | 		if($json["data"]["photoSearch"]["pageInfo"]["hasNextPage"] === true){ | ||||||
|  | 			 | ||||||
|  | 			$out["npt"] = | ||||||
|  | 				$this->backend->store( | ||||||
|  | 					json_encode([ | ||||||
|  | 						"cursor" => $json["data"]["photoSearch"]["pageInfo"]["endCursor"], | ||||||
|  | 						"search" => $search, | ||||||
|  | 						"sort" => $pagination["sort"], | ||||||
|  | 						"filters" => [], | ||||||
|  | 						"nlp" => false | ||||||
|  | 					]), | ||||||
|  | 					"images", | ||||||
|  | 					$proxy | ||||||
|  | 				); | ||||||
|  | 		} | ||||||
|  | 			 | ||||||
|  | 		return $out; | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	private function image_ratio($longest_edge, $width, $height){ | ||||||
|  | 		 | ||||||
|  | 		$ratio = [ | ||||||
|  | 			$longest_edge / $width, | ||||||
|  | 			$longest_edge / $height | ||||||
|  | 		]; | ||||||
|  | 		 | ||||||
|  | 		if($ratio[0] < $ratio[1]){ | ||||||
|  | 			 | ||||||
|  | 			$ratio = $ratio[0]; | ||||||
|  | 		}else{ | ||||||
|  | 			 | ||||||
|  | 			$ratio = $ratio[1]; | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		return [ | ||||||
|  | 			floor($width * $ratio), | ||||||
|  | 			floor($height * $ratio) | ||||||
|  | 		]; | ||||||
|  | 	} | ||||||
|  | } | ||||||
							
								
								
									
										415
									
								
								scraper/flickr.php
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										415
									
								
								scraper/flickr.php
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,415 @@ | |||||||
|  | <?php | ||||||
|  |  | ||||||
|  | class flickr{ | ||||||
|  | 	 | ||||||
|  | 	const req_web = 0; | ||||||
|  | 	const req_xhr = 1; | ||||||
|  | 	 | ||||||
|  | 	public function __construct(){ | ||||||
|  | 		 | ||||||
|  | 		include "lib/backend.php"; | ||||||
|  | 		$this->backend = new backend("flickr"); | ||||||
|  | 		 | ||||||
|  | 		include "lib/fuckhtml.php"; | ||||||
|  | 		$this->fuckhtml = new fuckhtml(); | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	public function getfilters($page){ | ||||||
|  | 		 | ||||||
|  | 		return [ | ||||||
|  | 			"nsfw" => [ | ||||||
|  | 				"display" => "NSFW", | ||||||
|  | 				"option" => [ | ||||||
|  | 					"yes" => "Yes", | ||||||
|  | 					"maybe" => "Maybe", | ||||||
|  | 					"no" => "No", | ||||||
|  | 				] | ||||||
|  | 			], | ||||||
|  | 			"sort" => [ | ||||||
|  | 				"display" => "Sort by", | ||||||
|  | 				"option" => [ | ||||||
|  | 					"relevance" => "Relevance", | ||||||
|  | 					"date-posted-desc" => "Newest uploads", | ||||||
|  | 					"date-posted-asc" => "Oldest uploads", | ||||||
|  | 					"date-taken-desc" => "Newest taken", | ||||||
|  | 					"date-taken-asc" => "Oldest taken", | ||||||
|  | 					"interestingness-desc" => "Interesting" | ||||||
|  | 				] | ||||||
|  | 			], | ||||||
|  | 			"color" => [ | ||||||
|  | 				"display" => "Color", | ||||||
|  | 				"option" => [ | ||||||
|  | 					"any" => "Any color", | ||||||
|  | 					// color_codes= | ||||||
|  | 					"0" => "Red", | ||||||
|  | 					"1" => "Brown", | ||||||
|  | 					"2" => "Orange", | ||||||
|  | 					"b" => "Pink", | ||||||
|  | 					"4" => "Yellow", | ||||||
|  | 					"3" => "Golden", | ||||||
|  | 					"5" => "Lime", | ||||||
|  | 					"6" => "Green", | ||||||
|  | 					"7" => "Sky blue", | ||||||
|  | 					"8" => "Blue", | ||||||
|  | 					"9" => "Purple", | ||||||
|  | 					"a" => "Hot pink", | ||||||
|  | 					"c" => "White", | ||||||
|  | 					"d" => "Gray", | ||||||
|  | 					"e" => "Black", | ||||||
|  | 					// styles= override | ||||||
|  | 					"blackandwhite" => "Black & white", | ||||||
|  | 				] | ||||||
|  | 			], | ||||||
|  | 			"style" => [ // styles= | ||||||
|  | 				"display" => "Style", | ||||||
|  | 				"option" => [ | ||||||
|  | 					"any" => "Any style", | ||||||
|  | 					"depthoffield" => "Depth of field", | ||||||
|  | 					"minimalism" => "Minimalism", | ||||||
|  | 					"pattern" => "Patterns" | ||||||
|  | 				] | ||||||
|  | 			], | ||||||
|  | 			"license" => [ | ||||||
|  | 				"display" => "License", | ||||||
|  | 				"option" => [ | ||||||
|  | 					"any" => "Any license", | ||||||
|  | 					"1,2,3,4,5,6,9,11,12,13,14,15,16" => "All creative commons", | ||||||
|  | 					"4,5,6,9,10,11,12,13" => "Commercial use allowed", | ||||||
|  | 					"1,2,4,5,9,10,11,12,14,15" => "Modifications allowed", | ||||||
|  | 					"4,5,9,10,11,12" => "Commercial use & mods allowed", | ||||||
|  | 					"7,9,10" => "No known copyright restrictions", | ||||||
|  | 					"8" => "U.S Government works" | ||||||
|  | 				] | ||||||
|  | 			] | ||||||
|  | 		]; | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	private function get($proxy, $url, $get = [], $reqtype){ | ||||||
|  | 		 | ||||||
|  | 		$curlproc = curl_init(); | ||||||
|  | 		 | ||||||
|  | 		if($get !== []){ | ||||||
|  | 			$get = http_build_query($get); | ||||||
|  | 			$url .= "?" . $get; | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_URL, $url); | ||||||
|  | 		 | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_ENCODING, ""); // default encoding | ||||||
|  | 		 | ||||||
|  | 		if($reqtype === flickr::req_web){ | ||||||
|  | 			 | ||||||
|  | 			curl_setopt($curlproc, CURLOPT_HTTPHEADER, | ||||||
|  | 				["User-Agent: " . config::USER_AGENT, | ||||||
|  | 				"Accept: text/html,application/xhtml+xml,application/xml;q=0.9,image/avif,image/webp,*/*;q=0.8", | ||||||
|  | 				"Accept-Language: en-US,en;q=0.5", | ||||||
|  | 				"Accept-Encoding: gzip", | ||||||
|  | 				"DNT: 1", | ||||||
|  | 				"Sec-GPC: 1", | ||||||
|  | 				"Connection: keep-alive", | ||||||
|  | 				"Upgrade-Insecure-Requests: 1", | ||||||
|  | 				"Sec-Fetch-Dest: document", | ||||||
|  | 				"Sec-Fetch-Mode: navigate", | ||||||
|  | 				"Sec-Fetch-Site: same-origin", | ||||||
|  | 				"Sec-Fetch-User: ?1", | ||||||
|  | 				"Priority: u=0, i", | ||||||
|  | 				"TE: trailers"] | ||||||
|  | 			); | ||||||
|  | 		}else{ | ||||||
|  | 			 | ||||||
|  | 			curl_setopt($curlproc, CURLOPT_HTTPHEADER, | ||||||
|  | 				["User-Agent: " . config::USER_AGENT, | ||||||
|  | 				"Accept: */*", | ||||||
|  | 				"Accept-Language: en-US,en;q=0.5", | ||||||
|  | 				"Accept-Encoding: gzip", | ||||||
|  | 				"Origin: https://www.flickr.com", | ||||||
|  | 				"DNT: 1", | ||||||
|  | 				"Sec-GPC: 1", | ||||||
|  | 				"Connection: keep-alive", | ||||||
|  | 				"Referer: https://www.flickr.com/", | ||||||
|  | 				// Cookie: | ||||||
|  | 				"Sec-Fetch-Dest: empty", | ||||||
|  | 				"Sec-Fetch-Mode: cors", | ||||||
|  | 				"Sec-Fetch-Site: same-site", | ||||||
|  | 				"TE: trailers"] | ||||||
|  | 			); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_RETURNTRANSFER, true); | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_SSL_VERIFYHOST, 2); | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_SSL_VERIFYPEER, true); | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_CONNECTTIMEOUT, 30); | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_TIMEOUT, 30); | ||||||
|  | 		 | ||||||
|  | 		// http2 bypass | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_HTTP_VERSION, CURL_HTTP_VERSION_2_0); | ||||||
|  | 		 | ||||||
|  | 		$this->backend->assign_proxy($curlproc, $proxy); | ||||||
|  | 		 | ||||||
|  | 		$data = curl_exec($curlproc); | ||||||
|  | 		 | ||||||
|  | 		if(curl_errno($curlproc)){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception(curl_error($curlproc)); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		curl_close($curlproc); | ||||||
|  | 		return $data; | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	public function image($get){ | ||||||
|  | 		 | ||||||
|  | 		if($get["npt"]){ | ||||||
|  | 			 | ||||||
|  | 			[$filters, $proxy] = | ||||||
|  | 				$this->backend->get( | ||||||
|  | 					$get["npt"], "images" | ||||||
|  | 				); | ||||||
|  | 			 | ||||||
|  | 			$filters = json_decode($filters, true); | ||||||
|  | 			 | ||||||
|  | 			// Workaround for the future, if flickr deprecates &page argument on html page | ||||||
|  | 			/* | ||||||
|  | 			try{ | ||||||
|  | 				 | ||||||
|  | 				$json = | ||||||
|  | 					$this->get( | ||||||
|  | 						$proxy, | ||||||
|  | 						"https://api.flickr.com/services/rest", | ||||||
|  | 						[ | ||||||
|  | 							"sort" => $data["sort"], | ||||||
|  | 							"parse_tags" => 1, | ||||||
|  | 							// url_s,url_n,url_w,url_m,url_z,url_c,url_l,url_h,url_k,url_3k,url_4k,url_5k,url_6k,url_o | ||||||
|  | 							"extras" => "can_comment,can_print,count_comments,count_faves,description,isfavorite,license,media,needs_interstitial,owner_name,path_alias,realname,rotation,url_sq,url_q,url_t,url_s,url_n,url_w,url_m,url_z,url_c,url_l", | ||||||
|  | 							"per_page" => 100, | ||||||
|  | 							"page" => $data["page"], | ||||||
|  | 							"lang" => "en-US", | ||||||
|  | 							"text" => $data["search"], | ||||||
|  | 							"viewerNSID" => "", | ||||||
|  | 							"method" => "flickr.photos.search", | ||||||
|  | 							"csrf" => "", | ||||||
|  | 							"api_key" => $data["api_key"], | ||||||
|  | 							"format" => "json", | ||||||
|  | 							"hermes" => 1, | ||||||
|  | 							"hermesClient" => 1, | ||||||
|  | 							"reqId" => $data["reqId"], | ||||||
|  | 							"nojsoncallback" => 1 | ||||||
|  | 						] | ||||||
|  | 					); | ||||||
|  | 			}catch(Exception $error){ | ||||||
|  | 				 | ||||||
|  | 				throw new Exception("Failed to fetch JSON"); | ||||||
|  | 			}*/ | ||||||
|  | 			 | ||||||
|  | 		}else{ | ||||||
|  | 			 | ||||||
|  | 			if(strlen($get["s"]) === 0){ | ||||||
|  | 				 | ||||||
|  | 				throw new Exception("Search term is empty!"); | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			$proxy = $this->backend->get_ip(); | ||||||
|  | 						 | ||||||
|  | 			// compute filters | ||||||
|  | 			$filters = [ | ||||||
|  | 				"page" => 1, | ||||||
|  | 				"sort" => $get["sort"] | ||||||
|  | 			]; | ||||||
|  | 			 | ||||||
|  | 			if($get["style"] != "any"){ | ||||||
|  | 				 | ||||||
|  | 				$filters["styles"] = $get["style"]; | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			if($get["color"] != "any"){ | ||||||
|  | 				 | ||||||
|  | 				if($get["color"] != "blackandwhite"){ | ||||||
|  | 					 | ||||||
|  | 					$filters["color_codes"] = $get["color"]; | ||||||
|  | 				}else{ | ||||||
|  | 					 | ||||||
|  | 					$filters["styles"] = "blackandwhite"; | ||||||
|  | 				} | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			if($get["license"] != "any"){ | ||||||
|  | 				 | ||||||
|  | 				$filters["license"] = $get["license"]; | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			switch($get["nsfw"]){ | ||||||
|  | 				 | ||||||
|  | 				case "yes": $filters["safe_search"] = 0; break; | ||||||
|  | 				case "maybe": $filters["safe_search"] = 2; break; | ||||||
|  | 				case "no": $filters["safe_search"] = 1; break; | ||||||
|  | 			} | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		$get_params = [ | ||||||
|  | 			"text" => $get["s"], | ||||||
|  | 			"per_page" => 50, | ||||||
|  | 			// scrape highest resolution | ||||||
|  | 			"extras" => "url_s,url_n,url_w,url_m,url_z,url_c,url_l,url_h,url_k,url_3k,url_4k,url_5k,url_6k,url_o", | ||||||
|  | 			"view_all" => 1 | ||||||
|  | 		]; | ||||||
|  | 		 | ||||||
|  | 		$get_params = array_merge($get_params, $filters); | ||||||
|  | 		 | ||||||
|  | 		$html = | ||||||
|  | 			$this->get( | ||||||
|  | 				$proxy, | ||||||
|  | 				"https://www.flickr.com/search/", | ||||||
|  | 				$get_params, | ||||||
|  | 				flickr::req_web | ||||||
|  | 			); | ||||||
|  | 		 | ||||||
|  | 		// @TODO | ||||||
|  | 		// get api_key and reqId, if flickr deprecates &page | ||||||
|  | 		 | ||||||
|  | 		$this->fuckhtml->load($html); | ||||||
|  | 		 | ||||||
|  | 		// | ||||||
|  | 		// get response JSON | ||||||
|  | 		// | ||||||
|  | 		$scripts = | ||||||
|  | 			$this->fuckhtml | ||||||
|  | 			->getElementsByClassName( | ||||||
|  | 				"modelExport", | ||||||
|  | 				"script" | ||||||
|  | 			); | ||||||
|  | 		 | ||||||
|  | 		$found = false; | ||||||
|  | 		foreach($scripts as $script){ | ||||||
|  | 			 | ||||||
|  | 			$json =	 | ||||||
|  | 				preg_split( | ||||||
|  | 					'/modelExport: ?/', | ||||||
|  | 					$script["innerHTML"], | ||||||
|  | 					2 | ||||||
|  | 				); | ||||||
|  | 			 | ||||||
|  | 			if(count($json) !== 0){ | ||||||
|  | 				 | ||||||
|  | 				$found = true; | ||||||
|  | 				$json = $json[1]; | ||||||
|  | 				break; | ||||||
|  | 			} | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		if($found === false){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("Failed to grep JSON"); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		$json = | ||||||
|  | 			json_decode( | ||||||
|  | 				$this->fuckhtml | ||||||
|  | 				->extract_json( | ||||||
|  | 					$json | ||||||
|  | 				), | ||||||
|  | 				true | ||||||
|  | 			); | ||||||
|  | 		 | ||||||
|  | 		if($json === null){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("Failed to decode JSON"); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		$out = [ | ||||||
|  | 			"status" => "ok", | ||||||
|  | 			"npt" => null, | ||||||
|  | 			"image" => [] | ||||||
|  | 		]; | ||||||
|  | 		 | ||||||
|  | 		if(!isset($json["main"]["search-photos-lite-models"][0]["data"]["photos"]["data"]["_data"])){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("Failed to access data object"); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		foreach($json["main"]["search-photos-lite-models"][0]["data"]["photos"]["data"]["_data"] as $image){ | ||||||
|  | 			 | ||||||
|  | 			if(!isset($image["data"])){ | ||||||
|  | 				 | ||||||
|  | 				// flickr likes to gives us empty array objects | ||||||
|  | 				continue; | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			$image = $image["data"]; | ||||||
|  | 			 | ||||||
|  | 			$title = []; | ||||||
|  | 			 | ||||||
|  | 			if(isset($image["title"])){ | ||||||
|  | 				 | ||||||
|  | 				$title[] = | ||||||
|  | 					$this->fuckhtml | ||||||
|  | 					->getTextContent( | ||||||
|  | 						$image["title"] | ||||||
|  | 					); | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			if(isset($image["description"])){ | ||||||
|  | 				 | ||||||
|  | 				$title[] = | ||||||
|  | 					$this->fuckhtml | ||||||
|  | 					->getTextContent( | ||||||
|  | 						str_replace( | ||||||
|  | 							"\n", | ||||||
|  | 							" ", | ||||||
|  | 							$image["description"] | ||||||
|  | 						) | ||||||
|  | 					); | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			$title = implode(": ", $title); | ||||||
|  | 			 | ||||||
|  | 			$sources = array_values($image["sizes"]["data"]); | ||||||
|  | 			 | ||||||
|  | 			$suitable_sizes = ["n", "m", "w", "s"]; | ||||||
|  | 			 | ||||||
|  | 			$thumb = &$sources[0]["data"]; | ||||||
|  | 			foreach($suitable_sizes as $testing_size){ | ||||||
|  | 				 | ||||||
|  | 				if(isset($image["sizes"]["data"][$testing_size])){ | ||||||
|  | 					 | ||||||
|  | 					$thumb = &$image["sizes"]["data"][$testing_size]["data"]; | ||||||
|  | 					break; | ||||||
|  | 				} | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			$og = &$sources[count($sources) - 1]["data"]; | ||||||
|  | 			 | ||||||
|  | 			$out["image"][] = [ | ||||||
|  | 				"title" => $title, | ||||||
|  | 				"source" => [ | ||||||
|  | 					[ | ||||||
|  | 						"url" => "https:" . $og["displayUrl"], | ||||||
|  | 						"width" => (int)$og["width"], | ||||||
|  | 						"height" => (int)$og["height"] | ||||||
|  | 					], | ||||||
|  | 					[ | ||||||
|  | 						"url" => "https:" . $thumb["displayUrl"], | ||||||
|  | 						"width" => (int)$thumb["width"], | ||||||
|  | 						"height" => (int)$thumb["height"] | ||||||
|  | 					] | ||||||
|  | 				], | ||||||
|  | 				"url" => "https://www.flickr.com/photos/" . $image["ownerNsid"] . "/" . $image["id"] . "/" | ||||||
|  | 			]; | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		$total_items = (int)$json["main"]["search-photos-lite-models"][0]["data"]["photos"]["data"]["totalItems"]; | ||||||
|  | 		 | ||||||
|  | 		if(($filters["page"]) * 50 < $total_items){ | ||||||
|  | 			 | ||||||
|  | 			$filters["page"]++; | ||||||
|  | 			 | ||||||
|  | 			$out["npt"] = | ||||||
|  | 				$this->backend->store( | ||||||
|  | 					json_encode($filters), | ||||||
|  | 					"images", | ||||||
|  | 					$proxy | ||||||
|  | 				); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		return $out; | ||||||
|  | 	} | ||||||
|  | } | ||||||
| @@ -136,7 +136,7 @@ class ftm{ | |||||||
| 				"source" => [ | 				"source" => [ | ||||||
| 					[ | 					[ | ||||||
| 						"url" => | 						"url" => | ||||||
| 							"https://findthatmeme.us-southeast-1.linodeobjects.com/" . | 							"https://s3.thehackerblog.com/findthatmeme/" . | ||||||
| 							$thumb, | 							$thumb, | ||||||
| 						"width" => null, | 						"width" => null, | ||||||
| 						"height" => null | 						"height" => null | ||||||
|   | |||||||
							
								
								
									
										4493
									
								
								scraper/google.php
									
									
									
									
									
								
							
							
						
						
									
										4493
									
								
								scraper/google.php
									
									
									
									
									
								
							
										
											
												File diff suppressed because it is too large
												Load Diff
											
										
									
								
							
							
								
								
									
										738
									
								
								scraper/google_api.php
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										738
									
								
								scraper/google_api.php
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,738 @@ | |||||||
|  | <?php | ||||||
|  |  | ||||||
|  | // @TODO check for consent.google.com page, if need be | ||||||
|  |  | ||||||
|  | class google_api{ | ||||||
|  | 	 | ||||||
|  | 	public function __construct(){ | ||||||
|  | 		 | ||||||
|  | 		include "lib/backend.php"; | ||||||
|  | 		$this->backend = new backend("google_api"); | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	public function getfilters($page){ | ||||||
|  | 		 | ||||||
|  | 		$base = [ | ||||||
|  | 			"country" => [ // gl=<country> (image: cr=countryAF) | ||||||
|  | 				"display" => "Country", | ||||||
|  | 				"option" => [ | ||||||
|  | 					"any" => "Instance's country", | ||||||
|  | 					"af" => "Afghanistan", | ||||||
|  | 					"al" => "Albania", | ||||||
|  | 					"dz" => "Algeria", | ||||||
|  | 					"as" => "American Samoa", | ||||||
|  | 					"ad" => "Andorra", | ||||||
|  | 					"ao" => "Angola", | ||||||
|  | 					"ai" => "Anguilla", | ||||||
|  | 					"aq" => "Antarctica", | ||||||
|  | 					"ag" => "Antigua and Barbuda", | ||||||
|  | 					"ar" => "Argentina", | ||||||
|  | 					"am" => "Armenia", | ||||||
|  | 					"aw" => "Aruba", | ||||||
|  | 					"au" => "Australia", | ||||||
|  | 					"at" => "Austria", | ||||||
|  | 					"az" => "Azerbaijan", | ||||||
|  | 					"bs" => "Bahamas", | ||||||
|  | 					"bh" => "Bahrain", | ||||||
|  | 					"bd" => "Bangladesh", | ||||||
|  | 					"bb" => "Barbados", | ||||||
|  | 					"by" => "Belarus", | ||||||
|  | 					"be" => "Belgium", | ||||||
|  | 					"bz" => "Belize", | ||||||
|  | 					"bj" => "Benin", | ||||||
|  | 					"bm" => "Bermuda", | ||||||
|  | 					"bt" => "Bhutan", | ||||||
|  | 					"bo" => "Bolivia", | ||||||
|  | 					"ba" => "Bosnia and Herzegovina", | ||||||
|  | 					"bw" => "Botswana", | ||||||
|  | 					"bv" => "Bouvet Island", | ||||||
|  | 					"br" => "Brazil", | ||||||
|  | 					"io" => "British Indian Ocean Territory", | ||||||
|  | 					"bn" => "Brunei Darussalam", | ||||||
|  | 					"bg" => "Bulgaria", | ||||||
|  | 					"bf" => "Burkina Faso", | ||||||
|  | 					"bi" => "Burundi", | ||||||
|  | 					"kh" => "Cambodia", | ||||||
|  | 					"cm" => "Cameroon", | ||||||
|  | 					"ca" => "Canada", | ||||||
|  | 					"cv" => "Cape Verde", | ||||||
|  | 					"ky" => "Cayman Islands", | ||||||
|  | 					"cf" => "Central African Republic", | ||||||
|  | 					"td" => "Chad", | ||||||
|  | 					"cl" => "Chile", | ||||||
|  | 					"cn" => "China", | ||||||
|  | 					"cx" => "Christmas Island", | ||||||
|  | 					"cc" => "Cocos (Keeling) Islands", | ||||||
|  | 					"co" => "Colombia", | ||||||
|  | 					"km" => "Comoros", | ||||||
|  | 					"cg" => "Congo", | ||||||
|  | 					"cd" => "Congo, the Democratic Republic", | ||||||
|  | 					"ck" => "Cook Islands", | ||||||
|  | 					"cr" => "Costa Rica", | ||||||
|  | 					"ci" => "Cote D'ivoire", | ||||||
|  | 					"hr" => "Croatia", | ||||||
|  | 					"cu" => "Cuba", | ||||||
|  | 					"cy" => "Cyprus", | ||||||
|  | 					"cz" => "Czech Republic", | ||||||
|  | 					"dk" => "Denmark", | ||||||
|  | 					"dj" => "Djibouti", | ||||||
|  | 					"dm" => "Dominica", | ||||||
|  | 					"do" => "Dominican Republic", | ||||||
|  | 					"ec" => "Ecuador", | ||||||
|  | 					"eg" => "Egypt", | ||||||
|  | 					"sv" => "El Salvador", | ||||||
|  | 					"gq" => "Equatorial Guinea", | ||||||
|  | 					"er" => "Eritrea", | ||||||
|  | 					"ee" => "Estonia", | ||||||
|  | 					"et" => "Ethiopia", | ||||||
|  | 					"fk" => "Falkland Islands (Malvinas)", | ||||||
|  | 					"fo" => "Faroe Islands", | ||||||
|  | 					"fj" => "Fiji", | ||||||
|  | 					"fi" => "Finland", | ||||||
|  | 					"fr" => "France", | ||||||
|  | 					"gf" => "French Guiana", | ||||||
|  | 					"pf" => "French Polynesia", | ||||||
|  | 					"tf" => "French Southern Territories", | ||||||
|  | 					"ga" => "Gabon", | ||||||
|  | 					"gm" => "Gambia", | ||||||
|  | 					"ge" => "Georgia", | ||||||
|  | 					"de" => "Germany", | ||||||
|  | 					"gh" => "Ghana", | ||||||
|  | 					"gi" => "Gibraltar", | ||||||
|  | 					"gr" => "Greece", | ||||||
|  | 					"gl" => "Greenland", | ||||||
|  | 					"gd" => "Grenada", | ||||||
|  | 					"gp" => "Guadeloupe", | ||||||
|  | 					"gu" => "Guam", | ||||||
|  | 					"gt" => "Guatemala", | ||||||
|  | 					"gn" => "Guinea", | ||||||
|  | 					"gw" => "Guinea-Bissau", | ||||||
|  | 					"gy" => "Guyana", | ||||||
|  | 					"ht" => "Haiti", | ||||||
|  | 					"hm" => "Heard Island and Mcdonald Islands", | ||||||
|  | 					"va" => "Holy See (Vatican City State)", | ||||||
|  | 					"hn" => "Honduras", | ||||||
|  | 					"hk" => "Hong Kong", | ||||||
|  | 					"hu" => "Hungary", | ||||||
|  | 					"is" => "Iceland", | ||||||
|  | 					"in" => "India", | ||||||
|  | 					"id" => "Indonesia", | ||||||
|  | 					"ir" => "Iran, Islamic Republic", | ||||||
|  | 					"iq" => "Iraq", | ||||||
|  | 					"ie" => "Ireland", | ||||||
|  | 					"il" => "Israel", | ||||||
|  | 					"it" => "Italy", | ||||||
|  | 					"jm" => "Jamaica", | ||||||
|  | 					"jp" => "Japan", | ||||||
|  | 					"jo" => "Jordan", | ||||||
|  | 					"kz" => "Kazakhstan", | ||||||
|  | 					"ke" => "Kenya", | ||||||
|  | 					"ki" => "Kiribati", | ||||||
|  | 					"kp" => "Korea, Democratic People's Republic", | ||||||
|  | 					"kr" => "Korea, Republic", | ||||||
|  | 					"kw" => "Kuwait", | ||||||
|  | 					"kg" => "Kyrgyzstan", | ||||||
|  | 					"la" => "Lao People's Democratic Republic", | ||||||
|  | 					"lv" => "Latvia", | ||||||
|  | 					"lb" => "Lebanon", | ||||||
|  | 					"ls" => "Lesotho", | ||||||
|  | 					"lr" => "Liberia", | ||||||
|  | 					"ly" => "Libyan Arab Jamahiriya", | ||||||
|  | 					"li" => "Liechtenstein", | ||||||
|  | 					"lt" => "Lithuania", | ||||||
|  | 					"lu" => "Luxembourg", | ||||||
|  | 					"mo" => "Macao", | ||||||
|  | 					"mk" => "Macedonia, the Former Yugosalv Republic", | ||||||
|  | 					"mg" => "Madagascar", | ||||||
|  | 					"mw" => "Malawi", | ||||||
|  | 					"my" => "Malaysia", | ||||||
|  | 					"mv" => "Maldives", | ||||||
|  | 					"ml" => "Mali", | ||||||
|  | 					"mt" => "Malta", | ||||||
|  | 					"mh" => "Marshall Islands", | ||||||
|  | 					"mq" => "Martinique", | ||||||
|  | 					"mr" => "Mauritania", | ||||||
|  | 					"mu" => "Mauritius", | ||||||
|  | 					"yt" => "Mayotte", | ||||||
|  | 					"mx" => "Mexico", | ||||||
|  | 					"fm" => "Micronesia, Federated States", | ||||||
|  | 					"md" => "Moldova, Republic", | ||||||
|  | 					"mc" => "Monaco", | ||||||
|  | 					"mn" => "Mongolia", | ||||||
|  | 					"ms" => "Montserrat", | ||||||
|  | 					"ma" => "Morocco", | ||||||
|  | 					"mz" => "Mozambique", | ||||||
|  | 					"mm" => "Myanmar", | ||||||
|  | 					"na" => "Namibia", | ||||||
|  | 					"nr" => "Nauru", | ||||||
|  | 					"np" => "Nepal", | ||||||
|  | 					"nl" => "Netherlands", | ||||||
|  | 					"an" => "Netherlands Antilles", | ||||||
|  | 					"nc" => "New Caledonia", | ||||||
|  | 					"nz" => "New Zealand", | ||||||
|  | 					"ni" => "Nicaragua", | ||||||
|  | 					"ne" => "Niger", | ||||||
|  | 					"ng" => "Nigeria", | ||||||
|  | 					"nu" => "Niue", | ||||||
|  | 					"nf" => "Norfolk Island", | ||||||
|  | 					"mp" => "Northern Mariana Islands", | ||||||
|  | 					"no" => "Norway", | ||||||
|  | 					"om" => "Oman", | ||||||
|  | 					"pk" => "Pakistan", | ||||||
|  | 					"pw" => "Palau", | ||||||
|  | 					"ps" => "Palestinian Territory, Occupied", | ||||||
|  | 					"pa" => "Panama", | ||||||
|  | 					"pg" => "Papua New Guinea", | ||||||
|  | 					"py" => "Paraguay", | ||||||
|  | 					"pe" => "Peru", | ||||||
|  | 					"ph" => "Philippines", | ||||||
|  | 					"pn" => "Pitcairn", | ||||||
|  | 					"pl" => "Poland", | ||||||
|  | 					"pt" => "Portugal", | ||||||
|  | 					"pr" => "Puerto Rico", | ||||||
|  | 					"qa" => "Qatar", | ||||||
|  | 					"re" => "Reunion", | ||||||
|  | 					"ro" => "Romania", | ||||||
|  | 					"ru" => "Russian Federation", | ||||||
|  | 					"rw" => "Rwanda", | ||||||
|  | 					"sh" => "Saint Helena", | ||||||
|  | 					"kn" => "Saint Kitts and Nevis", | ||||||
|  | 					"lc" => "Saint Lucia", | ||||||
|  | 					"pm" => "Saint Pierre and Miquelon", | ||||||
|  | 					"vc" => "Saint Vincent and the Grenadines", | ||||||
|  | 					"ws" => "Samoa", | ||||||
|  | 					"sm" => "San Marino", | ||||||
|  | 					"st" => "Sao Tome and Principe", | ||||||
|  | 					"sa" => "Saudi Arabia", | ||||||
|  | 					"sn" => "Senegal", | ||||||
|  | 					"cs" => "Serbia and Montenegro", | ||||||
|  | 					"sc" => "Seychelles", | ||||||
|  | 					"sl" => "Sierra Leone", | ||||||
|  | 					"sg" => "Singapore", | ||||||
|  | 					"sk" => "Slovakia", | ||||||
|  | 					"si" => "Slovenia", | ||||||
|  | 					"sb" => "Solomon Islands", | ||||||
|  | 					"so" => "Somalia", | ||||||
|  | 					"za" => "South Africa", | ||||||
|  | 					"gs" => "South Georgia and the South Sandwich Islands", | ||||||
|  | 					"es" => "Spain", | ||||||
|  | 					"lk" => "Sri Lanka", | ||||||
|  | 					"sd" => "Sudan", | ||||||
|  | 					"sr" => "Suriname", | ||||||
|  | 					"sj" => "Svalbard and Jan Mayen", | ||||||
|  | 					"sz" => "Swaziland", | ||||||
|  | 					"se" => "Sweden", | ||||||
|  | 					"ch" => "Switzerland", | ||||||
|  | 					"sy" => "Syrian Arab Republic", | ||||||
|  | 					"tw" => "Taiwan, Province of China", | ||||||
|  | 					"tj" => "Tajikistan", | ||||||
|  | 					"tz" => "Tanzania, United Republic", | ||||||
|  | 					"th" => "Thailand", | ||||||
|  | 					"tl" => "Timor-Leste", | ||||||
|  | 					"tg" => "Togo", | ||||||
|  | 					"tk" => "Tokelau", | ||||||
|  | 					"to" => "Tonga", | ||||||
|  | 					"tt" => "Trinidad and Tobago", | ||||||
|  | 					"tn" => "Tunisia", | ||||||
|  | 					"tr" => "Turkey", | ||||||
|  | 					"tm" => "Turkmenistan", | ||||||
|  | 					"tc" => "Turks and Caicos Islands", | ||||||
|  | 					"tv" => "Tuvalu", | ||||||
|  | 					"ug" => "Uganda", | ||||||
|  | 					"ua" => "Ukraine", | ||||||
|  | 					"ae" => "United Arab Emirates", | ||||||
|  | 					"uk" => "United Kingdom", | ||||||
|  | 					"us" => "United States", | ||||||
|  | 					"um" => "United States Minor Outlying Islands", | ||||||
|  | 					"uy" => "Uruguay", | ||||||
|  | 					"uz" => "Uzbekistan", | ||||||
|  | 					"vu" => "Vanuatu", | ||||||
|  | 					"ve" => "Venezuela", | ||||||
|  | 					"vn" => "Viet Nam", | ||||||
|  | 					"vg" => "Virgin Islands, British", | ||||||
|  | 					"vi" => "Virgin Islands, U.S.", | ||||||
|  | 					"wf" => "Wallis and Futuna", | ||||||
|  | 					"eh" => "Western Sahara", | ||||||
|  | 					"ye" => "Yemen", | ||||||
|  | 					"zm" => "Zambia", | ||||||
|  | 					"zw" => "Zimbabwe" | ||||||
|  | 				] | ||||||
|  | 			], | ||||||
|  | 			"nsfw" => [ | ||||||
|  | 				"display" => "NSFW", | ||||||
|  | 				"option" => [ | ||||||
|  | 					"yes" => "Yes", // safe=active | ||||||
|  | 					"no" => "No" // safe=off | ||||||
|  | 				] | ||||||
|  | 			] | ||||||
|  | 		]; | ||||||
|  | 		 | ||||||
|  | 		switch($page){ | ||||||
|  | 			 | ||||||
|  | 			case "web": | ||||||
|  | 				return array_merge( | ||||||
|  | 					$base, | ||||||
|  | 					[ | ||||||
|  | 						"lang" => [ // lr=<lang> (prefix lang with "lang_") | ||||||
|  | 							"display" => "Language", | ||||||
|  | 							"option" => [ | ||||||
|  | 								"any" => "Any language", | ||||||
|  | 								"ar" => "Arabic", | ||||||
|  | 								"bg" => "Bulgarian", | ||||||
|  | 								"ca" => "Catalan", | ||||||
|  | 								"cs" => "Czech", | ||||||
|  | 								"da" => "Danish", | ||||||
|  | 								"de" => "German", | ||||||
|  | 								"el" => "Greek", | ||||||
|  | 								"en" => "English", | ||||||
|  | 								"es" => "Spanish", | ||||||
|  | 								"et" => "Estonian", | ||||||
|  | 								"fi" => "Finnish", | ||||||
|  | 								"fr" => "French", | ||||||
|  | 								"hr" => "Croatian", | ||||||
|  | 								"hu" => "Hungarian", | ||||||
|  | 								"id" => "Indonesian", | ||||||
|  | 								"is" => "Icelandic", | ||||||
|  | 								"it" => "Italian", | ||||||
|  | 								"iw" => "Hebrew", | ||||||
|  | 								"ja" => "Japanese", | ||||||
|  | 								"ko" => "Korean", | ||||||
|  | 								"lt" => "Lithuanian", | ||||||
|  | 								"lv" => "Latvian", | ||||||
|  | 								"nl" => "Dutch", | ||||||
|  | 								"no" => "Norwegian", | ||||||
|  | 								"pl" => "Polish", | ||||||
|  | 								"pt" => "Portuguese", | ||||||
|  | 								"ro" => "Romanian", | ||||||
|  | 								"ru" => "Russian", | ||||||
|  | 								"sk" => "Slovak", | ||||||
|  | 								"sl" => "Slovenian", | ||||||
|  | 								"sr" => "Serbian", | ||||||
|  | 								"sv" => "Swedish", | ||||||
|  | 								"tr" => "Turkish", | ||||||
|  | 								"zh-CN" => "Chinese (Simplified)", | ||||||
|  | 								"zh-TW" => "Chinese (Traditional)" | ||||||
|  | 							] | ||||||
|  | 						], | ||||||
|  | 						"sort" => [ | ||||||
|  | 							"display" => "Sort by", | ||||||
|  | 							"option" => [ | ||||||
|  | 								"any" => "Any order", | ||||||
|  | 								"date:d" => "Oldest", | ||||||
|  | 								"date:a" => "Newest" | ||||||
|  | 							] | ||||||
|  | 						], | ||||||
|  | 						"newer" => [ | ||||||
|  | 							"display" => "Newer than", | ||||||
|  | 							"option" => "_DATE" | ||||||
|  | 						], | ||||||
|  | 						"rm_dupes" => [ | ||||||
|  | 							"display" => "Remove duplicates", | ||||||
|  | 							"option" => [ | ||||||
|  | 								"yes" => "Yes", | ||||||
|  | 								"no" => "No" | ||||||
|  | 							] | ||||||
|  | 						] | ||||||
|  | 					] | ||||||
|  | 				); | ||||||
|  | 				break; | ||||||
|  | 			/* | ||||||
|  | 			case "images": | ||||||
|  | 				return array_merge( | ||||||
|  | 					$base, | ||||||
|  | 					[ | ||||||
|  | 						"time" => [ // tbs=qdr:<time> | ||||||
|  | 							"display" => "Time posted", | ||||||
|  | 							"option" => [ | ||||||
|  | 								"any" => "Any time", | ||||||
|  | 								"d" => "Past 24 hours", | ||||||
|  | 								"w" => "Past week", | ||||||
|  | 								"m" => "Past month", | ||||||
|  | 								"y" => "Past year" | ||||||
|  | 							] | ||||||
|  | 						], | ||||||
|  | 						"size" => [ // imgsz | ||||||
|  | 							"display" => "Size", | ||||||
|  | 							"option" => [ | ||||||
|  | 								"any" => "Any size", | ||||||
|  | 								"l" => "Large", | ||||||
|  | 								"m" => "Medium", | ||||||
|  | 								"i" => "Icon", | ||||||
|  | 								"qsvga" => "Larger than 400x300", | ||||||
|  | 								"vga" => "Larger than 640x480", | ||||||
|  | 								"svga" => "Larger than 800x600", | ||||||
|  | 								"xga" => "Larger than 1024x768", | ||||||
|  | 								"2mp" => "Larger than 2MP", | ||||||
|  | 								"4mp" => "Larger than 4MP", | ||||||
|  | 								"6mp" => "Larger than 6MP", | ||||||
|  | 								"8mp" => "Larger than 8MP", | ||||||
|  | 								"10mp" => "Larger than 10MP", | ||||||
|  | 								"12mp" => "Larger than 12MP", | ||||||
|  | 								"15mp" => "Larger than 15MP", | ||||||
|  | 								"20mp" => "Larger than 20MP", | ||||||
|  | 								"40mp" => "Larger than 40MP", | ||||||
|  | 								"70mp" => "Larger than 70MP" | ||||||
|  | 							] | ||||||
|  | 						], | ||||||
|  | 						"ratio" => [ // imgar | ||||||
|  | 							"display" => "Aspect ratio", | ||||||
|  | 							"option" => [ | ||||||
|  | 								"any" => "Any ratio", | ||||||
|  | 								"t|xt" => "Tall", | ||||||
|  | 								"s" => "Square", | ||||||
|  | 								"w" => "Wide", | ||||||
|  | 								"xw" => "Panoramic" | ||||||
|  | 							] | ||||||
|  | 						], | ||||||
|  | 						"color" => [ // imgc | ||||||
|  | 							"display" => "Color", | ||||||
|  | 							"option" => [ | ||||||
|  | 								"any" => "Any color", | ||||||
|  | 								"color" => "Full color", | ||||||
|  | 								"bnw" => "Black & white", | ||||||
|  | 								"trans" => "Transparent", | ||||||
|  | 								// from here, imgcolor | ||||||
|  | 								"red" => "Red", | ||||||
|  | 								"orange" => "Orange", | ||||||
|  | 								"yellow" => "Yellow", | ||||||
|  | 								"green" => "Green", | ||||||
|  | 								"teal" => "Teal", | ||||||
|  | 								"blue" => "Blue", | ||||||
|  | 								"purple" => "Purple", | ||||||
|  | 								"pink" => "Pink", | ||||||
|  | 								"white" => "White", | ||||||
|  | 								"gray" => "Gray", | ||||||
|  | 								"black" => "Black", | ||||||
|  | 								"brown" => "Brown" | ||||||
|  | 							] | ||||||
|  | 						], | ||||||
|  | 						"type" => [ // tbs=itp:<type> | ||||||
|  | 							"display" => "Type", | ||||||
|  | 							"option" => [ | ||||||
|  | 								"any" => "Any type", | ||||||
|  | 								"clipart" => "Clip Art", | ||||||
|  | 								"lineart" => "Line Drawing", | ||||||
|  | 								"animated" => "Animated" | ||||||
|  | 							] | ||||||
|  | 						], | ||||||
|  | 						"format" => [ // as_filetype | ||||||
|  | 							"display" => "Format", | ||||||
|  | 							"option" => [ | ||||||
|  | 								"any" => "Any format", | ||||||
|  | 								"jpg" => "JPG", | ||||||
|  | 								"gif" => "GIF", | ||||||
|  | 								"png" => "PNG", | ||||||
|  | 								"bmp" => "BMP", | ||||||
|  | 								"svg" => "SVG", | ||||||
|  | 								"webp" => "WEBP", | ||||||
|  | 								"ico" => "ICO", | ||||||
|  | 								"craw" => "RAW" | ||||||
|  | 							] | ||||||
|  | 						], | ||||||
|  | 						"rights" => [ // tbs=sur:<rights> | ||||||
|  | 							"display" => "Usage rights", | ||||||
|  | 							"option" => [ | ||||||
|  | 								"any" => "Any license", | ||||||
|  | 								"cl" => "Creative Commons licenses", | ||||||
|  | 								"ol" => "Commercial & other licenses" | ||||||
|  | 							] | ||||||
|  | 						] | ||||||
|  | 					] | ||||||
|  | 				); | ||||||
|  | 				break;*/ | ||||||
|  | 		} | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	private function get($proxy, $url, $get = []){ | ||||||
|  | 		 | ||||||
|  | 		$curlproc = curl_init(); | ||||||
|  | 			 | ||||||
|  | 		$headers = [ | ||||||
|  | 			"Accept: application/json", | ||||||
|  | 			"Accept-Encoding: gzip" | ||||||
|  | 		]; | ||||||
|  | 		 | ||||||
|  | 		if($get !== []){ | ||||||
|  | 			$get = http_build_query($get); | ||||||
|  | 			$url .= "?" . $get; | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_URL, $url); | ||||||
|  | 		 | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_ENCODING, ""); // default encoding | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_HTTPHEADER, $headers); | ||||||
|  | 		 | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_RETURNTRANSFER, true); | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_SSL_VERIFYHOST, 2); | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_SSL_VERIFYPEER, true); | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_CONNECTTIMEOUT, 30); | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_TIMEOUT, 30); | ||||||
|  | 		 | ||||||
|  | 		// follow redirects | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_FOLLOWLOCATION, true); | ||||||
|  |  | ||||||
|  | 		$this->backend->assign_proxy($curlproc, $proxy); | ||||||
|  | 		 | ||||||
|  | 		$data = curl_exec($curlproc); | ||||||
|  | 		 | ||||||
|  | 		if(curl_errno($curlproc)){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception(curl_error($curlproc)); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		curl_close($curlproc); | ||||||
|  | 		 | ||||||
|  | 		return $data; | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	public function web($get){ | ||||||
|  | 		 | ||||||
|  | 		// rotate proxy + key on EVERY request | ||||||
|  | 		$keydata = $this->backend->get_key(); | ||||||
|  | 		$proxy = $this->backend->get_ip($keydata["increment"]); | ||||||
|  | 		 | ||||||
|  | 		if($get["npt"]){ | ||||||
|  | 			 | ||||||
|  | 			// $p is never used | ||||||
|  | 			[$params, $p] = $this->backend->get( | ||||||
|  | 				$get["npt"], | ||||||
|  | 				"web" | ||||||
|  | 			); | ||||||
|  | 			 | ||||||
|  | 			$params = json_decode($params, true); | ||||||
|  | 			 | ||||||
|  | 			$params["key"] = $keydata["key"]; | ||||||
|  | 			 | ||||||
|  | 		}else{ | ||||||
|  | 			 | ||||||
|  | 			//$json = file_get_contents("scraper/google.json"); | ||||||
|  | 			$params = [ | ||||||
|  | 				"q" => $get["s"], | ||||||
|  | 				"cx" => config::GOOGLE_CX_ENDPOINT, | ||||||
|  | 				"num" => 10, | ||||||
|  | 				"start" => 1, | ||||||
|  | 				"key" => $keydata["key"] | ||||||
|  | 			]; | ||||||
|  | 			 | ||||||
|  | 			// | ||||||
|  | 			// parse filters | ||||||
|  | 			// | ||||||
|  | 			if($get["newer"] !== false){ | ||||||
|  | 				 | ||||||
|  | 				$params["dateRestrict"] = "d" . (round((time() - $get["newer"]) / 100000)); | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			if($get["rm_dupes"] == "no"){ $params["filter"] = "0"; } | ||||||
|  | 			if($get["country"] != "any"){ $params["gl"] = $get["country"]; } | ||||||
|  | 			if($get["lang"] != "any"){ $params["lr"] = "lang_" . $get["lang"]; } | ||||||
|  | 			 | ||||||
|  | 			if($get["nsfw"] == "yes"){ | ||||||
|  | 				 | ||||||
|  | 				$params["safe"] = "off"; | ||||||
|  | 			}else{ | ||||||
|  | 				 | ||||||
|  | 				$params["safe"] = "active"; | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			if($get["sort"] != "any"){ $params["sort"] = $get["sort"]; } | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		try{ | ||||||
|  | 			$json = | ||||||
|  | 				$this->get( | ||||||
|  | 					$proxy, | ||||||
|  | 					"https://www.googleapis.com/customsearch/v1", | ||||||
|  | 					$params | ||||||
|  | 				); | ||||||
|  | 		}catch(Exception $error){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("Failed to fetch JSON"); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		$json = json_decode($json, true); | ||||||
|  | 		 | ||||||
|  | 		if($json === null){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("Failed to decode JSON"); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		$out = [ | ||||||
|  | 			"status" => "ok", | ||||||
|  | 			"spelling" => [ | ||||||
|  | 				"type" => "no_correction", | ||||||
|  | 				"using" => null, | ||||||
|  | 				"correction" => null | ||||||
|  | 			], | ||||||
|  | 			"npt" => null, | ||||||
|  | 			"answer" => [], | ||||||
|  | 			"web" => [], | ||||||
|  | 			"image" => [], | ||||||
|  | 			"video" => [], | ||||||
|  | 			"news" => [], | ||||||
|  | 			"related" => [] | ||||||
|  | 		]; | ||||||
|  | 		 | ||||||
|  | 		if(isset($json["error"]["message"])){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception( | ||||||
|  | 				"API returned an error: " . | ||||||
|  | 				$json["error"]["message"] . | ||||||
|  | 				" (key #" . $keydata["increment"] . ")" | ||||||
|  | 			); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		if(!isset($json["items"])){ | ||||||
|  | 			 | ||||||
|  | 			// google just doesnt return items when theres no results | ||||||
|  | 			return $out; | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		foreach($json["items"] as $result){ | ||||||
|  | 			 | ||||||
|  | 			// | ||||||
|  | 			// probe for thumbnail | ||||||
|  | 			// | ||||||
|  | 			$probes = [ | ||||||
|  | 				isset($result["pagemap"]["cse_thumbnail"][0]["src"]) ? $result["pagemap"]["cse_thumbnail"][0]["src"] : null, | ||||||
|  | 				isset($result["pagemap"]["cse_image"][0]["src"]) ? $result["pagemap"]["cse_image"][0]["src"] : null, | ||||||
|  | 				isset($result["pagemap"]["metatags"][0]["twitter:image"]) ? $result["pagemap"]["metatags"][0]["twitter:image"] : null, | ||||||
|  | 				isset($result["pagemap"]["metatags"][0]["og:image"]) ? $result["pagemap"]["metatags"][0]["og:image"] : null | ||||||
|  | 			]; | ||||||
|  | 			 | ||||||
|  | 			$thumb = [ | ||||||
|  | 				"url" => null, | ||||||
|  | 				"ratio" => null | ||||||
|  | 			]; | ||||||
|  | 			 | ||||||
|  | 			foreach($probes as $probe){ | ||||||
|  | 				 | ||||||
|  | 				if($probe !== null){ | ||||||
|  | 				 | ||||||
|  | 					$thumb = [ | ||||||
|  | 						"url" => $probe, | ||||||
|  | 						"ratio" => "16:9" | ||||||
|  | 					]; | ||||||
|  | 					break; | ||||||
|  | 				} | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			// | ||||||
|  | 			// probe for page format | ||||||
|  | 			// | ||||||
|  | 			$mime = "web"; | ||||||
|  | 			if(isset($result["mime"])){ | ||||||
|  | 				 | ||||||
|  | 				$result["mime"] = | ||||||
|  | 					explode( | ||||||
|  | 						"/", | ||||||
|  | 						$result["mime"], | ||||||
|  | 						2 | ||||||
|  | 					); | ||||||
|  | 				 | ||||||
|  | 				if(count($result["mime"]) === 2){ | ||||||
|  | 					 | ||||||
|  | 					$mime = strtoupper($result["mime"][1]); | ||||||
|  | 				} | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			$description = $result["snippet"]; | ||||||
|  | 			 | ||||||
|  | 			// | ||||||
|  | 			// Get date | ||||||
|  | 			// | ||||||
|  | 			$description_split = | ||||||
|  | 				explode( | ||||||
|  | 					"...", $description, 2 | ||||||
|  | 				); | ||||||
|  | 			 | ||||||
|  | 			if(count($description_split) === 1){ | ||||||
|  | 				 | ||||||
|  | 				$description = $result["snippet"]; | ||||||
|  | 			}elseif(strlen($description_split[0]) < 17){ | ||||||
|  | 				 | ||||||
|  | 				$date = trim($description_split[0]); | ||||||
|  | 				$date_probe = strtotime($date); | ||||||
|  | 				 | ||||||
|  | 				if($date_probe !== false){ | ||||||
|  | 					 | ||||||
|  | 					$description = $description_split[1]; | ||||||
|  | 				}else{ | ||||||
|  | 					 | ||||||
|  | 					// | ||||||
|  | 					// fallback to getting date from meta tags | ||||||
|  | 					// | ||||||
|  | 					if(isset($result["pagemap"]["metatags"][0]["creationdate"])){ | ||||||
|  | 						 | ||||||
|  | 						$date = $result["pagemap"]["metatags"][0]["creationdate"]; | ||||||
|  | 						 | ||||||
|  | 					}elseif(isset($result["pagemap"]["metatags"][0]["moddate"])){ | ||||||
|  | 						 | ||||||
|  | 						$date = $result["pagemap"]["metatags"][0]["moddate"]; | ||||||
|  | 					}else{ | ||||||
|  | 						 | ||||||
|  | 						$date = null; | ||||||
|  | 					} | ||||||
|  | 					 | ||||||
|  | 					$description = $result["snippet"]; | ||||||
|  | 				} | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			if($date !== null){ | ||||||
|  | 				 | ||||||
|  | 				$date = | ||||||
|  | 					strtotime( | ||||||
|  | 						trim( | ||||||
|  | 							str_replace( | ||||||
|  | 								["D:", "'"], | ||||||
|  | 								"", | ||||||
|  | 								$date | ||||||
|  | 							) | ||||||
|  | 						) | ||||||
|  | 					); | ||||||
|  | 				 | ||||||
|  | 				if($date === false){ | ||||||
|  | 					 | ||||||
|  | 					$date = null; | ||||||
|  | 				} | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			$out["web"][] = [ | ||||||
|  | 				"title" => | ||||||
|  | 					$this->titledots( | ||||||
|  | 						$result["title"] | ||||||
|  | 					), | ||||||
|  | 				"description" => | ||||||
|  | 					$this->titledots( | ||||||
|  | 						$description | ||||||
|  | 					), | ||||||
|  | 				"url" => $result["link"], | ||||||
|  | 				"date" => $date, | ||||||
|  | 				"type" => $mime, | ||||||
|  | 				"thumb" => $thumb, | ||||||
|  | 				"sublink" => [], | ||||||
|  | 				"table" => [] | ||||||
|  | 			]; | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		// get npt | ||||||
|  | 		if(isset($json["queries"]["nextPage"][0]["startIndex"])){ | ||||||
|  | 			 | ||||||
|  | 			unset($params["key"]); | ||||||
|  | 			$params["start"] = (int)$json["queries"]["nextPage"][0]["startIndex"]; | ||||||
|  | 			 | ||||||
|  | 			$out["npt"] = | ||||||
|  | 				$this->backend->store( | ||||||
|  | 					json_encode($params), | ||||||
|  | 					"web", | ||||||
|  | 					$proxy | ||||||
|  | 				); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		return $out; | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	private function titledots($title){ | ||||||
|  | 		 | ||||||
|  | 		return trim($title, " .\t\n\r\0\x0B…"); | ||||||
|  | 	} | ||||||
|  | } | ||||||
| @@ -1,4 +1,6 @@ | |||||||
| <?php | <?php | ||||||
|  | // greppr dev probably monitors 4get code, lol | ||||||
|  | // hello greppr dude, add an API you moron | ||||||
|  |  | ||||||
| class greppr{ | class greppr{ | ||||||
| 	 | 	 | ||||||
| @@ -16,20 +18,30 @@ class greppr{ | |||||||
| 		return []; | 		return []; | ||||||
| 	} | 	} | ||||||
| 	 | 	 | ||||||
| 	private function get($proxy, $url, $get = [], $cookie = false){ | 	private function get($proxy, $url, $get = [], $cookies = [], $post = false){ | ||||||
| 		 | 		 | ||||||
| 		$curlproc = curl_init(); | 		$curlproc = curl_init(); | ||||||
| 		 | 		 | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_URL, $url); | ||||||
|  | 		 | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_ENCODING, ""); // default encoding | ||||||
|  | 		 | ||||||
|  | 		$cookie = []; | ||||||
|  | 		foreach($cookies as $k => $v){ | ||||||
|  | 			 | ||||||
|  | 			$cookie[] = "{$k}={$v}"; | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		$cookie = implode("; ", $cookie); | ||||||
|  | 		 | ||||||
|  | 		if($post === false){ | ||||||
|  | 						 | ||||||
| 			if($get !== []){ | 			if($get !== []){ | ||||||
| 				$get = http_build_query($get); | 				$get = http_build_query($get); | ||||||
| 				$url .= "?" . $get; | 				$url .= "?" . $get; | ||||||
| 			} | 			} | ||||||
| 			 | 			 | ||||||
| 		curl_setopt($curlproc, CURLOPT_URL, $url); | 			if($cookie == ""){ | ||||||
| 		 |  | ||||||
| 		curl_setopt($curlproc, CURLOPT_ENCODING, ""); // default encoding |  | ||||||
| 		 |  | ||||||
| 		if($cookie === false){ |  | ||||||
| 				 | 				 | ||||||
| 				curl_setopt($curlproc, CURLOPT_HTTPHEADER, | 				curl_setopt($curlproc, CURLOPT_HTTPHEADER, | ||||||
| 					["User-Agent: " . config::USER_AGENT, | 					["User-Agent: " . config::USER_AGENT, | ||||||
| @@ -48,17 +60,48 @@ class greppr{ | |||||||
| 				 | 				 | ||||||
| 				curl_setopt($curlproc, CURLOPT_HTTPHEADER, | 				curl_setopt($curlproc, CURLOPT_HTTPHEADER, | ||||||
| 					["User-Agent: " . config::USER_AGENT, | 					["User-Agent: " . config::USER_AGENT, | ||||||
| 				"Accept: text/html,application/xhtml+xml,application/xml;q=0.9,image/avif,image/webp,*/*;q=0.8", | 					"Accept: text/html,application/xhtml+xml,application/xml;q=0.9,*/*;q=0.8", | ||||||
| 					"Accept-Language: en-US,en;q=0.5", | 					"Accept-Language: en-US,en;q=0.5", | ||||||
| 				"Accept-Encoding: gzip", | 					"Accept-Encoding: gzip, deflate, br, zstd", | ||||||
| 				"Cookie: PHPSESSID=" . $cookie, |  | ||||||
| 					"DNT: 1", | 					"DNT: 1", | ||||||
|  | 					"Sec-GPC: 1", | ||||||
| 					"Connection: keep-alive", | 					"Connection: keep-alive", | ||||||
|  | 					"Referer: https://greppr.org/search", | ||||||
|  | 					"Cookie: {$cookie}", | ||||||
| 					"Upgrade-Insecure-Requests: 1", | 					"Upgrade-Insecure-Requests: 1", | ||||||
| 					"Sec-Fetch-Dest: document", | 					"Sec-Fetch-Dest: document", | ||||||
| 					"Sec-Fetch-Mode: navigate", | 					"Sec-Fetch-Mode: navigate", | ||||||
| 				"Sec-Fetch-Site: none", | 					"Sec-Fetch-Site: same-origin", | ||||||
| 				"Sec-Fetch-User: ?1"] | 					"Sec-Fetch-User: ?1", | ||||||
|  | 					"Priority: u=0, i"] | ||||||
|  | 				); | ||||||
|  | 			} | ||||||
|  | 		}else{ | ||||||
|  | 			 | ||||||
|  | 			$get = http_build_query($get); | ||||||
|  | 			 | ||||||
|  | 			curl_setopt($curlproc, CURLOPT_POST, true); | ||||||
|  | 			curl_setopt($curlproc, CURLOPT_POSTFIELDS, $get); | ||||||
|  | 			 | ||||||
|  | 			curl_setopt($curlproc, CURLOPT_HTTPHEADER, | ||||||
|  | 				["User-Agent: " . config::USER_AGENT, | ||||||
|  | 				"Accept: text/html,application/xhtml+xml,application/xml;q=0.9,*/*;q=0.8", | ||||||
|  | 				"Accept-Language: en-US,en;q=0.5", | ||||||
|  | 				"Accept-Encoding: gzip, deflate, br, zstd", | ||||||
|  | 				"Content-Type: application/x-www-form-urlencoded", | ||||||
|  | 				"Content-Length: " . strlen($get), | ||||||
|  | 				"Origin: https://greppr.org", | ||||||
|  | 				"DNT: 1", | ||||||
|  | 				"Sec-GPC: 1", | ||||||
|  | 				"Connection: keep-alive", | ||||||
|  | 				"Referer: https://greppr.org/", | ||||||
|  | 				"Cookie: {$cookie}", | ||||||
|  | 				"Upgrade-Insecure-Requests: 1", | ||||||
|  | 				"Sec-Fetch-Dest: document", | ||||||
|  | 				"Sec-Fetch-Mode: navigate", | ||||||
|  | 				"Sec-Fetch-Site: same-origin", | ||||||
|  | 				"Sec-Fetch-User: ?1", | ||||||
|  | 				"Priority: u=0, i"] | ||||||
| 			); | 			); | ||||||
| 		} | 		} | ||||||
| 		 | 		 | ||||||
| @@ -86,7 +129,7 @@ class greppr{ | |||||||
| 					return $len; | 					return $len; | ||||||
| 				} | 				} | ||||||
| 				 | 				 | ||||||
| 				$headers[strtolower(trim($header[0]))] = trim($header[1]); | 				$headers[strtolower(trim($header[0]))][] = trim($header[1]); | ||||||
|  |  | ||||||
| 				return $len; | 				return $len; | ||||||
| 			} | 			} | ||||||
| @@ -113,7 +156,24 @@ class greppr{ | |||||||
| 			 | 			 | ||||||
| 			[$q, $proxy] = $this->backend->get($get["npt"], "web"); | 			[$q, $proxy] = $this->backend->get($get["npt"], "web"); | ||||||
| 			 | 			 | ||||||
| 			$q = json_decode($q, true); | 			$tokens = json_decode($q, true); | ||||||
|  | 			 | ||||||
|  | 			// | ||||||
|  | 			// Get paginated page | ||||||
|  | 			// | ||||||
|  | 			try{ | ||||||
|  | 			 | ||||||
|  | 				$html = $this->get( | ||||||
|  | 					$proxy, | ||||||
|  | 					"https://greppr.org" . $tokens["get"], | ||||||
|  | 					[], | ||||||
|  | 					$tokens["cookies"], | ||||||
|  | 					false | ||||||
|  | 				); | ||||||
|  | 			}catch(Exception $error){ | ||||||
|  | 				 | ||||||
|  | 				throw new Exception("Failed to fetch search page"); | ||||||
|  | 			} | ||||||
| 			 | 			 | ||||||
| 		}else{ | 		}else{ | ||||||
| 			 | 			 | ||||||
| @@ -124,88 +184,121 @@ class greppr{ | |||||||
| 			} | 			} | ||||||
| 			 | 			 | ||||||
| 			$proxy = $this->backend->get_ip(); | 			$proxy = $this->backend->get_ip(); | ||||||
| 		} |  | ||||||
| 			 | 			 | ||||||
|  | 			// | ||||||
| 			// get token | 			// get token | ||||||
| 		// token[0] = static token that changes once a day | 			// | ||||||
| 		// token[1] = dynamic token that changes on every request |  | ||||||
| 		// token[1] = PHPSESSID cookie |  | ||||||
| 		$tokens = apcu_fetch("greppr_token"); |  | ||||||
| 		 |  | ||||||
| 		if( |  | ||||||
| 			$tokens === false || |  | ||||||
| 			$first_attempt === false // force token fetch |  | ||||||
| 		){ |  | ||||||
| 			 |  | ||||||
| 			// we haven't gotten the token yet, get it |  | ||||||
| 			try{ | 			try{ | ||||||
| 				 | 				 | ||||||
| 				$response = | 				$html = | ||||||
| 					$this->get( | 					$this->get( | ||||||
| 						$proxy, | 						$proxy, | ||||||
| 						"https://greppr.org", | 						"https://greppr.org", | ||||||
| 						[] | 						[], | ||||||
|  | 						[], | ||||||
|  | 						false | ||||||
| 					); | 					); | ||||||
| 			}catch(Exception $error){ | 			}catch(Exception $error){ | ||||||
| 				 | 				 | ||||||
| 				throw new Exception("Failed to fetch search tokens"); | 				throw new Exception("Failed to fetch homepage"); | ||||||
| 			} | 			} | ||||||
| 			 | 			 | ||||||
| 			$tokens = $this->parse_token($response); | 			// | ||||||
|  | 			// Parse token | ||||||
|  | 			// | ||||||
|  | 			$this->fuckhtml->load($html["data"]); | ||||||
| 		 | 		 | ||||||
| 			if($tokens === false){ | 			$tokens = [ | ||||||
|  | 				"req" => null, | ||||||
|  | 				"data" => null, | ||||||
|  | 				"cookies" => null | ||||||
|  | 			]; | ||||||
| 			 | 			 | ||||||
| 				throw new Exception("Failed to grep search tokens"); | 			$inputs = | ||||||
|  | 				$this->fuckhtml | ||||||
|  | 				->getElementsByTagName( | ||||||
|  | 					"input" | ||||||
|  | 				); | ||||||
|  | 				 | ||||||
|  | 			foreach($inputs as $input){ | ||||||
|  | 				 | ||||||
|  | 				if(!isset($input["attributes"]["name"])){ | ||||||
|  | 					 | ||||||
|  | 					continue; | ||||||
|  | 				} | ||||||
|  | 				 | ||||||
|  | 				if( | ||||||
|  | 					isset($input["attributes"]["value"]) && | ||||||
|  | 					!empty($input["attributes"]["value"]) | ||||||
|  | 				){ | ||||||
|  | 					 | ||||||
|  | 					$tokens | ||||||
|  | 						["data"] | ||||||
|  | 						[$this->fuckhtml | ||||||
|  | 						->getTextContent( | ||||||
|  | 							$input["attributes"]["name"] | ||||||
|  | 						)] = | ||||||
|  | 						$this->fuckhtml | ||||||
|  | 						->getTextContent( | ||||||
|  | 							$input["attributes"]["value"] | ||||||
|  | 						); | ||||||
|  | 				}else{ | ||||||
|  | 					 | ||||||
|  | 					$tokens["req"] = | ||||||
|  | 						$this->fuckhtml | ||||||
|  | 						->getTextContent( | ||||||
|  | 							$input["attributes"]["name"] | ||||||
|  | 						); | ||||||
| 				} | 				} | ||||||
| 			} | 			} | ||||||
| 			 | 			 | ||||||
|  | 			if($tokens["req"] === null){ | ||||||
|  | 				 | ||||||
|  | 				throw new Exception("Failed to get request ID"); | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			if(isset($html["headers"]["set-cookie"])){ | ||||||
|  | 				 | ||||||
|  | 				foreach($html["headers"]["set-cookie"] as $cookie){ | ||||||
|  | 					 | ||||||
|  | 					if( | ||||||
|  | 						preg_match( | ||||||
|  | 							'/([^=]+)=([^;]+)/', | ||||||
|  | 							$cookie, | ||||||
|  | 							$matches | ||||||
|  | 						) | ||||||
|  | 					){ | ||||||
|  | 						 | ||||||
|  | 						$tokens["cookies"][$matches[1]] = $matches[2]; | ||||||
|  | 					} | ||||||
|  | 				} | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			// | ||||||
|  | 			// Get initial search page | ||||||
|  | 			// | ||||||
|  | 			$tokens_req = $tokens["data"]; | ||||||
|  | 			$tokens_req[$tokens["req"]] = $search; | ||||||
|  | 			 | ||||||
| 			try{ | 			try{ | ||||||
| 				 | 				 | ||||||
| 			if($get["npt"]){ | 				$html = $this->get( | ||||||
| 				 |  | ||||||
| 				$params = [ |  | ||||||
| 					$tokens[0] => $q["q"], |  | ||||||
| 					"s" => $q["s"], |  | ||||||
| 					"l" => 30, |  | ||||||
| 					"n" => $tokens[1] |  | ||||||
| 				]; |  | ||||||
| 			}else{ |  | ||||||
| 				 |  | ||||||
| 				$params = [ |  | ||||||
| 					$tokens[0] => $search, |  | ||||||
| 					"n" => $tokens[1] |  | ||||||
| 				]; |  | ||||||
| 			} |  | ||||||
| 			 |  | ||||||
| 			$searchresults = $this->get( |  | ||||||
| 					$proxy, | 					$proxy, | ||||||
| 					"https://greppr.org/search", | 					"https://greppr.org/search", | ||||||
| 				$params, | 					$tokens_req, | ||||||
| 				$tokens[2] | 					$tokens["cookies"], | ||||||
|  | 					true | ||||||
| 				); | 				); | ||||||
| 			}catch(Exception $error){ | 			}catch(Exception $error){ | ||||||
| 				 | 				 | ||||||
| 				throw new Exception("Failed to fetch search page"); | 				throw new Exception("Failed to fetch search page"); | ||||||
| 			} | 			} | ||||||
| 		 |  | ||||||
| 		if(strlen($searchresults["data"]) === 0){ |  | ||||||
| 			 |  | ||||||
| 			// redirected to main page, which means we got old token |  | ||||||
| 			// generate a new one |  | ||||||
| 			 |  | ||||||
| 			// ... unless we just tried to do that |  | ||||||
| 			if($first_attempt === false){ |  | ||||||
| 				 |  | ||||||
| 				throw new Exception("Failed to get a new search token"); |  | ||||||
| 		} | 		} | ||||||
| 		 | 		 | ||||||
| 			return $this->web($get, false); | 		//$html = file_get_contents("scraper/greppr.html"); | ||||||
| 		} | 		//$this->fuckhtml->load($html); | ||||||
|  | 		$this->fuckhtml->load($html["data"]); | ||||||
| 		 | 		 | ||||||
| 		// refresh the token with new data (this also triggers fuckhtml load) |  | ||||||
| 		$this->parse_token($searchresults, $tokens[2]); |  | ||||||
| 		 |  | ||||||
| 		// response object |  | ||||||
| 		$out = [ | 		$out = [ | ||||||
| 			"status" => "ok", | 			"status" => "ok", | ||||||
| 			"spelling" => [ | 			"spelling" => [ | ||||||
| @@ -254,24 +347,16 @@ class greppr{ | |||||||
| 				 | 				 | ||||||
| 				if($break === true){ | 				if($break === true){ | ||||||
| 					 | 					 | ||||||
| 					parse_str( | 					$out["npt"] = | ||||||
|  | 						$this->backend->store( | ||||||
|  | 							json_encode([ | ||||||
|  | 								"get" => | ||||||
| 									$this->fuckhtml | 									$this->fuckhtml | ||||||
| 									->getTextContent( | 									->getTextContent( | ||||||
| 										$a["attributes"]["href"] | 										$a["attributes"]["href"] | ||||||
| 									), | 									), | ||||||
| 						$values | 								"cookies" => $tokens["cookies"] | ||||||
| 					); | 							]), | ||||||
| 					 |  | ||||||
| 					$values = array_values($values); |  | ||||||
| 					 |  | ||||||
| 					$out["npt"] = |  | ||||||
| 						$this->backend->store( |  | ||||||
| 							json_encode( |  | ||||||
| 								[ |  | ||||||
| 									"q" => $values[0], |  | ||||||
| 									"s" => $values[1] |  | ||||||
| 								] |  | ||||||
| 							), |  | ||||||
| 							"web", | 							"web", | ||||||
| 							$proxy | 							$proxy | ||||||
| 						); | 						); | ||||||
| @@ -360,74 +445,6 @@ class greppr{ | |||||||
| 		return $out; | 		return $out; | ||||||
| 	} | 	} | ||||||
| 	 | 	 | ||||||
| 	private function parse_token($response, $cookie = false){ |  | ||||||
| 		 |  | ||||||
| 		$this->fuckhtml->load($response["data"]); |  | ||||||
|  |  | ||||||
| 		$scripts = |  | ||||||
| 			$this->fuckhtml |  | ||||||
| 			->getElementsByTagName("script"); |  | ||||||
| 		 |  | ||||||
| 		$found = false; |  | ||||||
| 		foreach($scripts as $script){ |  | ||||||
| 			 |  | ||||||
| 			preg_match( |  | ||||||
| 				'/window\.location ?= ?\'\/search\?([^=]+).*&n=([0-9]+)/', |  | ||||||
| 				$script["innerHTML"], |  | ||||||
| 				$tokens |  | ||||||
| 			); |  | ||||||
| 			 |  | ||||||
| 			if(isset($tokens[1])){ |  | ||||||
| 				 |  | ||||||
| 				$found = true; |  | ||||||
| 				break; |  | ||||||
| 			} |  | ||||||
| 		} |  | ||||||
| 		 |  | ||||||
| 		if($found === false){ |  | ||||||
| 			 |  | ||||||
| 			return false; |  | ||||||
| 		} |  | ||||||
| 		 |  | ||||||
| 		$tokens = [ |  | ||||||
| 			$tokens[1], |  | ||||||
| 			$tokens[2] |  | ||||||
| 		]; |  | ||||||
| 		 |  | ||||||
| 		if($cookie !== false){ |  | ||||||
| 			 |  | ||||||
| 			// we already specified a cookie, so use the one we have already |  | ||||||
| 			$tokens[] = $cookie; |  | ||||||
| 			apcu_store("greppr_token", $tokens); |  | ||||||
| 			 |  | ||||||
| 			return $tokens; |  | ||||||
| 		} |  | ||||||
| 		 |  | ||||||
| 		if(!isset($response["headers"]["set-cookie"])){ |  | ||||||
| 			 |  | ||||||
| 			// server didn't send a cookie |  | ||||||
| 			return false; |  | ||||||
| 		} |  | ||||||
| 		 |  | ||||||
| 		// get cookie |  | ||||||
| 		preg_match( |  | ||||||
| 			'/PHPSESSID=([^;]+)/', |  | ||||||
| 			$response["headers"]["set-cookie"], |  | ||||||
| 			$cookie |  | ||||||
| 		); |  | ||||||
| 		 |  | ||||||
| 		if(!isset($cookie[1])){ |  | ||||||
| 			 |  | ||||||
| 			// server sent an unexpected cookie |  | ||||||
| 			return false; |  | ||||||
| 		} |  | ||||||
| 		 |  | ||||||
| 		$tokens[] = $cookie[1]; |  | ||||||
| 		apcu_store("greppr_token", $tokens); |  | ||||||
| 		 |  | ||||||
| 		return $tokens; |  | ||||||
| 	} |  | ||||||
| 	 |  | ||||||
| 	private function limitstrlen($text){ | 	private function limitstrlen($text){ | ||||||
| 		 | 		 | ||||||
| 		return explode("\n", wordwrap($text, 300, "\n"))[0]; | 		return explode("\n", wordwrap($text, 300, "\n"))[0]; | ||||||
|   | |||||||
| @@ -182,6 +182,23 @@ class imgur{ | |||||||
| 			throw new Exception("Failed to fetch HTML"); | 			throw new Exception("Failed to fetch HTML"); | ||||||
| 		} | 		} | ||||||
| 		 | 		 | ||||||
|  | 		$json = json_decode($html, true); | ||||||
|  | 		 | ||||||
|  | 		if($json){ | ||||||
|  | 			 | ||||||
|  | 			// {"data":{"error":"Imgur is temporarily over capacity. Please try again later."},"success":false,"status":403} | ||||||
|  | 			 | ||||||
|  | 			if(isset($json["data"]["error"])){ | ||||||
|  | 				 | ||||||
|  | 				if(stripos($json["data"]["error"], "capacity")){ | ||||||
|  | 					 | ||||||
|  | 					throw new Exception("Imgur IP blocked this 4get instance or request proxy. Try again"); | ||||||
|  | 				} | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("Imgur returned an unknown error (IP ban?)"); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
| 		$this->fuckhtml->load($html); | 		$this->fuckhtml->load($html); | ||||||
| 		 | 		 | ||||||
| 		$posts = | 		$posts = | ||||||
| @@ -197,7 +214,14 @@ class imgur{ | |||||||
| 			 | 			 | ||||||
| 			$image = | 			$image = | ||||||
| 				$this->fuckhtml | 				$this->fuckhtml | ||||||
| 				->getElementsByTagName("img")[0]; | 				->getElementsByTagName("img"); | ||||||
|  | 			 | ||||||
|  | 			if(count($image) === 0){ | ||||||
|  | 				 | ||||||
|  | 				continue; | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			$image = $image[0]; | ||||||
| 			 | 			 | ||||||
| 			$image_url = "https:" . substr($this->fuckhtml->getTextContent($image["attributes"]["src"]), 0, -5); | 			$image_url = "https:" . substr($this->fuckhtml->getTextContent($image["attributes"]["src"]), 0, -5); | ||||||
| 			 | 			 | ||||||
|   | |||||||
| @@ -3,7 +3,10 @@ | |||||||
| class marginalia{ | class marginalia{ | ||||||
| 	public function __construct(){ | 	public function __construct(){ | ||||||
| 		 | 		 | ||||||
| 		include "lib/fuckhtml.php"; | 		include "lib/anubis.php"; | ||||||
|  | 		$this->anubis = new anubis(); | ||||||
|  | 		 | ||||||
|  | 		include_once "lib/fuckhtml.php"; | ||||||
| 		$this->fuckhtml = new fuckhtml(); | 		$this->fuckhtml = new fuckhtml(); | ||||||
| 		 | 		 | ||||||
| 		include "lib/backend.php"; | 		include "lib/backend.php"; | ||||||
| @@ -102,7 +105,40 @@ class marginalia{ | |||||||
| 		); | 		); | ||||||
| 	} | 	} | ||||||
| 	 | 	 | ||||||
| 	private function get($proxy, $url, $get = []){ | 	private function get($proxy, $url, $get = [], $get_cookies = 1){ | ||||||
|  | 		 | ||||||
|  | 		$curlproc = curl_init(); | ||||||
|  | 		 | ||||||
|  | 		switch($get_cookies){ | ||||||
|  | 			 | ||||||
|  | 			case 0: | ||||||
|  | 				$cookies = ""; | ||||||
|  | 				$cookies_tmp = []; | ||||||
|  | 				curl_setopt($curlproc, CURLOPT_HEADERFUNCTION, function($curlproc, $header) use (&$cookies_tmp){ | ||||||
|  | 					 | ||||||
|  | 					$length = strlen($header); | ||||||
|  | 					 | ||||||
|  | 					$header = explode(":", $header, 2); | ||||||
|  | 					 | ||||||
|  | 					if(trim(strtolower($header[0])) == "set-cookie"){ | ||||||
|  | 						 | ||||||
|  | 						$cookie_tmp = explode("=", trim($header[1]), 2); | ||||||
|  | 						 | ||||||
|  | 						$cookies_tmp[trim($cookie_tmp[0])] = | ||||||
|  | 							explode(";", $cookie_tmp[1], 2)[0]; | ||||||
|  | 					} | ||||||
|  | 					 | ||||||
|  | 					return $length; | ||||||
|  | 				}); | ||||||
|  | 				break; | ||||||
|  | 			 | ||||||
|  | 			case 1: | ||||||
|  | 				$cookies = ""; | ||||||
|  | 				break; | ||||||
|  | 			 | ||||||
|  | 			default: | ||||||
|  | 				$cookies = "Cookie: " . $get_cookies; | ||||||
|  | 		} | ||||||
| 		 | 		 | ||||||
| 		$headers = [ | 		$headers = [ | ||||||
| 			"User-Agent: " . config::USER_AGENT, | 			"User-Agent: " . config::USER_AGENT, | ||||||
| @@ -110,6 +146,7 @@ class marginalia{ | |||||||
| 			"Accept-Language: en-US,en;q=0.5", | 			"Accept-Language: en-US,en;q=0.5", | ||||||
| 			"Accept-Encoding: gzip", | 			"Accept-Encoding: gzip", | ||||||
| 			"DNT: 1", | 			"DNT: 1", | ||||||
|  | 			$cookies, | ||||||
| 			"Connection: keep-alive", | 			"Connection: keep-alive", | ||||||
| 			"Upgrade-Insecure-Requests: 1", | 			"Upgrade-Insecure-Requests: 1", | ||||||
| 			"Sec-Fetch-Dest: document", | 			"Sec-Fetch-Dest: document", | ||||||
| @@ -118,8 +155,6 @@ class marginalia{ | |||||||
| 			"Sec-Fetch-User: ?1" | 			"Sec-Fetch-User: ?1" | ||||||
| 		]; | 		]; | ||||||
| 		 | 		 | ||||||
| 		$curlproc = curl_init(); |  | ||||||
| 		 |  | ||||||
| 		if($get !== []){ | 		if($get !== []){ | ||||||
| 			$get = http_build_query($get); | 			$get = http_build_query($get); | ||||||
| 			$url .= "?" . $get; | 			$url .= "?" . $get; | ||||||
| @@ -145,7 +180,19 @@ class marginalia{ | |||||||
| 			throw new Exception(curl_error($curlproc)); | 			throw new Exception(curl_error($curlproc)); | ||||||
| 		} | 		} | ||||||
| 		 | 		 | ||||||
|  | 		if($get_cookies === 0){ | ||||||
|  | 			 | ||||||
|  | 			$cookie = []; | ||||||
|  | 			 | ||||||
|  | 			foreach($cookies_tmp as $key => $value){ | ||||||
|  | 				 | ||||||
|  | 				$cookie[] = $key . "=" . $value; | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
| 			curl_close($curlproc); | 			curl_close($curlproc); | ||||||
|  | 			return implode(";", $cookie); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
| 		return $data; | 		return $data; | ||||||
| 	} | 	} | ||||||
| 	 | 	 | ||||||
| @@ -227,7 +274,7 @@ class marginalia{ | |||||||
| 				$json = | 				$json = | ||||||
| 					$this->get( | 					$this->get( | ||||||
| 						$this->backend->get_ip(), // no nextpage | 						$this->backend->get_ip(), // no nextpage | ||||||
| 						"https://api.marginalia.nu/" . config::MARGINALIA_API_KEY . "/search/" . urlencode($search), | 						"https://api.marginalia-search.com/" . config::MARGINALIA_API_KEY . "/search/" . urlencode($search), | ||||||
| 						[ | 						[ | ||||||
| 							"count" => 20 | 							"count" => 20 | ||||||
| 						] | 						] | ||||||
| @@ -267,6 +314,60 @@ class marginalia{ | |||||||
| 		// HTML parser | 		// HTML parser | ||||||
| 		$proxy = $this->backend->get_ip(); | 		$proxy = $this->backend->get_ip(); | ||||||
| 		 | 		 | ||||||
|  | 		// | ||||||
|  | 		// Bypass anubis check | ||||||
|  | 		// | ||||||
|  | 		/* | ||||||
|  | 		if(($anubis_key = apcu_fetch("marginalia_cookie")) === false){ | ||||||
|  | 			 | ||||||
|  | 			try{ | ||||||
|  | 				$html = | ||||||
|  | 					$this->get( | ||||||
|  | 						$proxy, | ||||||
|  | 						"https://old-search.marginalia.nu/search", | ||||||
|  | 						[ | ||||||
|  | 							"query" => $search | ||||||
|  | 						] | ||||||
|  | 					); | ||||||
|  | 					 | ||||||
|  | 			}catch(Exception $error){ | ||||||
|  | 				 | ||||||
|  | 				throw new Exception("Failed to get anubis challenge"); | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			try{ | ||||||
|  | 				 | ||||||
|  | 				$anubis_data = $this->anubis->scrape($html); | ||||||
|  | 			}catch(Exception $error){ | ||||||
|  | 				 | ||||||
|  | 				throw new Exception($error); | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			// send anubis response & get cookies | ||||||
|  | 			// https://old-search.marginalia.nu/.within.website/x/cmd/anubis/api/pass-challenge?response=0000018966b086834f738bacba6031028adb5aa875974ead197a8b75778baf3a&nonce=39947&redir=https%3A%2F%2Fold-search.marginalia.nu%2F&elapsedTime=1164 | ||||||
|  | 			 | ||||||
|  | 			try{ | ||||||
|  | 				 | ||||||
|  | 				$anubis_key = | ||||||
|  | 					$this->get( | ||||||
|  | 						$proxy, | ||||||
|  | 						"https://old-search.marginalia.nu/.within.website/x/cmd/anubis/api/pass-challenge", | ||||||
|  | 						[ | ||||||
|  | 							"response" => $anubis_data["response"], | ||||||
|  | 							"nonce" => $anubis_data["nonce"], | ||||||
|  | 							"redir" => "https://old-search.marginalia.nu/", | ||||||
|  | 							"elapsedTime" => random_int(1000, 2000) | ||||||
|  | 						], | ||||||
|  | 						0 | ||||||
|  | 					); | ||||||
|  | 			}catch(Exception $error){ | ||||||
|  | 				 | ||||||
|  | 				throw new Exception("Failed to submit anubis challenge"); | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			apcu_store("marginalia_cookie", $anubis_key); | ||||||
|  | 		}*/ | ||||||
|  | 		 | ||||||
| 		if($get["npt"]){ | 		if($get["npt"]){ | ||||||
| 			 | 			 | ||||||
| 			[$params, $proxy] = | 			[$params, $proxy] = | ||||||
| @@ -279,7 +380,9 @@ class marginalia{ | |||||||
| 				$html = | 				$html = | ||||||
| 					$this->get( | 					$this->get( | ||||||
| 						$proxy, | 						$proxy, | ||||||
| 						"https://search.marginalia.nu/search?" . $params | 						"https://old-search.marginalia.nu/search?" . $params, | ||||||
|  | 						[], | ||||||
|  | 						//$anubis_key | ||||||
| 					); | 					); | ||||||
| 			}catch(Exception $error){ | 			}catch(Exception $error){ | ||||||
| 				 | 				 | ||||||
| @@ -308,8 +411,9 @@ class marginalia{ | |||||||
| 				$html = | 				$html = | ||||||
| 					$this->get( | 					$this->get( | ||||||
| 						$proxy, | 						$proxy, | ||||||
| 						"https://search.marginalia.nu/search", | 						"https://old-search.marginalia.nu/search", | ||||||
| 						$params | 						$params, | ||||||
|  | 						//$anubis_key | ||||||
| 					); | 					); | ||||||
| 			}catch(Exception $error){ | 			}catch(Exception $error){ | ||||||
| 				 | 				 | ||||||
|   | |||||||
| @@ -457,7 +457,7 @@ class mojeek{ | |||||||
| 				"tn" => 7, // number of news results/page | 				"tn" => 7, // number of news results/page | ||||||
| 				"date" => 1, // show date | 				"date" => 1, // show date | ||||||
| 				"tlen" => 128, // max length of title | 				"tlen" => 128, // max length of title | ||||||
| 				"dlen" => 511, // max length of description | 				//"dlen" => 511, // max length of description | ||||||
| 				"arc" => ($country == "any" ? "none" : $country) // location. don't use autodetect! | 				"arc" => ($country == "any" ? "none" : $country) // location. don't use autodetect! | ||||||
| 			]; | 			]; | ||||||
| 			 | 			 | ||||||
| @@ -501,11 +501,6 @@ class mojeek{ | |||||||
| 				 | 				 | ||||||
| 				throw new Exception("Failed to get HTML"); | 				throw new Exception("Failed to get HTML"); | ||||||
| 			} | 			} | ||||||
| 			/* |  | ||||||
| 			$handle = fopen("scraper/mojeek.html", "r"); |  | ||||||
| 			$html = fread($handle, filesize("scraper/mojeek.html")); |  | ||||||
| 			fclose($handle);*/ |  | ||||||
| 			 |  | ||||||
| 		} | 		} | ||||||
| 		 | 		 | ||||||
| 		$out = [ | 		$out = [ | ||||||
| @@ -526,6 +521,8 @@ class mojeek{ | |||||||
| 		 | 		 | ||||||
| 		$this->fuckhtml->load($html); | 		$this->fuckhtml->load($html); | ||||||
| 		 | 		 | ||||||
|  | 		$this->detect_block(); | ||||||
|  | 		 | ||||||
| 		$results = | 		$results = | ||||||
| 			$this->fuckhtml | 			$this->fuckhtml | ||||||
| 			->getElementsByClassName("results-standard", "ul"); | 			->getElementsByClassName("results-standard", "ul"); | ||||||
| @@ -695,17 +692,18 @@ class mojeek{ | |||||||
| 				preg_match( | 				preg_match( | ||||||
| 					'/\/image\?img=([^&]+)/i', | 					'/\/image\?img=([^&]+)/i', | ||||||
| 					$thumb[0]["attributes"]["src"], | 					$thumb[0]["attributes"]["src"], | ||||||
| 					$thumb | 					$matches | ||||||
| 				); | 				); | ||||||
| 				 | 				 | ||||||
| 				if(count($thumb) === 2){ | 				if(count($matches) === 2){ | ||||||
| 					 | 					 | ||||||
|  | 					// for some reason, if we dont get the image from mojeek | ||||||
|  | 					// it sometimes fail to fetch the right image URL | ||||||
| 					$answer["thumb"] = | 					$answer["thumb"] = | ||||||
| 						urldecode( | 						"https://mojeek.com" . | ||||||
| 						$this->fuckhtml | 						$this->fuckhtml | ||||||
| 						->getTextContent( | 						->getTextContent( | ||||||
| 								$thumb[1] | 							$thumb[0]["attributes"]["src"] | ||||||
| 							) |  | ||||||
| 						); | 						); | ||||||
| 				} | 				} | ||||||
| 			} | 			} | ||||||
| @@ -1034,6 +1032,8 @@ class mojeek{ | |||||||
| 		 | 		 | ||||||
| 		$this->fuckhtml->load($html); | 		$this->fuckhtml->load($html); | ||||||
| 		 | 		 | ||||||
|  | 		$this->detect_block(); | ||||||
|  | 		 | ||||||
| 		$articles = | 		$articles = | ||||||
| 			$this->fuckhtml->getElementsByTagName("article"); | 			$this->fuckhtml->getElementsByTagName("article"); | ||||||
| 		 | 		 | ||||||
| @@ -1166,6 +1166,26 @@ class mojeek{ | |||||||
| 		return $out; | 		return $out; | ||||||
| 	} | 	} | ||||||
| 	 | 	 | ||||||
|  | 	private function detect_block(){ | ||||||
|  | 		 | ||||||
|  | 		$title = | ||||||
|  | 			$this->fuckhtml | ||||||
|  | 			->getElementsByTagName( | ||||||
|  | 				"title" | ||||||
|  | 			); | ||||||
|  | 		 | ||||||
|  | 		if( | ||||||
|  | 			count($title) !== 0 && | ||||||
|  | 			$this->fuckhtml | ||||||
|  | 			->getTextContent( | ||||||
|  | 				$title[0]["innerHTML"] | ||||||
|  | 			) == "403 - Forbidden" | ||||||
|  | 		){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("Mojeek blocked this instance or request proxy."); | ||||||
|  | 		} | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
| 	private function titledots($title){ | 	private function titledots($title){ | ||||||
| 		 | 		 | ||||||
| 		return trim($title, ". \t\n\r\0\x0B"); | 		return trim($title, ". \t\n\r\0\x0B"); | ||||||
|   | |||||||
							
								
								
									
										342
									
								
								scraper/mullvad.php
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										342
									
								
								scraper/mullvad.php
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,342 @@ | |||||||
|  | <?php | ||||||
|  |  | ||||||
|  | class mullvad{ | ||||||
|  | 	 | ||||||
|  | 	public function __construct($engine){ | ||||||
|  | 		 | ||||||
|  | 		$this->engine = $engine; | ||||||
|  | 		 | ||||||
|  | 		include "lib/backend.php"; | ||||||
|  | 		$this->backend = new backend("mullvad_{$this->engine}"); | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	public function getfilters($page){ | ||||||
|  | 		return [ | ||||||
|  | 			"country" => [ // &country= | ||||||
|  | 				"display" => "Country", | ||||||
|  | 				"option" => [ | ||||||
|  | 					"any" => "Any country", | ||||||
|  | 					"ar" => "Argentina", | ||||||
|  | 					"au" => "Australia", | ||||||
|  | 					"at" => "Austria", | ||||||
|  | 					"be" => "Belgium", | ||||||
|  | 					"br" => "Brazil", | ||||||
|  | 					"ca" => "Canada", | ||||||
|  | 					"cl" => "Chile", | ||||||
|  | 					"cn" => "China", | ||||||
|  | 					"dk" => "Denmark", | ||||||
|  | 					"fi" => "Finland", | ||||||
|  | 					"fr" => "France", | ||||||
|  | 					"de" => "Germany", | ||||||
|  | 					"hk" => "Hong Kong", | ||||||
|  | 					"in" => "India", | ||||||
|  | 					"id" => "Indonesia", | ||||||
|  | 					"it" => "Italy", | ||||||
|  | 					"jp" => "Japan", | ||||||
|  | 					"kr" => "Korea, Republic", | ||||||
|  | 					"my" => "Malaysia", | ||||||
|  | 					"mx" => "Mexico", | ||||||
|  | 					"nl" => "Netherlands", | ||||||
|  | 					"nz" => "New Zealand", | ||||||
|  | 					"no" => "Norway", | ||||||
|  | 					"ph" => "Philippines", | ||||||
|  | 					"pl" => "Poland", | ||||||
|  | 					"pt" => "Portugal", | ||||||
|  | 					"ru" => "Russian Federation", | ||||||
|  | 					"sa" => "Saudi Arabia", | ||||||
|  | 					"za" => "South Africa", | ||||||
|  | 					"es" => "Spain", | ||||||
|  | 					"se" => "Sweden", | ||||||
|  | 					"ch" => "Switzerland", | ||||||
|  | 					"tw" => "Taiwan", | ||||||
|  | 					"tr" => "Turkey", | ||||||
|  | 					"uk" => "United Kingdom", | ||||||
|  | 					"us" => "United States" | ||||||
|  | 				] | ||||||
|  | 			], | ||||||
|  | 			"language" => [ // &language= | ||||||
|  | 				"display" => "Language", | ||||||
|  | 				"option" => [ | ||||||
|  | 					"any" => "Any language", | ||||||
|  | 					"ar" => "Arabic", | ||||||
|  | 					"bg" => "Bulgarian", | ||||||
|  | 					"ca" => "Catalan", | ||||||
|  | 					"zh-hans" => "Chinese (Simplified)", | ||||||
|  | 					"zh-hant" => "Chinese (Traditional)", | ||||||
|  | 					"hr" => "Croatian", | ||||||
|  | 					"cs" => "Czech", | ||||||
|  | 					"da" => "Danish", | ||||||
|  | 					"nl" => "Dutch", | ||||||
|  | 					"en" => "English", | ||||||
|  | 					"et" => "Estonian", | ||||||
|  | 					"fi" => "Finnish", | ||||||
|  | 					"fr" => "French", | ||||||
|  | 					"de" => "German", | ||||||
|  | 					"he" => "Hebrew", | ||||||
|  | 					"hu" => "Hungarian", | ||||||
|  | 					"is" => "Icelandic", | ||||||
|  | 					"it" => "Italian", | ||||||
|  | 					"jp" => "Japanese", | ||||||
|  | 					"ko" => "Korean", | ||||||
|  | 					"lv" => "Latvian", | ||||||
|  | 					"lt" => "Lithuanian", | ||||||
|  | 					"nb" => "Norwegian", | ||||||
|  | 					"pl" => "Polish", | ||||||
|  | 					"pt" => "Portuguese", | ||||||
|  | 					"ro" => "Romanian", | ||||||
|  | 					"ru" => "Russian", | ||||||
|  | 					"sr" => "Serbian", | ||||||
|  | 					"sk" => "Slovak", | ||||||
|  | 					"sl" => "Slovenian", | ||||||
|  | 					"es" => "Spanish", | ||||||
|  | 					"sv" => "Swedish", | ||||||
|  | 					"tr" => "Turkish" | ||||||
|  | 				] | ||||||
|  | 			], | ||||||
|  | 			"time" => [ // &lastUpdated= | ||||||
|  | 				"display" => "Time posted", | ||||||
|  | 				"option" => [ | ||||||
|  | 					"any" => "Any time", | ||||||
|  | 					"d" => "Past day", | ||||||
|  | 					"w" => "Past week", | ||||||
|  | 					"m" => "Past month", | ||||||
|  | 					"y" => "Past year" | ||||||
|  | 				] | ||||||
|  | 			] | ||||||
|  | 		]; | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	private function get($proxy, $url, $get = []){ | ||||||
|  | 		 | ||||||
|  | 		$curlproc = curl_init(); | ||||||
|  | 		 | ||||||
|  | 		if($get !== []){ | ||||||
|  | 			$get = http_build_query($get); | ||||||
|  | 			$url .= "?" . $get; | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_URL, $url); | ||||||
|  | 		 | ||||||
|  | 		// http2 bypass | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_HTTP_VERSION, CURL_HTTP_VERSION_2_0); | ||||||
|  | 		 | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_ENCODING, ""); // default encoding | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_HTTPHEADER, | ||||||
|  | 			["User-Agent: " . config::USER_AGENT, | ||||||
|  | 			"Accept: */*", | ||||||
|  | 			"Accept-Language: en-US,en;q=0.5", | ||||||
|  | 			"Accept-Encoding: gzip, deflate, br, zstd", | ||||||
|  | 			"Referer: https://leta.mullvad.net/search", | ||||||
|  | 			"DNT: 1", | ||||||
|  | 			"Sec-GPC: 1", | ||||||
|  | 			"Connection: keep-alive", | ||||||
|  | 			"Cookie: engine=brave", | ||||||
|  | 			"Sec-Fetch-Dest: empty", | ||||||
|  | 			"Sec-Fetch-Mode: cors", | ||||||
|  | 			"Sec-Fetch-Site: same-origin", | ||||||
|  | 			"Priority: u=0", | ||||||
|  | 			"TE: trailers"] | ||||||
|  | 		); | ||||||
|  | 		 | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_RETURNTRANSFER, true); | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_SSL_VERIFYHOST, 2); | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_SSL_VERIFYPEER, true); | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_CONNECTTIMEOUT, 30); | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_TIMEOUT, 30); | ||||||
|  | 		 | ||||||
|  | 		$this->backend->assign_proxy($curlproc, $proxy); | ||||||
|  | 		 | ||||||
|  | 		$data = curl_exec($curlproc); | ||||||
|  | 		 | ||||||
|  | 		if(curl_errno($curlproc)){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception(curl_error($curlproc)); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		curl_close($curlproc); | ||||||
|  | 		return $data; | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	public function web($get){ | ||||||
|  | 		 | ||||||
|  | 		if($get["npt"]){ | ||||||
|  | 			 | ||||||
|  | 			[$params, $proxy] = $this->backend->get($get["npt"], "web"); | ||||||
|  | 			$params = json_decode($params, true); | ||||||
|  | 			 | ||||||
|  | 		}else{ | ||||||
|  | 			 | ||||||
|  | 			if(strlen($get["s"]) === 0){ | ||||||
|  | 				 | ||||||
|  | 				throw new Exception("Search term is empty!"); | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			// generate filters | ||||||
|  | 			$params = [ | ||||||
|  | 				"q" => $get["s"], | ||||||
|  | 				"engine" => $this->engine, | ||||||
|  | 				"page" => 1 | ||||||
|  | 			]; | ||||||
|  | 			 | ||||||
|  | 			if($get["country"] != "any"){ | ||||||
|  | 				 | ||||||
|  | 				$params["country"] = $get["country"]; | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			if($get["language"] != "any"){ | ||||||
|  | 				 | ||||||
|  | 				$params["language"] = $get["language"]; | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			if($get["time"] != "any"){ | ||||||
|  | 				 | ||||||
|  | 				$params["lastUpdated"] = $get["time"]; | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			$proxy = $this->backend->get_ip(); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		try{ | ||||||
|  | 			$json = $this->get( | ||||||
|  | 				$proxy, | ||||||
|  | 				"https://leta.mullvad.net/search/__data.json", | ||||||
|  | 				$params | ||||||
|  | 			); | ||||||
|  | 		}catch(Exception $error){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("Failed to fetch search page"); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		$json = json_decode($json, true); | ||||||
|  | 		 | ||||||
|  | 		if($json === null){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("Failed to decode JSON"); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		if(!isset($json["nodes"])){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("Mullvad did not return a nodes object"); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		$out = [ | ||||||
|  | 			"status" => "ok", | ||||||
|  | 			"spelling" => [ | ||||||
|  | 				"type" => "no_correction", | ||||||
|  | 				"using" => null, | ||||||
|  | 				"correction" => null | ||||||
|  | 			], | ||||||
|  | 			"npt" => $nextpage, | ||||||
|  | 			"answer" => [], | ||||||
|  | 			"web" => [], | ||||||
|  | 			"image" => [], | ||||||
|  | 			"video" => [], | ||||||
|  | 			"news" => [], | ||||||
|  | 			"related" => [] | ||||||
|  | 		]; | ||||||
|  | 		 | ||||||
|  | 		// parse json payload | ||||||
|  | 		foreach($json["nodes"] as $node){ | ||||||
|  | 			 | ||||||
|  | 			if(!isset($node["data"][0]["q"])){ | ||||||
|  | 				 | ||||||
|  | 				// not iterating through the query object | ||||||
|  | 				continue; | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			// node 0 contains pointers to what we need to iterate through | ||||||
|  | 			$node0 = &$node["data"][0]; | ||||||
|  | 			 | ||||||
|  | 			if(!isset($node["data"][$node0["success"]])){ | ||||||
|  | 				 | ||||||
|  | 				throw new Exception("Mullvad did not return a success object"); | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			$success = &$node["data"][$node0["success"]]; | ||||||
|  | 			 | ||||||
|  | 			if($success === false){ | ||||||
|  | 				 | ||||||
|  | 				throw new Exception("Mullvad flagged the response as unsuccessful"); | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			if(!isset($node["data"][$node0["items"]])){ | ||||||
|  | 				 | ||||||
|  | 				throw new Exception("Mullvad did not return an items object"); | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			$search_pointers = &$node["data"][$node0["items"]]; | ||||||
|  | 			 | ||||||
|  | 			// | ||||||
|  | 			// Iterate over results | ||||||
|  | 			// | ||||||
|  | 			foreach($search_pointers as $pointer){ | ||||||
|  | 				 | ||||||
|  | 				$pointer = &$node["data"][$pointer]; | ||||||
|  | 				 | ||||||
|  | 				$link = &$node["data"][$pointer["link"]]; | ||||||
|  | 				$title = &$node["data"][$pointer["title"]]; | ||||||
|  | 				$description = &$node["data"][$pointer["snippet"]]; | ||||||
|  | 				 | ||||||
|  | 				$date = null; | ||||||
|  | 				if($this->engine == "google"){ | ||||||
|  | 					 | ||||||
|  | 					// attempt to extract date | ||||||
|  | 					// Jan 12, 2017 | ||||||
|  | 					$date_parts = explode(" ... ", $description, 2); | ||||||
|  | 					 | ||||||
|  | 					if( | ||||||
|  | 						count($date_parts) === 2 && | ||||||
|  | 						strlen($date_parts[0]) < 15 | ||||||
|  | 					){ | ||||||
|  | 						 | ||||||
|  | 						$date = strtotime(trim($date_parts[0])); | ||||||
|  | 						 | ||||||
|  | 						if($date === false){ | ||||||
|  | 							 | ||||||
|  | 							$date = null; | ||||||
|  | 						}else{ | ||||||
|  | 							 | ||||||
|  | 							$description = trim($date_parts[1]); | ||||||
|  | 						} | ||||||
|  | 					} | ||||||
|  | 				} | ||||||
|  | 				 | ||||||
|  | 				$out["web"][] = [ | ||||||
|  | 					"title" => $this->titledots($title), | ||||||
|  | 					"description" => $this->titledots($description), | ||||||
|  | 					"url" => $link, | ||||||
|  | 					"date" => $date, | ||||||
|  | 					"type" => "web", | ||||||
|  | 					"thumb" => [ | ||||||
|  | 						"url" => null, | ||||||
|  | 						"ratio" => null | ||||||
|  | 					], | ||||||
|  | 					"sublink" => [], | ||||||
|  | 					"table" => [] | ||||||
|  | 				]; | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			// | ||||||
|  | 			// Get nextpage | ||||||
|  | 			// | ||||||
|  | 			if(isset($node["data"][$node0["next"]])){ | ||||||
|  | 				 | ||||||
|  | 				$params["page"] = (int)$node["data"][$node0["next"]]; | ||||||
|  | 				 | ||||||
|  | 				$out["npt"] = | ||||||
|  | 					$this->backend->store( | ||||||
|  | 						json_encode($params), | ||||||
|  | 						"web", | ||||||
|  | 						$proxy | ||||||
|  | 					); | ||||||
|  | 			} | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		return $out; | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	private function titledots($title){ | ||||||
|  | 		 | ||||||
|  | 		return trim($title, " .\t\n\r\0\x0B…"); | ||||||
|  | 	} | ||||||
|  | } | ||||||
							
								
								
									
										20
									
								
								scraper/mullvad_brave.php
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										20
									
								
								scraper/mullvad_brave.php
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,20 @@ | |||||||
|  | <?php | ||||||
|  |  | ||||||
|  | class mullvad_brave{ | ||||||
|  | 	 | ||||||
|  | 	public function __construct(){ | ||||||
|  | 		 | ||||||
|  | 		include "scraper/mullvad.php"; | ||||||
|  | 		$this->mullvad = new mullvad("brave"); | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	public function getfilters($page){ | ||||||
|  | 		 | ||||||
|  | 		return $this->mullvad->getfilters($page); | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	public function web($get){ | ||||||
|  | 		 | ||||||
|  | 		return $this->mullvad->web($get); | ||||||
|  | 	} | ||||||
|  | } | ||||||
							
								
								
									
										20
									
								
								scraper/mullvad_google.php
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										20
									
								
								scraper/mullvad_google.php
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,20 @@ | |||||||
|  | <?php | ||||||
|  |  | ||||||
|  | class mullvad_google{ | ||||||
|  | 	 | ||||||
|  | 	public function __construct(){ | ||||||
|  | 		 | ||||||
|  | 		include "scraper/mullvad.php"; | ||||||
|  | 		$this->mullvad = new mullvad("google"); | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	public function getfilters($page){ | ||||||
|  | 		 | ||||||
|  | 		return $this->mullvad->getfilters($page); | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	public function web($get){ | ||||||
|  | 		 | ||||||
|  | 		return $this->mullvad->web($get); | ||||||
|  | 	} | ||||||
|  | } | ||||||
| @@ -13,31 +13,104 @@ class pinterest{ | |||||||
| 		return []; | 		return []; | ||||||
| 	} | 	} | ||||||
| 	 | 	 | ||||||
| 	private function get($proxy, $url, $get = []){ | 	private function get($proxy, $url, $get = [], &$cookies, $header_data_post = null){ | ||||||
| 		 | 		 | ||||||
| 		$curlproc = curl_init(); | 		$curlproc = curl_init(); | ||||||
| 		 | 		 | ||||||
|  | 		if($header_data_post === null){ | ||||||
|  | 			 | ||||||
|  | 			// handling GET | ||||||
|  | 						 | ||||||
|  | 			// extract cookies | ||||||
|  | 			$cookies_tmp = []; | ||||||
|  | 			curl_setopt($curlproc, CURLOPT_HEADERFUNCTION, function($curlproc, $header) use (&$cookies_tmp){ | ||||||
|  | 				 | ||||||
|  | 				$length = strlen($header); | ||||||
|  | 				 | ||||||
|  | 				$header = explode(":", $header, 2); | ||||||
|  | 				 | ||||||
|  | 				if(trim(strtolower($header[0])) == "set-cookie"){ | ||||||
|  | 					 | ||||||
|  | 					$cookie_tmp = explode("=", trim($header[1]), 2); | ||||||
|  | 					 | ||||||
|  | 					$cookies_tmp[trim($cookie_tmp[0])] = | ||||||
|  | 						explode(";", $cookie_tmp[1], 2)[0]; | ||||||
|  | 				} | ||||||
|  | 				 | ||||||
|  | 				return $length; | ||||||
|  | 			}); | ||||||
|  | 			 | ||||||
|  | 			curl_setopt($curlproc, CURLOPT_HTTPHEADER, | ||||||
|  | 				["User-Agent: " . config::USER_AGENT, | ||||||
|  | 				"Accept: application/json, text/javascript, */*, q=0.01", | ||||||
|  | 				"Accept-Language: en-US,en;q=0.5", | ||||||
|  | 				"Accept-Encoding: gzip", | ||||||
|  | 				"Referer: https://ca.pinterest.com/", | ||||||
|  | 				"X-Requested-With: XMLHttpRequest", | ||||||
|  | 				"X-APP-VERSION: 78f8764", | ||||||
|  | 				"X-Pinterest-AppState: active", | ||||||
|  | 				"X-Pinterest-Source-Url: /", | ||||||
|  | 				"X-Pinterest-PWS-Handler: www/index.js", | ||||||
|  | 				"screen-dpr: 1", | ||||||
|  | 				"is-preload-enabled: 1", | ||||||
|  | 				"DNT: 1", | ||||||
|  | 				"Sec-GPC: 1", | ||||||
|  | 				"Sec-Fetch-Dest: empty", | ||||||
|  | 				"Sec-Fetch-Mode: cors", | ||||||
|  | 				"Sec-Fetch-Site: same-origin", | ||||||
|  | 				"Connection: keep-alive", | ||||||
|  | 				"Alt-Used: ca.pinterest.com", | ||||||
|  | 				"Priority: u=0", | ||||||
|  | 				"TE: trailers"] | ||||||
|  | 			); | ||||||
|  | 			 | ||||||
| 			if($get !== []){ | 			if($get !== []){ | ||||||
| 				$get = http_build_query($get); | 				$get = http_build_query($get); | ||||||
| 				$url .= "?" . $get; | 				$url .= "?" . $get; | ||||||
| 			} | 			} | ||||||
|  | 		}else{ | ||||||
|  | 			 | ||||||
|  | 			// handling POST (pagination) | ||||||
|  | 			$get = http_build_query($get); | ||||||
|  | 			 | ||||||
|  | 			curl_setopt($curlproc, CURLOPT_HTTPHEADER, | ||||||
|  | 				["User-Agent: " . config::USER_AGENT, | ||||||
|  | 				"Accept: application/json, text/javascript, */*, q=0.01", | ||||||
|  | 				"Accept-Language: en-US,en;q=0.5", | ||||||
|  | 				"Accept-Encoding: gzip", | ||||||
|  | 				"Content-Type: application/x-www-form-urlencoded", | ||||||
|  | 				"Content-Length: " . strlen($get), | ||||||
|  | 				"Referer: https://ca.pinterest.com/", | ||||||
|  | 				"X-Requested-With: XMLHttpRequest", | ||||||
|  | 				"X-APP-VERSION: 78f8764", | ||||||
|  | 				"X-CSRFToken: " . $cookies["csrf"], | ||||||
|  | 				"X-Pinterest-AppState: active", | ||||||
|  | 				"X-Pinterest-Source-Url: /search/pins/?rs=ac&len=2&q=" . urlencode($header_data_post) . "&eq=" . urlencode($header_data_post), | ||||||
|  | 				"X-Pinterest-PWS-Handler: www/search/[scope].js", | ||||||
|  | 				"screen-dpr: 1", | ||||||
|  | 				"is-preload-enabled: 1", | ||||||
|  | 				"Origin: https://ca.pinterest.com", | ||||||
|  | 				"DNT: 1", | ||||||
|  | 				"Sec-GPC: 1", | ||||||
|  | 				"Sec-Fetch-Dest: empty", | ||||||
|  | 				"Sec-Fetch-Mode: cors", | ||||||
|  | 				"Sec-Fetch-Site: same-origin", | ||||||
|  | 				"Connection: keep-alive", | ||||||
|  | 				"Alt-Used: ca.pinterest.com", | ||||||
|  | 				"Cookie: " . $cookies["cookie"], | ||||||
|  | 				"TE: trailers"] | ||||||
|  | 			); | ||||||
|  | 			 | ||||||
|  | 			curl_setopt($curlproc, CURLOPT_POST, true); | ||||||
|  | 			curl_setopt($curlproc, CURLOPT_POSTFIELDS, $get); | ||||||
|  | 		} | ||||||
| 		 | 		 | ||||||
| 		curl_setopt($curlproc, CURLOPT_URL, $url); | 		curl_setopt($curlproc, CURLOPT_URL, $url); | ||||||
| 		 | 		 | ||||||
| 		curl_setopt($curlproc, CURLOPT_ENCODING, ""); // default encoding | 		curl_setopt($curlproc, CURLOPT_ENCODING, ""); // default encoding | ||||||
| 		curl_setopt($curlproc, CURLOPT_HTTPHEADER, | 		 | ||||||
| 			["User-Agent: Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:107.0) Gecko/20100101 Firefox/110.0", | 		// http2 bypass | ||||||
| 			"Accept: text/html,application/xhtml+xml,application/xml;q=0.9,image/avif,image/webp,*/*;q=0.8", | 		curl_setopt($curlproc, CURLOPT_HTTP_VERSION, CURL_HTTP_VERSION_2_0); | ||||||
| 			"Accept-Language: en-US,en;q=0.5", |  | ||||||
| 			"Accept-Encoding: gzip", |  | ||||||
| 			"DNT: 1", |  | ||||||
| 			"Connection: keep-alive", |  | ||||||
| 			"Upgrade-Insecure-Requests: 1", |  | ||||||
| 			"Sec-Fetch-Dest: document", |  | ||||||
| 			"Sec-Fetch-Mode: navigate", |  | ||||||
| 			"Sec-Fetch-Site: none", |  | ||||||
| 			"Sec-Fetch-User: ?1"] |  | ||||||
| 		); |  | ||||||
| 		 | 		 | ||||||
| 		curl_setopt($curlproc, CURLOPT_RETURNTRANSFER, true); | 		curl_setopt($curlproc, CURLOPT_RETURNTRANSFER, true); | ||||||
| 		curl_setopt($curlproc, CURLOPT_SSL_VERIFYHOST, 2); | 		curl_setopt($curlproc, CURLOPT_SSL_VERIFYHOST, 2); | ||||||
| @@ -54,6 +127,26 @@ class pinterest{ | |||||||
| 			throw new Exception(curl_error($curlproc)); | 			throw new Exception(curl_error($curlproc)); | ||||||
| 		} | 		} | ||||||
| 		 | 		 | ||||||
|  | 		if($header_data_post === null){ | ||||||
|  | 			 | ||||||
|  | 			if(!isset($cookies_tmp["csrftoken"])){ | ||||||
|  | 				 | ||||||
|  | 				throw new Exception("Failed to grep CSRF token"); | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			$cookies = ""; | ||||||
|  | 			 | ||||||
|  | 			foreach($cookies_tmp as $cookie_name => $cookie_value){ | ||||||
|  | 				 | ||||||
|  | 				$cookies .= $cookie_name . "=" . $cookie_value . "; "; | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			$cookies = [ | ||||||
|  | 				"csrf" => $cookies_tmp["csrftoken"], | ||||||
|  | 				"cookie" => rtrim($cookies, " ;") | ||||||
|  | 			]; | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
| 		curl_close($curlproc); | 		curl_close($curlproc); | ||||||
| 		return $data; | 		return $data; | ||||||
| 	} | 	} | ||||||
| @@ -62,17 +155,68 @@ class pinterest{ | |||||||
| 		 | 		 | ||||||
| 		if($get["npt"]){ | 		if($get["npt"]){ | ||||||
| 			 | 			 | ||||||
| 			// @TODO | 			[$data, $proxy] = | ||||||
| 			// post data for next page | 				$this->backend->get( | ||||||
| 			$data = [ | 					$get["npt"], "images" | ||||||
| 				"source_url" => "/search/pins/?q=" . urlencode($search) . "&rs=typed", |  | ||||||
| 				"data" => |  | ||||||
| 					json_encode( |  | ||||||
| 						[ |  | ||||||
| 							// {"options":{"applied_filters":null,"appliedProductFilters":"---","article":null,"auto_correction_disabled":false,"corpus":null,"customized_rerank_type":null,"domains":null,"filters":null,"journey_depth":null,"page_size":null,"price_max":null,"price_min":null,"query_pin_sigs":null,"query":"higurashi","redux_normalize_feed":true,"rs":"typed","scope":"pins","selected_one_bar_modules":null,"source_id":null,"source_module_id":null,"top_pin_id":null,"bookmarks":["Y2JVSG81V2sxcmNHRlpWM1J5VFVad1ZsWlVRbXhpVmtreVZsZHpOV0pIU2tkV2FscFhVbXhhVkZreU1WSmtNREZWVjIxR1RrMXNTbEJXYlhSaFVtMVdjMVZ1U2xaaWEzQnpXVlJPVTJWV1pISlhhM1JYVm10V05sVldVbE5XVjBwMVVXMUdWVll6VFhoVWJYaFhWMVp3Ums1V1RsTmlSbGt5Vm10YWFtVkdWbkpOU0dSUFZsZG9XRmxzWkc5VlZscHlWbGhrYkdKR1NubFdWelZQWVVaYWRHVkVRbFppUmtwVVZrUktWMlJIVWtWV2JHaHBVakZLU0Zkc1pEUmtNVnBZVW10b2FsSXdXbkJXYlRWRFpHeGFSMWRzVG1oaGVrWllXV3RvVTFVeFpFaFZiRUpoVm5wRk1GbHFSbXRYVjA1R1YyczFWMVpHV2pSWFZtaDNVakZrY2sxWVRsaGlhM0JXV1ZSR1MyRkdiRlZTYm1SVVVteHdXbGxWVlRGVk1VbDVWRmhrVjAxdVVuWlVhMXBTWlVaT2MxcEhSbE5TTWswMVdtdGFWMU5YU2paVmJYaFRUVmhDUjFZeU5YZFVNVkY0VjJ0b1ZXRnJOVlpVVmxwTFVURndXR042VmxOV2ExcGFXVlZWTlZVeFNYZE5WRTVYVWtWYVZGWkhNVTlXTVU1WllVWk9hR1ZyV2s1WFZ6QXhZakpPVjFWWWFHRlNWbkJRVm14U1IwMUdXWGxOVkVKVlRWWnNORll5TURWV1YwVjVWV3hDV21FeGNETmFSVnByVjFkS1IyTkhhR2xYUjJkM1ZtdGFhMlF4VVhsVGJGcE9Wa1p3YjFwWGVFdFZWbFp4VW14YWJGWnRVbHBaTUdoTFZHMUtTR1ZJYUZkV2VrWjJWMVphU21ReVJYcGpSbFpwVW10d1RGZHJVa0pPVms1SFZHNVNUbFl3V2xoVmJYUldaVVpaZUZremFGUk5hM0JYVkZaYVYyRkZNSGxWYkVKYVlrWlZlRnBGV210WFIwNUpVMnMxVTFaR1dscFdWekI0VFVaV1IxTllaR3BUUlhCb1dWUkdWbVZHVm5SbFJuQnNZbFpKTWxSVlVYaFBSVGxGV1hwR1QyVnJSVEZVVlZKT1RrVXhSVkpVUWs5bGJFVXhWRmhzZDFOR1ZsWmtNMFp0VWpGYWIxZFhjRXBsUlRGSVZWaHdUbFl4YTNoVVZWSnFUVVUxV0ZadGFFOVNSVnB6Vkd0a1drMUdiRFpUVkVaT1pXMWplRmRzVWxkaFJuQllWVlJTVDJWdFRqWlVNVkpTWlZad2NWcEhkRTlsYTFwMFZGVlNhMkpWTVZWVFZFcE9Wa1pzTmxkWE1WSk9WVEYwVlcweFVGWXdXVFJXUjNSWFYwZGFRbEJVTVRoUFJHTXhUbnBCTlUxRVRUUk5SRVV3VG5wUk5VMTVjRWhWVlhkeFprUlZlRTlFVVRKWlZHc3lUMWRSTWsxVVVUSk9iVnBvV1RKWmVrNTZXWGhPTWs1cFQwUkZNVTlFVm1sTlZGcHBUV3BTYTFsWFRtcE9SR015VG1wVk5GbHFaR2haVjFacldWUmFiVmxxWkdoYVZGWnFUa1JXT0ZSclZsaG1RVDA5fFVIbzVhRkpYZUc1WFYyUlpWVEpHYkdGNk1XWk5ha1ptVFZSR09FOUVZekZPZWtFMVRVUk5ORTFFUlRCT2VsRTFUWGx3U0ZWVmQzRm1SMWw1VFZSUk1WbDZUVEJhUjFGNVQxZFNhVnB0VlRGT1JFVXdXVlJuZVU1cVRUUk5hbU40VDBSSk1VNXFWVEZOYlZwcVdsUnJlRTFFVVhwWmVsVjNXbXBvYkU1dFJYbE9ha0Y2VDFSSk5VMTZWVEJaYWtJNFZHdFdXR1pCUFQwPXxOb25lfDg3NTcwOTAzODAxNDc0OTMqR1FMKnwzMjM3YjM3ZGNhMGU3YjYyYzYzYzAyZGJkNGU1MjdlNzMyMTExMTNlMmUyMzEyOWM2MDAzYmU1ZTlmZjkwYjAwfE5FV3w="]},"context":{}} |  | ||||||
| 						] |  | ||||||
| 				); | 				); | ||||||
| 			]; | 			 | ||||||
|  | 			$data = json_decode($data, true); | ||||||
|  | 			 | ||||||
|  | 			$search = $data["q"]; | ||||||
|  | 			$cookies = $data["cookies"]; | ||||||
|  | 			 | ||||||
|  | 			try{ | ||||||
|  | 				$json = | ||||||
|  | 					$this->get( | ||||||
|  | 						$proxy, | ||||||
|  | 						"https://ca.pinterest.com/resource/BaseSearchResource/get/", | ||||||
|  | 						[ | ||||||
|  | 							"source_url" => "/search/pins/?q=" . urlencode($search) . "&rs=typed", | ||||||
|  | 							"data" => json_encode( | ||||||
|  | 								[ | ||||||
|  | 									"options" => [ | ||||||
|  | 										"applied_unified_filters" => null, | ||||||
|  | 										"appliedProductFilters" => "---", | ||||||
|  | 										"article" => null, | ||||||
|  | 										"auto_correction_disabled" => false, | ||||||
|  | 										"corpus" => null, | ||||||
|  | 										"customized_rerank_type" => null, | ||||||
|  | 										"domains" => null, | ||||||
|  | 										"dynamicPageSizeExpGroup" => null, | ||||||
|  | 										"filters" => null, | ||||||
|  | 										"journey_depth" => null, | ||||||
|  | 										"page_size" => null, | ||||||
|  | 										"price_max" => null, | ||||||
|  | 										"price_min" => null, | ||||||
|  | 										"query_pin_sigs" => null, | ||||||
|  | 										"query" => $data["q"], | ||||||
|  | 										"redux_normalize_feed" => true, | ||||||
|  | 										"request_params" => null, | ||||||
|  | 										"rs" => "typed", | ||||||
|  | 										"scope" => "pins", | ||||||
|  | 										"selected_one_bar_modules" => null, | ||||||
|  | 										"source_id" => null, | ||||||
|  | 										"source_module_id" => null, | ||||||
|  | 										"source_url" => "/search/pins/?q=" . urlencode($search) . "&rs=typed", | ||||||
|  | 										"top_pin_id" => null, | ||||||
|  | 										"top_pin_ids" => null, | ||||||
|  | 										"bookmarks" => [ | ||||||
|  | 											$data["bookmark"] | ||||||
|  | 										] | ||||||
|  | 									], | ||||||
|  | 									"context" => [] | ||||||
|  | 								], | ||||||
|  | 								JSON_UNESCAPED_SLASHES | ||||||
|  | 							) | ||||||
|  | 						], | ||||||
|  | 						$cookies, | ||||||
|  | 						$search | ||||||
|  | 					); | ||||||
|  | 				 | ||||||
|  | 			}catch(Exception $error){ | ||||||
|  | 				 | ||||||
|  | 				throw new Exception("Failed to fetch JSON"); | ||||||
|  | 			} | ||||||
| 			 | 			 | ||||||
| 		}else{ | 		}else{ | ||||||
| 			 | 			 | ||||||
| @@ -82,26 +226,44 @@ class pinterest{ | |||||||
| 				throw new Exception("Search term is empty!"); | 				throw new Exception("Search term is empty!"); | ||||||
| 			} | 			} | ||||||
| 						 | 						 | ||||||
|  | 			// https://ca.pinterest.com/resource/BaseSearchResource/get/?source_url=%2Fsearch%2Fpins%2F%3Feq%3Dhigurashi%26etslf%3D5966%26len%3D2%26q%3Dhigurashi%2520when%2520they%2520cry%26rs%3Dac&data=%7B%22options%22%3A%7B%22applied_unified_filters%22%3Anull%2C%22appliedProductFilters%22%3A%22---%22%2C%22article%22%3Anull%2C%22auto_correction_disabled%22%3Afalse%2C%22corpus%22%3Anull%2C%22customized_rerank_type%22%3Anull%2C%22domains%22%3Anull%2C%22dynamicPageSizeExpGroup%22%3Anull%2C%22filters%22%3Anull%2C%22journey_depth%22%3Anull%2C%22page_size%22%3Anull%2C%22price_max%22%3Anull%2C%22price_min%22%3Anull%2C%22query_pin_sigs%22%3Anull%2C%22query%22%3A%22higurashi%20when%20they%20cry%22%2C%22redux_normalize_feed%22%3Atrue%2C%22request_params%22%3Anull%2C%22rs%22%3A%22ac%22%2C%22scope%22%3A%22pins%22%2C%22selected_one_bar_modules%22%3Anull%2C%22source_id%22%3Anull%2C%22source_module_id%22%3Anull%2C%22source_url%22%3A%22%2Fsearch%2Fpins%2F%3Feq%3Dhigurashi%26etslf%3D5966%26len%3D2%26q%3Dhigurashi%2520when%2520they%2520cry%26rs%3Dac%22%2C%22top_pin_id%22%3Anull%2C%22top_pin_ids%22%3Anull%7D%2C%22context%22%3A%7B%7D%7D&_=1736116313987 | ||||||
|  | 			// source_url=%2Fsearch%2Fpins%2F%3Feq%3Dhigurashi%26etslf%3D5966%26len%3D2%26q%3Dhigurashi%2520when%2520they%2520cry%26rs%3Dac | ||||||
|  | 			// &data=%7B%22options%22%3A%7B%22applied_unified_filters%22%3Anull%2C%22appliedProductFilters%22%3A%22---%22%2C%22article%22%3Anull%2C%22auto_correction_disabled%22%3Afalse%2C%22corpus%22%3Anull%2C%22customized_rerank_type%22%3Anull%2C%22domains%22%3Anull%2C%22dynamicPageSizeExpGroup%22%3Anull%2C%22filters%22%3Anull%2C%22journey_depth%22%3Anull%2C%22page_size%22%3Anull%2C%22price_max%22%3Anull%2C%22price_min%22%3Anull%2C%22query_pin_sigs%22%3Anull%2C%22query%22%3A%22higurashi%20when%20they%20cry%22%2C%22redux_normalize_feed%22%3Atrue%2C%22request_params%22%3Anull%2C%22rs%22%3A%22ac%22%2C%22scope%22%3A%22pins%22%2C%22selected_one_bar_modules%22%3Anull%2C%22source_id%22%3Anull%2C%22source_module_id%22%3Anull%2C%22source_url%22%3A%22%2Fsearch%2Fpins%2F%3Feq%3Dhigurashi%26etslf%3D5966%26len%3D2%26q%3Dhigurashi%2520when%2520they%2520cry%26rs%3Dac%22%2C%22top_pin_id%22%3Anull%2C%22top_pin_ids%22%3Anull%7D%2C%22context%22%3A%7B%7D%7D | ||||||
|  | 			// &_=1736116313987 | ||||||
|  | 			 | ||||||
|  | 			$source_url = "/search/pins/?q=" . urlencode($search) . "&rs=" . urlencode($search); | ||||||
|  | 			 | ||||||
| 			$filter = [ | 			$filter = [ | ||||||
| 				"source_url" => "/search/pins/?q=" . urlencode($search), | 				"source_url" => $source_url, | ||||||
| 				"rs" => "typed", | 				"rs" => "typed", | ||||||
| 				"data" => | 				"data" => | ||||||
| 					json_encode( | 					json_encode( | ||||||
| 						[ | 						[ | ||||||
| 							"options" => [ | 							"options" => [ | ||||||
| 								"article" => null, | 								"applied_unified_filters" => null, | ||||||
| 								"applied_filters" => null, |  | ||||||
| 								"appliedProductFilters" => "---", | 								"appliedProductFilters" => "---", | ||||||
| 								"auto_correction_disabled" => false, | 								"article" => null, | ||||||
| 								"corpus" => null, | 								"corpus" => null, | ||||||
| 								"customized_rerank_type" => null, | 								"customized_rerank_type" => null, | ||||||
|  | 								"domains" => null, | ||||||
|  | 								"dynamicPageSizeExpGroup" => null, | ||||||
| 								"filters" => null, | 								"filters" => null, | ||||||
| 								"query" => $search, | 								"journey_depth" => null, | ||||||
|  | 								"page_size" => null, | ||||||
|  | 								"price_max" => null, | ||||||
|  | 								"price_min" => null, | ||||||
| 								"query_pin_sigs" => null, | 								"query_pin_sigs" => null, | ||||||
|  | 								"query" => $search, | ||||||
| 								"redux_normalize_feed" => true, | 								"redux_normalize_feed" => true, | ||||||
| 								"rs" => "typed", | 								"request_params" => null, | ||||||
|  | 								"rs" => "ac", | ||||||
| 								"scope" => "pins", // pins, boards, videos,  | 								"scope" => "pins", // pins, boards, videos,  | ||||||
| 								"source_id" => null | 								"selected_one_bar_modules" => null, | ||||||
|  | 								"source_id" => null, | ||||||
|  | 								"source_module_id" => null, | ||||||
|  | 								"source_url" => $source_url, | ||||||
|  | 								"top_pin_id" => null, | ||||||
|  | 								"top_pin_ids" => null | ||||||
| 							], | 							], | ||||||
| 							"context" => [] | 							"context" => [] | ||||||
| 						] | 						] | ||||||
| @@ -110,23 +272,25 @@ class pinterest{ | |||||||
| 			]; | 			]; | ||||||
| 			 | 			 | ||||||
| 			$proxy = $this->backend->get_ip(); | 			$proxy = $this->backend->get_ip(); | ||||||
| 		} | 			$cookies = []; | ||||||
| 			 | 			 | ||||||
| 			try{ | 			try{ | ||||||
| 				$json = | 				$json = | ||||||
| 				json_decode( |  | ||||||
| 					$this->get( | 					$this->get( | ||||||
| 						$proxy, | 						$proxy, | ||||||
| 						"https://www.pinterest.ca/resource/BaseSearchResource/get/", | 						"https://ca.pinterest.com/resource/BaseSearchResource/get/", | ||||||
| 						$filter | 						$filter, | ||||||
| 					), | 						$cookies, | ||||||
| 					true | 						null | ||||||
| 					); | 					); | ||||||
| 				 | 				 | ||||||
| 			}catch(Exception $error){ | 			}catch(Exception $error){ | ||||||
| 				 | 				 | ||||||
| 				throw new Exception("Failed to fetch JSON"); | 				throw new Exception("Failed to fetch JSON"); | ||||||
| 			} | 			} | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		$json = json_decode($json, true); | ||||||
| 		 | 		 | ||||||
| 		if($json === null){ | 		if($json === null){ | ||||||
| 			 | 			 | ||||||
| @@ -139,6 +303,60 @@ class pinterest{ | |||||||
| 			"image" => [] | 			"image" => [] | ||||||
| 		]; | 		]; | ||||||
| 		 | 		 | ||||||
|  | 		if( | ||||||
|  | 			!isset( | ||||||
|  | 				$json["resource_response"] | ||||||
|  | 				["status"] | ||||||
|  | 			) | ||||||
|  | 		){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("Unknown API failure"); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		if($json["resource_response"]["status"] != "success"){ | ||||||
|  | 			 | ||||||
|  | 			$status = "Got non-OK response: " . $json["resource_response"]["status"]; | ||||||
|  | 			 | ||||||
|  | 			if( | ||||||
|  | 				isset( | ||||||
|  | 					$json["resource_response"]["message"] | ||||||
|  | 				) | ||||||
|  | 			){ | ||||||
|  | 				 | ||||||
|  | 				$status .= " - " . $json["resource_response"]["message"]; | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			throw new Exception($status); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		if( | ||||||
|  | 			isset( | ||||||
|  | 				$json["resource_response"]["sensitivity"] | ||||||
|  | 				["notices"][0]["description"]["text"] | ||||||
|  | 			) | ||||||
|  | 		){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception( | ||||||
|  | 				"Pinterest returned a notice: " . | ||||||
|  | 				$json["resource_response"]["sensitivity"]["notices"][0]["description"]["text"] | ||||||
|  | 			); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		// get NPT | ||||||
|  | 		if(isset($json["resource_response"]["bookmark"])){ | ||||||
|  | 			 | ||||||
|  | 			$out["npt"] = | ||||||
|  | 				$this->backend->store( | ||||||
|  | 					json_encode([ | ||||||
|  | 						"q" => $search, | ||||||
|  | 						"bookmark" => $json["resource_response"]["bookmark"], | ||||||
|  | 						"cookies" => $cookies | ||||||
|  | 					]), | ||||||
|  | 					"images", | ||||||
|  | 					$proxy | ||||||
|  | 				); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
| 		foreach( | 		foreach( | ||||||
| 			$json | 			$json | ||||||
| 			["resource_response"] | 			["resource_response"] | ||||||
| @@ -150,6 +368,7 @@ class pinterest{ | |||||||
| 			switch($item["type"]){ | 			switch($item["type"]){ | ||||||
| 				 | 				 | ||||||
| 				case "pin": | 				case "pin": | ||||||
|  | 				case "board": | ||||||
| 					 | 					 | ||||||
| 					/* | 					/* | ||||||
| 						Handle image object | 						Handle image object | ||||||
| @@ -206,42 +425,15 @@ class pinterest{ | |||||||
| 								"height" => (int)$thumb["height"] | 								"height" => (int)$thumb["height"] | ||||||
| 							] | 							] | ||||||
| 						], | 						], | ||||||
| 						"url" => "https://www.pinterest.com/pin/" . $item["id"] |  | ||||||
| 					]; |  | ||||||
| 					break; |  | ||||||
| 				 |  | ||||||
| 				case "board": |  | ||||||
| 					if(isset($item["cover_pin"]["image_url"])){ |  | ||||||
| 						 |  | ||||||
| 						$image = [ |  | ||||||
| 							"url" => $item["cover_pin"]["image_url"], |  | ||||||
| 							"width" => (int)$item["cover_pin"]["size"][0], |  | ||||||
| 							"height" => (int)$item["cover_pin"]["size"][1] |  | ||||||
| 						]; |  | ||||||
| 					}elseif(isset($item["image_cover_url_hd"])){ |  | ||||||
| 						/* |  | ||||||
| 						$image = [ |  | ||||||
| 						"url" => | 						"url" => | ||||||
| 							"width" => null, | 							$item["link"] === null ? | ||||||
| 							"height" => null | 							"https://ca.pinterest.com/pin/" . $item["id"] : | ||||||
| 						];*/ | 							$item["link"] | ||||||
| 					} | 					]; | ||||||
| 					break; | 					break; | ||||||
| 			} | 			} | ||||||
| 		} | 		} | ||||||
| 		 | 		 | ||||||
| 		return $out; | 		return $out; | ||||||
| 	} | 	} | ||||||
| 	 |  | ||||||
| 	private function getfullresimage($image, $has_og){ |  | ||||||
| 		 |  | ||||||
| 		$has_og = $has_og ? "1200x" : "originals"; |  | ||||||
| 		 |  | ||||||
| 		return |  | ||||||
| 			preg_replace( |  | ||||||
| 				'/https:\/\/i\.pinimg\.com\/[^\/]+\//', |  | ||||||
| 				"https://i.pinimg.com/" . $has_og . "/", |  | ||||||
| 				$image |  | ||||||
| 			); |  | ||||||
| 	} |  | ||||||
| } | } | ||||||
|   | |||||||
| @@ -410,10 +410,7 @@ class qwant{ | |||||||
| 					"thumb" => | 					"thumb" => | ||||||
| 						$answer["data"]["result"]["thumbnail"]["landscape"] == null ? | 						$answer["data"]["result"]["thumbnail"]["landscape"] == null ? | ||||||
| 						null : | 						null : | ||||||
| 						$this->unshitimage( | 						$this->unshitimage($answer["data"]["result"]["thumbnail"]["landscape"]), | ||||||
| 							$answer["data"]["result"]["thumbnail"]["landscape"], |  | ||||||
| 							false |  | ||||||
| 						), |  | ||||||
| 					"table" => [], | 					"table" => [], | ||||||
| 					"sublink" => [] | 					"sublink" => [] | ||||||
| 				]; | 				]; | ||||||
| @@ -770,7 +767,7 @@ class qwant{ | |||||||
| 			}else{ | 			}else{ | ||||||
| 				 | 				 | ||||||
| 				$thumb = [ | 				$thumb = [ | ||||||
| 					"url" => $this->unshitimage($video["thumbnail"], false), | 					"url" => $this->unshitimage($video["thumbnail"]), | ||||||
| 					"ratio" => "16:9" | 					"ratio" => "16:9" | ||||||
| 				]; | 				]; | ||||||
| 			} | 			} | ||||||
| @@ -870,7 +867,7 @@ class qwant{ | |||||||
| 			}else{ | 			}else{ | ||||||
| 				 | 				 | ||||||
| 				$thumb = [ | 				$thumb = [ | ||||||
| 					"url" => $this->unshitimage($news["media"][0]["pict_big"]["url"], false), | 					"url" => $this->unshitimage($news["media"][0]["pict_big"]["url"]), | ||||||
| 					"ratio" => "16:9" | 					"ratio" => "16:9" | ||||||
| 				]; | 				]; | ||||||
| 			} | 			} | ||||||
| @@ -920,18 +917,77 @@ class qwant{ | |||||||
| 		return trim($text, ". "); | 		return trim($text, ". "); | ||||||
| 	} | 	} | ||||||
| 	 | 	 | ||||||
| 	private function unshitimage($url, $is_bing = true){ | 	private function unshitimage($url){ | ||||||
| 		 | 		 | ||||||
| 		// https://s1.qwant.com/thumbr/0x0/8/d/f6de4deb2c2b12f55d8bdcaae576f9f62fd58a05ec0feeac117b354d1bf5c2/th.jpg?u=https%3A%2F%2Fwww.bing.com%2Fth%3Fid%3DOIP.vvDWsagzxjoKKP_rOqhwrQAAAA%26w%3D160%26h%3D160%26c%3D7%26pid%3D5.1&q=0&b=1&p=0&a=0 | 		// https://s1.qwant.com/thumbr/0x0/8/d/f6de4deb2c2b12f55d8bdcaae576f9f62fd58a05ec0feeac117b354d1bf5c2/th.jpg?u=https%3A%2F%2Fwww.bing.com%2Fth%3Fid%3DOIP.vvDWsagzxjoKKP_rOqhwrQAAAA%26w%3D160%26h%3D160%26c%3D7%26pid%3D5.1&q=0&b=1&p=0&a=0 | ||||||
| 		parse_str(parse_url($url)["query"], $parts); | 		// https://s2.qwant.com/thumbr/474x289/7/f/412d13b3fe3a03eb2b89633c8e88b609b7d0b93cdd9a5e52db3c663e41e65e/th.jpg?u=https%3A%2F%2Ftse.mm.bing.net%2Fth%3Fid%3DOIP.9Tm_Eo6m7V7ltN19mxduDgHaEh%26pid%3DApi&q=0&b=1&p=0&a=0 | ||||||
| 		 | 		 | ||||||
| 		if($is_bing){ | 		$image = parse_url($url); | ||||||
| 			$parse = parse_url($parts["u"]); |  | ||||||
| 			parse_str($parse["query"], $parts); |  | ||||||
| 		 | 		 | ||||||
| 			return "https://" . $parse["host"] . "/th?id=" . urlencode($parts["id"]); | 		if( | ||||||
|  | 			!isset($image["host"]) || | ||||||
|  | 			!isset($image["query"]) | ||||||
|  | 		){ | ||||||
|  | 			 | ||||||
|  | 			// cant do anything | ||||||
|  | 			return $url; | ||||||
| 		} | 		} | ||||||
| 		 | 		 | ||||||
| 		return $parts["u"]; | 		$id = null; | ||||||
|  | 		 | ||||||
|  | 		if( | ||||||
|  | 			preg_match( | ||||||
|  | 				'/s[0-9]+\.qwant\.com$/', | ||||||
|  | 				$image["host"] | ||||||
|  | 			) | ||||||
|  | 		){ | ||||||
|  | 			 | ||||||
|  | 			parse_str($image["query"], $str); | ||||||
|  | 			 | ||||||
|  | 			// we're being served a proxy URL | ||||||
|  | 			if(isset($str["u"])){ | ||||||
|  | 				 | ||||||
|  | 				$bing_url = $str["u"]; | ||||||
|  | 			}else{ | ||||||
|  | 				 | ||||||
|  | 				// give up | ||||||
|  | 				return $url; | ||||||
|  | 			} | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		// parse bing URL | ||||||
|  | 		$id = null; | ||||||
|  | 		$image = parse_url($bing_url); | ||||||
|  | 		 | ||||||
|  | 		if(isset($image["query"])){ | ||||||
|  | 			 | ||||||
|  | 			parse_str($image["query"], $str); | ||||||
|  | 			 | ||||||
|  | 			if(isset($str["id"])){ | ||||||
|  | 				 | ||||||
|  | 				$id = $str["id"]; | ||||||
|  | 			} | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		if($id === null){ | ||||||
|  | 			 | ||||||
|  | 			$id = explode("/th/id/", $image["path"], 2); | ||||||
|  | 			 | ||||||
|  | 			if(count($id) !== 2){ | ||||||
|  | 				 | ||||||
|  | 				// malformed | ||||||
|  | 				return $url; | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			$id = $id[1]; | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		if(is_array($id)){ | ||||||
|  | 			 | ||||||
|  | 			// fuck off, let proxy.php deal with it | ||||||
|  | 			return $url; | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		return "https://" . $image["host"] . "/th?id=" . rawurlencode($id); | ||||||
| 	} | 	} | ||||||
| } | } | ||||||
|   | |||||||
							
								
								
									
										541
									
								
								scraper/sepiasearch.php
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										541
									
								
								scraper/sepiasearch.php
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,541 @@ | |||||||
|  | <?php | ||||||
|  |  | ||||||
|  | class sepiasearch{ | ||||||
|  | 	 | ||||||
|  | 	public function __construct(){ | ||||||
|  | 		 | ||||||
|  | 		include "lib/backend.php"; | ||||||
|  | 		$this->backend = new backend("sepiasearch"); | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	public function getfilters($page){ | ||||||
|  | 		 | ||||||
|  | 		return [ | ||||||
|  | 			"nsfw" => [ | ||||||
|  | 				"display" => "NSFW", | ||||||
|  | 				"option" => [ | ||||||
|  | 					"yes" => "Yes", // &sensitiveContent=both | ||||||
|  | 					"no" => "No" // &sensitiveContent=false | ||||||
|  | 				] | ||||||
|  | 			], | ||||||
|  | 			"language" => [ | ||||||
|  | 				"display" => "Language", // &language= | ||||||
|  | 				"option" => [ | ||||||
|  | 					"any" => "Any language", | ||||||
|  | 					"en" => "English", | ||||||
|  | 					"fr" => "Français", | ||||||
|  | 					"ar" => "العربية", | ||||||
|  | 					"ca" => "Català", | ||||||
|  | 					"cs" => "Čeština", | ||||||
|  | 					"de" => "Deutsch", | ||||||
|  | 					"el" => "ελληνικά", | ||||||
|  | 					"eo" => "Esperanto", | ||||||
|  | 					"es" => "Español", | ||||||
|  | 					"eu" => "Euskara", | ||||||
|  | 					"fa" => "فارسی", | ||||||
|  | 					"fi" => "Suomi", | ||||||
|  | 					"gd" => "Gàidhlig", | ||||||
|  | 					"gl" => "Galego", | ||||||
|  | 					"hr" => "Hrvatski", | ||||||
|  | 					"hu" => "Magyar", | ||||||
|  | 					"is" => "Íslenska", | ||||||
|  | 					"it" => "Italiano", | ||||||
|  | 					"ja" => "日本語", | ||||||
|  | 					"kab" => "Taqbaylit", | ||||||
|  | 					"nl" => "Nederlands", | ||||||
|  | 					"no" => "Norsk", | ||||||
|  | 					"oc" => "Occitan", | ||||||
|  | 					"pl" => "Polski", | ||||||
|  | 					"pt" => "Português (Brasil)", | ||||||
|  | 					"pt-PT" => "Português (Portugal)", | ||||||
|  | 					"ru" => "Pусский", | ||||||
|  | 					"sk" => "Slovenčina", | ||||||
|  | 					"sq" => "Shqip", | ||||||
|  | 					"sv" => "Svenska", | ||||||
|  | 					"th" => "ไทย", | ||||||
|  | 					"tok" => "Toki Pona", | ||||||
|  | 					"tr" => "Türkçe", | ||||||
|  | 					"uk" => "украї́нська мо́ва", | ||||||
|  | 					"vi" => "Tiếng Việt", | ||||||
|  | 					"zh-Hans" => "简体中文(中国)", | ||||||
|  | 					"zh-Hant" => "繁體中文(台灣)" | ||||||
|  | 				] | ||||||
|  | 			], | ||||||
|  | 			"type" => [ | ||||||
|  | 				"display" => "Result type", // i handle this | ||||||
|  | 				"option" => [ | ||||||
|  | 					"videos" => "Videos", | ||||||
|  | 					"playlists" => "Playlists", | ||||||
|  | 					"channels" => "Channels" | ||||||
|  | 				] | ||||||
|  | 			], | ||||||
|  | 			"sort" => [ | ||||||
|  | 				"display" => "Sort by", | ||||||
|  | 				"option" => [ | ||||||
|  | 					"best" => "Best match", // no filter | ||||||
|  | 					"-publishedAt" => "Newest", // sort=-publishedAt | ||||||
|  | 					"publishedAt" => "Oldest" // sort=publishedAt | ||||||
|  | 				] | ||||||
|  | 			], | ||||||
|  | 			"newer" => [ // &startDate=2025-07-26T04:00:00.000Z | ||||||
|  | 				"display" => "Newer than", | ||||||
|  | 				"option" => "_DATE" | ||||||
|  | 			], | ||||||
|  | 			"duration" => [ | ||||||
|  | 				"display" => "Duration", | ||||||
|  | 				"option" => [ | ||||||
|  | 					"any" => "Any duration", | ||||||
|  | 					"short" => "Short (0-4mins)", // &durationRange=short | ||||||
|  | 					"medium" => "Medium (4-10 mins)", | ||||||
|  | 					"long" => "Long (10+ mins)", | ||||||
|  | 				] | ||||||
|  | 			], | ||||||
|  | 			"category" => [ | ||||||
|  | 				"display" => "Category", // &categoryOneOf[]= | ||||||
|  | 				"option" => [ | ||||||
|  | 					"any" => "Any category", | ||||||
|  | 					"1" => "Music", | ||||||
|  | 					"2" => "Films", | ||||||
|  | 					"3" => "Vehicles", | ||||||
|  | 					"4" => "Art", | ||||||
|  | 					"5" => "Sports", | ||||||
|  | 					"6" => "Travels", | ||||||
|  | 					"7" => "Gaming", | ||||||
|  | 					"8" => "People", | ||||||
|  | 					"9" => "Comedy", | ||||||
|  | 					"10" => "Entertainment", | ||||||
|  | 					"11" => "News & Politics", | ||||||
|  | 					"12" => "How To", | ||||||
|  | 					"13" => "Education", | ||||||
|  | 					"14" => "Activism", | ||||||
|  | 					"15" => "Science & Technology", | ||||||
|  | 					"16" => "Animals", | ||||||
|  | 					"17" => "Kids", | ||||||
|  | 					"18" => "Food" | ||||||
|  | 				] | ||||||
|  | 			], | ||||||
|  | 			"display" => [ | ||||||
|  | 				"display" => "Display", | ||||||
|  | 				"option" => [ | ||||||
|  | 					"any" => "Everything", | ||||||
|  | 					"true" => "Live videos", // &isLive=true | ||||||
|  | 					"false" => "VODs" // &isLive=false | ||||||
|  | 				] | ||||||
|  | 			], | ||||||
|  | 			"license" => [ | ||||||
|  | 				"display" => "License", // &license= | ||||||
|  | 				"option" => [ | ||||||
|  | 					"any" => "Any license", | ||||||
|  | 					"1" => "Attribution", | ||||||
|  | 					"2" => "Attribution - Share Alike", | ||||||
|  | 					"3" => "Attribution - No Derivatives", | ||||||
|  | 					"4" => "Attribution - Non Commercial", | ||||||
|  | 					"5" => "Attribution - Non Commercial - Share Alike", | ||||||
|  | 					"6" => "Attribution - Non Commercial - No Derivatives", | ||||||
|  | 					"7" => "Public Domain Dedication" | ||||||
|  | 				] | ||||||
|  | 			] | ||||||
|  | 		]; | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	private function get($proxy, $url, $get = []){ | ||||||
|  | 		 | ||||||
|  | 		$curlproc = curl_init(); | ||||||
|  | 		 | ||||||
|  | 		if($get !== []){ | ||||||
|  | 			$get = http_build_query($get); | ||||||
|  | 			$url .= "?" . $get; | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_URL, $url); | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_ENCODING, ""); // default encoding | ||||||
|  | 		 | ||||||
|  | 		curl_setopt( | ||||||
|  | 			$curlproc, | ||||||
|  | 			CURLOPT_HTTPHEADER, | ||||||
|  | 			["User-Agent: " . config::USER_AGENT, | ||||||
|  | 			"Accept: application/json, text/plain, */*", | ||||||
|  | 			"Accept-Language: en-US,en;q=0.5", | ||||||
|  | 			"Accept-Encoding: gzip, deflate, br, zstd", | ||||||
|  | 			"DNT: 1", | ||||||
|  | 			"Sec-GPC: 1", | ||||||
|  | 			"Connection: keep-alive", | ||||||
|  | 			"Referer: https://sepiasearch.org/search", | ||||||
|  | 			"Sec-Fetch-Dest: empty", | ||||||
|  | 			"Sec-Fetch-Mode: cors", | ||||||
|  | 			"Sec-Fetch-Site: same-origin", | ||||||
|  | 			"Priority: u=0", | ||||||
|  | 			"TE: trailers"] | ||||||
|  | 		); | ||||||
|  | 		 | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_RETURNTRANSFER, true); | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_SSL_VERIFYHOST, 2); | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_SSL_VERIFYPEER, true); | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_CONNECTTIMEOUT, 30); | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_TIMEOUT, 30); | ||||||
|  |  | ||||||
|  | 		$this->backend->assign_proxy($curlproc, $proxy); | ||||||
|  | 		 | ||||||
|  | 		$data = curl_exec($curlproc); | ||||||
|  | 		 | ||||||
|  | 		if(curl_errno($curlproc)){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception(curl_error($curlproc)); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		curl_close($curlproc); | ||||||
|  | 		return $data; | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	public function video($get){ | ||||||
|  | 		 | ||||||
|  | 		if($get["npt"]){ | ||||||
|  | 			 | ||||||
|  | 			[$npt, $proxy] = | ||||||
|  | 				$this->backend | ||||||
|  | 				->get( | ||||||
|  | 					$get["npt"], | ||||||
|  | 					"videos" | ||||||
|  | 				); | ||||||
|  | 			 | ||||||
|  | 			$npt = json_decode($npt, true); | ||||||
|  | 			$type = $npt["type"]; | ||||||
|  | 			$npt = $npt["npt"]; | ||||||
|  | 		}else{ | ||||||
|  | 			 | ||||||
|  | 			$proxy = $this->backend->get_ip(); | ||||||
|  | 						 | ||||||
|  | 			$npt = [ | ||||||
|  | 				"search" => $get["s"], | ||||||
|  | 				"start" => 0, | ||||||
|  | 				"count" => 20 | ||||||
|  | 			]; | ||||||
|  | 			 | ||||||
|  | 			if($get["type"] == "videos"){ | ||||||
|  | 				 | ||||||
|  | 				// | ||||||
|  | 				// Parse video filters | ||||||
|  | 				// | ||||||
|  | 				switch($get["nsfw"]){ | ||||||
|  | 					 | ||||||
|  | 					case "yes": $npt["nsfw"] = "both"; break; | ||||||
|  | 					case "no": $npt["nsfw"] = "false"; break; | ||||||
|  | 				} | ||||||
|  | 				 | ||||||
|  | 				$npt["boostLanguages[]"] = "en"; | ||||||
|  | 				if($get["language"] != "any"){ | ||||||
|  | 					 | ||||||
|  | 					$npt["languageOneOf[]"] = $get["language"]; | ||||||
|  | 				} | ||||||
|  | 				 | ||||||
|  | 				if($get["sort"] != "best"){ | ||||||
|  | 					 | ||||||
|  | 					$npt["sort"] = $get["sort"]; | ||||||
|  | 				} | ||||||
|  | 				 | ||||||
|  | 				if($get["newer"] !== false){ | ||||||
|  | 					 | ||||||
|  | 					$date = new DateTime("@{$get["newer"]}"); | ||||||
|  | 					$date->setTimezone(new DateTimeZone("UTC")); | ||||||
|  | 					$formatted = $date->format("Y-m-d\TH:i:s.000\Z"); | ||||||
|  | 					 | ||||||
|  | 					$npt["startDate"] = $formatted; | ||||||
|  | 				} | ||||||
|  | 				 | ||||||
|  | 				switch($get["duration"]){ | ||||||
|  | 					 | ||||||
|  | 					case "short": | ||||||
|  | 						$npt["durationMax"] = 240; | ||||||
|  | 						break; | ||||||
|  | 					 | ||||||
|  | 					case "medium": | ||||||
|  | 						$npt["durationMin"] = 240; | ||||||
|  | 						$npt["durationMax"] = 600; | ||||||
|  | 						break; | ||||||
|  | 					 | ||||||
|  | 					case "long": | ||||||
|  | 						$npt["durationMin"] = 600; | ||||||
|  | 						break; | ||||||
|  | 				} | ||||||
|  | 				 | ||||||
|  | 				if($get["category"] != "any"){ | ||||||
|  | 					 | ||||||
|  | 					$npt["categoryOneOf[]"] = $get["category"]; | ||||||
|  | 				} | ||||||
|  | 				 | ||||||
|  | 				if($get["display"] != "any"){ | ||||||
|  | 					 | ||||||
|  | 					$npt["isLive"] = $get["display"]; | ||||||
|  | 				} | ||||||
|  | 				 | ||||||
|  | 				if($get["license"] != "any"){ | ||||||
|  | 					 | ||||||
|  | 					// typo in license, lol | ||||||
|  | 					$npt["licenceOneOf[]"] = $get["license"]; | ||||||
|  | 				} | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			$type = $get["type"]; | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		switch($type){ | ||||||
|  | 			 | ||||||
|  | 			case "videos": | ||||||
|  | 				$url = "https://sepiasearch.org/api/v1/search/videos"; | ||||||
|  | 				break; | ||||||
|  | 			 | ||||||
|  | 			case "channels": | ||||||
|  | 				$url = "https://sepiasearch.org/api/v1/search/video-channels"; | ||||||
|  | 				break; | ||||||
|  | 			 | ||||||
|  | 			case "playlists": | ||||||
|  | 				$url = "https://sepiasearch.org/api/v1/search/video-playlists"; | ||||||
|  | 				break; | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		//$json = file_get_contents("scraper/sepia.json"); | ||||||
|  | 		try{ | ||||||
|  | 			 | ||||||
|  | 			$json = | ||||||
|  | 				$this->get( | ||||||
|  | 					$proxy, | ||||||
|  | 					$url, | ||||||
|  | 					$npt | ||||||
|  | 				); | ||||||
|  | 		}catch(Exception $error){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("Failed to fetch JSON"); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		$json = json_decode($json, true); | ||||||
|  | 		 | ||||||
|  | 		if($json === null){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("Failed to parse JSON"); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		if(isset($json["errors"])){ | ||||||
|  | 			 | ||||||
|  | 			$msg = []; | ||||||
|  | 			foreach($json["errors"] as $error){ | ||||||
|  | 				 | ||||||
|  | 				if(isset($error["msg"])){ | ||||||
|  | 					 | ||||||
|  | 					$msg[] = $error["msg"]; | ||||||
|  | 				} | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("Sepia Search returned error(s): " . implode(", ", $msg)); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		if(!isset($json["data"])){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("Sepia Search did not return a data object"); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		$out = [ | ||||||
|  | 			"status" => "ok", | ||||||
|  | 			"npt" => null, | ||||||
|  | 			"video" => [], | ||||||
|  | 			"author" => [], | ||||||
|  | 			"livestream" => [], | ||||||
|  | 			"playlist" => [], | ||||||
|  | 			"reel" => [] | ||||||
|  | 		]; | ||||||
|  | 		 | ||||||
|  | 		 | ||||||
|  | 		switch($get["type"]){ | ||||||
|  | 			 | ||||||
|  | 			case "videos": | ||||||
|  | 				foreach($json["data"] as $video){ | ||||||
|  | 					 | ||||||
|  | 					if(count($video["account"]["avatars"]) !== 0){ | ||||||
|  | 						 | ||||||
|  | 						$avatar = | ||||||
|  | 							$video["account"]["avatars"][count($video["account"]["avatars"]) - 1]["url"]; | ||||||
|  | 					}else{ | ||||||
|  | 						 | ||||||
|  | 						$avatar = null; | ||||||
|  | 					} | ||||||
|  | 					 | ||||||
|  | 					if($video["thumbnailUrl"] === null){ | ||||||
|  | 						 | ||||||
|  | 						$thumb = [ | ||||||
|  | 							"ratio" => null, | ||||||
|  | 							"url" => null | ||||||
|  | 						]; | ||||||
|  | 					}else{ | ||||||
|  | 						 | ||||||
|  | 						$thumb  = [ | ||||||
|  | 							"ratio" => "16:9", | ||||||
|  | 							"url" => $video["thumbnailUrl"] | ||||||
|  | 						]; | ||||||
|  | 					} | ||||||
|  | 					 | ||||||
|  | 					if($video["isLive"]){ | ||||||
|  | 						 | ||||||
|  | 						$append = "livestream"; | ||||||
|  | 					}else{ | ||||||
|  | 						 | ||||||
|  | 						$append = "video"; | ||||||
|  | 					} | ||||||
|  | 					 | ||||||
|  | 					$out[$append][] = [ | ||||||
|  | 						"title" => $video["name"], | ||||||
|  | 						"description" => | ||||||
|  | 							$this->limitstrlen( | ||||||
|  | 								$this->titledots( | ||||||
|  | 									$video["description"] | ||||||
|  | 								) | ||||||
|  | 							), | ||||||
|  | 						"author" => [ | ||||||
|  | 							"name" => $video["account"]["displayName"] . " ({$video["account"]["name"]})", | ||||||
|  | 							"url" => $video["account"]["url"], | ||||||
|  | 							"avatar" => $avatar | ||||||
|  | 						], | ||||||
|  | 						"date" => strtotime($video["publishedAt"]), | ||||||
|  | 						"duration" => $video["isLive"] ? "_LIVE" : $video["duration"], | ||||||
|  | 						"views" => $video["views"], | ||||||
|  | 						"thumb" => $thumb, | ||||||
|  | 						"url" => $video["url"] | ||||||
|  | 					]; | ||||||
|  | 				} | ||||||
|  | 				break; | ||||||
|  | 			 | ||||||
|  | 			case "playlists": | ||||||
|  | 				foreach($json["data"] as $playlist){ | ||||||
|  | 					 | ||||||
|  | 					if(count($playlist["ownerAccount"]["avatars"]) !== 0){ | ||||||
|  | 						 | ||||||
|  | 						$avatar = | ||||||
|  | 							$playlist["ownerAccount"]["avatars"][count($playlist["ownerAccount"]["avatars"]) - 1]["url"]; | ||||||
|  | 					}else{ | ||||||
|  | 						 | ||||||
|  | 						$avatar = null; | ||||||
|  | 					} | ||||||
|  | 					 | ||||||
|  | 					if($playlist["thumbnailUrl"] === null){ | ||||||
|  | 						 | ||||||
|  | 						$thumb = [ | ||||||
|  | 							"ratio" => null, | ||||||
|  | 							"url" => null | ||||||
|  | 						]; | ||||||
|  | 					}else{ | ||||||
|  | 						 | ||||||
|  | 						$thumb  = [ | ||||||
|  | 							"ratio" => "16:9", | ||||||
|  | 							"url" => $playlist["thumbnailUrl"] | ||||||
|  | 						]; | ||||||
|  | 					} | ||||||
|  | 					 | ||||||
|  | 					$out["playlist"][] = [ | ||||||
|  | 						"title" => $playlist["displayName"], | ||||||
|  | 						"description" => | ||||||
|  | 							$this->limitstrlen( | ||||||
|  | 								$this->titledots( | ||||||
|  | 									$playlist["description"] | ||||||
|  | 								) | ||||||
|  | 							), | ||||||
|  | 						"author" => [ | ||||||
|  | 							"name" => $playlist["ownerAccount"]["displayName"] . " ({$playlist["ownerAccount"]["name"]})", | ||||||
|  | 							"url" => $playlist["ownerAccount"]["url"], | ||||||
|  | 							"avatar" => $avatar | ||||||
|  | 						], | ||||||
|  | 						"date" => strtotime($playlist["createdAt"]), | ||||||
|  | 						"duration" => $playlist["videosLength"], | ||||||
|  | 						"views" => null, | ||||||
|  | 						"thumb" => $thumb, | ||||||
|  | 						"url" => $playlist["url"] | ||||||
|  | 					]; | ||||||
|  | 				} | ||||||
|  | 				break; | ||||||
|  | 			 | ||||||
|  | 			case "channels": | ||||||
|  | 				foreach($json["data"] as $channel){ | ||||||
|  | 					 | ||||||
|  | 					if(count($channel["avatars"]) !== 0){ | ||||||
|  | 						 | ||||||
|  | 						$thumb = [ | ||||||
|  | 							"ratio" => "1:1", | ||||||
|  | 							"url" => $channel["avatars"][count($channel["avatars"]) - 1]["url"] | ||||||
|  | 						]; | ||||||
|  | 					}else{ | ||||||
|  | 						 | ||||||
|  | 						$thumb = [ | ||||||
|  | 							"ratio" => null, | ||||||
|  | 							"url" => null | ||||||
|  | 						]; | ||||||
|  | 					} | ||||||
|  | 					 | ||||||
|  | 					$out["author"][] = [ | ||||||
|  | 						"title" => $channel["displayName"] . " ({$channel["name"]})", | ||||||
|  | 						"followers" => $channel["followersCount"], | ||||||
|  | 						"description" => | ||||||
|  | 							$channel["videosCount"] . " videos. " . | ||||||
|  | 							$this->limitstrlen( | ||||||
|  | 								$this->titledots( | ||||||
|  | 									$channel["description"] | ||||||
|  | 								) | ||||||
|  | 							), | ||||||
|  | 						"thumb" => $thumb, | ||||||
|  | 						"url" => $channel["url"] | ||||||
|  | 					]; | ||||||
|  | 				} | ||||||
|  | 				break; | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		// get next page | ||||||
|  | 		if($json["total"] - 20 > $npt["start"]){ | ||||||
|  | 			 | ||||||
|  | 			$npt["start"] += 20; | ||||||
|  | 			 | ||||||
|  | 			$npt = [ | ||||||
|  | 				"type" => $get["type"], | ||||||
|  | 				"npt" => $npt | ||||||
|  | 			]; | ||||||
|  | 			 | ||||||
|  | 			$out["npt"] = | ||||||
|  | 				$this->backend | ||||||
|  | 				->store( | ||||||
|  | 					json_encode($npt), | ||||||
|  | 					"videos", | ||||||
|  | 					$proxy | ||||||
|  | 				); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		return $out; | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	private function titledots($title){ | ||||||
|  | 		 | ||||||
|  | 		$substr = substr($title, -3); | ||||||
|  | 		 | ||||||
|  | 		if( | ||||||
|  | 			$substr == "..." || | ||||||
|  | 			$substr == "…" | ||||||
|  | 		){ | ||||||
|  | 			 | ||||||
|  | 			return trim(substr($title, 0, -3), " \n\r\t\v\x00\0\x0B\xc2\xa0"); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		return trim($title, " \n\r\t\v\x00\0\x0B\xc2\xa0"); | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	private function limitstrlen($text){ | ||||||
|  | 		 | ||||||
|  | 		return | ||||||
|  | 			explode( | ||||||
|  | 				"\n", | ||||||
|  | 				wordwrap( | ||||||
|  | 					str_replace( | ||||||
|  | 						["\n\r", "\r\n", "\n", "\r"], | ||||||
|  | 						" ", | ||||||
|  | 						$text | ||||||
|  | 					), | ||||||
|  | 					300, | ||||||
|  | 					"\n" | ||||||
|  | 				), | ||||||
|  | 				2 | ||||||
|  | 			)[0]; | ||||||
|  | 	} | ||||||
|  | } | ||||||
| @@ -1226,7 +1226,12 @@ class startpage{ | |||||||
| 		// get results | 		// get results | ||||||
| 		foreach($json["render"]["presenter"]["regions"]["mainline"] as $category){ | 		foreach($json["render"]["presenter"]["regions"]["mainline"] as $category){ | ||||||
| 			 | 			 | ||||||
| 			if($category["display_type"] == "video-youtube"){ | 			if( | ||||||
|  | 				preg_match( | ||||||
|  | 					'/^video-/i', | ||||||
|  | 					$category["display_type"] | ||||||
|  | 				) | ||||||
|  | 			){ | ||||||
| 				 | 				 | ||||||
| 				foreach($category["results"] as $video){ | 				foreach($category["results"] as $video){ | ||||||
| 					 | 					 | ||||||
| @@ -1248,7 +1253,7 @@ class startpage{ | |||||||
| 					} | 					} | ||||||
| 					 | 					 | ||||||
| 					$out["video"][] = [ | 					$out["video"][] = [ | ||||||
| 						"title" => $video["title"], | 						"title" => str_replace(["", ""], "", $video["title"]), | ||||||
| 						"description" => $this->limitstrlen($video["description"]), | 						"description" => $this->limitstrlen($video["description"]), | ||||||
| 						"author" => [ | 						"author" => [ | ||||||
| 							"name" => $video["channelTitle"], | 							"name" => $video["channelTitle"], | ||||||
| @@ -1256,7 +1261,7 @@ class startpage{ | |||||||
| 							"avatar" => null | 							"avatar" => null | ||||||
| 						], | 						], | ||||||
| 						"date" => strtotime($video["publishDate"]), | 						"date" => strtotime($video["publishDate"]), | ||||||
| 						"duration" => $this->hms2int($video["duration"]), | 						"duration" => $this->hms2int($category["display_type"] == "video-youtube" ? $video["duration"] : $video["duration"] / 1000), | ||||||
| 						"views" => (int)$video["viewCount"], | 						"views" => (int)$video["viewCount"], | ||||||
| 						"thumb" => $thumb, | 						"thumb" => $thumb, | ||||||
| 						"url" => $video["clickUrl"] | 						"url" => $video["clickUrl"] | ||||||
|   | |||||||
							
								
								
									
										754
									
								
								scraper/vimeo.php
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										754
									
								
								scraper/vimeo.php
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,754 @@ | |||||||
|  | <?php | ||||||
|  |  | ||||||
|  | class vimeo{ | ||||||
|  | 	 | ||||||
|  | 	public function __construct(){ | ||||||
|  | 		 | ||||||
|  | 		include "lib/backend.php"; | ||||||
|  | 		$this->backend = new backend("vimeo"); | ||||||
|  | 		 | ||||||
|  | 		include "lib/fuckhtml.php"; | ||||||
|  | 		$this->fuckhtml = new fuckhtml(); | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	public function getfilters($page){ | ||||||
|  | 		 | ||||||
|  | 		return [ | ||||||
|  | 			"time" => [ | ||||||
|  | 				"display" => "Date uploaded", // &filter_uploaded= | ||||||
|  | 				"option" => [ | ||||||
|  | 					"any" => "Any time", | ||||||
|  | 					"today" => "Last 24 hours", | ||||||
|  | 					"this-week" => "Last 7 days", | ||||||
|  | 					"this-month" => "Last 30 days", | ||||||
|  | 					"this-year" => "Last 365 days", | ||||||
|  | 				] | ||||||
|  | 			],  | ||||||
|  | 			"display" => [ | ||||||
|  | 				"display" => "Display", | ||||||
|  | 				"option" => [ | ||||||
|  | 					"video" => "Videos", | ||||||
|  | 					"ondemand" => "On-Demand ($$)", | ||||||
|  | 					"people" => "People", | ||||||
|  | 					"channel" => "Channels", | ||||||
|  | 					"group" => "Groups" | ||||||
|  | 				] | ||||||
|  | 			], | ||||||
|  | 			"sort" => [ | ||||||
|  | 				"display" => "Sort by", | ||||||
|  | 				"option" => [ | ||||||
|  | 					"relevance" => "Relevance", // no param | ||||||
|  | 					"recent" => "Newest", // &sort=latest&direction=desc | ||||||
|  | 					"popular" => "Most popular", // &sort=popularity&direction=desc | ||||||
|  | 					"a_z" => "Title, A to Z", // &sort=alphabetical&direction=asc | ||||||
|  | 					"z_a" => "Title, Z to A", // &sort=alphabetical&direction=desc | ||||||
|  | 					"longest" => "Longest", // &sort=duration&direction=desc | ||||||
|  | 					"shortest" => "Shortest", // &sort=duration&direction=asc | ||||||
|  | 				] | ||||||
|  | 			], | ||||||
|  | 			"duration" => [ | ||||||
|  | 				"display" => "Duration", // &filter_duration= | ||||||
|  | 				"option" => [ | ||||||
|  | 					"any" => "Any duration", | ||||||
|  | 					"short" => "Short (less than 4 minutes)", | ||||||
|  | 					"medium" => "Medium (4-10 minutes)", | ||||||
|  | 					"long" => "Long (over 10 minutes)" | ||||||
|  | 				] | ||||||
|  | 			], | ||||||
|  | 			"resolution" => [ | ||||||
|  | 				"display" => "Resolution", | ||||||
|  | 				"option" => [ | ||||||
|  | 					"any" => "Any resolution", | ||||||
|  | 					"4k" => "4K" // &filter_resolution=4k | ||||||
|  | 				] | ||||||
|  | 			], | ||||||
|  | 			"category" => [ | ||||||
|  | 				"display" => "Category", // &filter_category= | ||||||
|  | 				"option" => [ | ||||||
|  | 					"any" => "Any category", | ||||||
|  | 					"animation" => "Animation", | ||||||
|  | 					"comedy" => "Comedy", | ||||||
|  | 					"music" => "Music", | ||||||
|  | 					"experimental" => "Experimental", | ||||||
|  | 					"documentary" => "Documentary", | ||||||
|  | 					"identsandanimatedlogos" => "Idents and Animated Logos", | ||||||
|  | 					"industry" => "Industry", | ||||||
|  | 					"instructionals" => "Instructionals", | ||||||
|  | 					"narrative" => "Narrative", | ||||||
|  | 					"personal" => "Personal" | ||||||
|  | 				] | ||||||
|  | 			], | ||||||
|  | 			"live" => [ | ||||||
|  | 				"display" => "Live events", | ||||||
|  | 				"option" => [ | ||||||
|  | 					"any" => "Any", | ||||||
|  | 					"yes" => "Live now" // &filter_live=now | ||||||
|  | 				] | ||||||
|  | 			], | ||||||
|  | 			"hdr" => [ | ||||||
|  | 				"display" => "HDR", // &filter_hdr= | ||||||
|  | 				"option" => [ | ||||||
|  | 					"any" => "Any", | ||||||
|  | 					"hdr" => "Any HDR", | ||||||
|  | 					"dolby_vision" => "Dolby Vision", | ||||||
|  | 					"hdr10" => "HDR10", | ||||||
|  | 					"hdr10+" => "HDR10+" | ||||||
|  | 				] | ||||||
|  | 			], | ||||||
|  | 			"vimeo_360" => [ | ||||||
|  | 				"display" => "Vimeo 360°", // &filter_vimeo_360 | ||||||
|  | 				"option" => [ | ||||||
|  | 					"any" => "Any", | ||||||
|  | 					"spatial" => "Spatial", | ||||||
|  | 					"360" => "360°" | ||||||
|  | 				] | ||||||
|  | 			], | ||||||
|  | 			"price" => [ // &filter_price= | ||||||
|  | 				"display" => "Price", | ||||||
|  | 				"option" => [ | ||||||
|  | 					"any" => "Any price", | ||||||
|  | 					"free" => "Free", | ||||||
|  | 					"paid" => "Paid" | ||||||
|  | 				] | ||||||
|  | 			], | ||||||
|  | 			"collection" => [ | ||||||
|  | 				"display" => "Vimeo collections", | ||||||
|  | 				"option" => [ | ||||||
|  | 					"any" => "Any collection", | ||||||
|  | 					"staff_pick" => "Staff picks" // &filter_staffpicked=true | ||||||
|  | 				] | ||||||
|  | 			], | ||||||
|  | 			"license" => [ // &filter_license= | ||||||
|  | 				"display" => "License", | ||||||
|  | 				"option" => [ | ||||||
|  | 					"any" => "Any license", | ||||||
|  | 					"by-nc-nd" => "CC BY-NC-ND", | ||||||
|  | 					"by" => "CC BY", | ||||||
|  | 					"by-nc" => "CC BY-NC", | ||||||
|  | 					"by-nc-sa" => "CC BY-NC-SA", | ||||||
|  | 					"by-nd" => "CC BY-ND", | ||||||
|  | 					"by-sa" => "CC BY-SA", | ||||||
|  | 					"cc0" => "CC0" | ||||||
|  | 				] | ||||||
|  | 			] | ||||||
|  | 		]; | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	private function get($proxy, $url, $get = [], $jwt = false){ | ||||||
|  | 		 | ||||||
|  | 		$curlproc = curl_init(); | ||||||
|  | 		 | ||||||
|  | 		if($get !== []){ | ||||||
|  | 			$get = http_build_query($get); | ||||||
|  | 			$url .= "?" . $get; | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_URL, $url); | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_ENCODING, ""); // default encoding | ||||||
|  | 		 | ||||||
|  | 		if($jwt === false){ | ||||||
|  | 			 | ||||||
|  | 			curl_setopt( | ||||||
|  | 				$curlproc, | ||||||
|  | 				CURLOPT_HTTPHEADER, | ||||||
|  | 				["User-Agent: " . config::USER_AGENT, | ||||||
|  | 				"Accept: */*", | ||||||
|  | 				"Accept-Language: en-US,en;q=0.5", | ||||||
|  | 				"Accept-Encoding: gzip, deflate, br, zstd", | ||||||
|  | 				"Referer: https://vimeo.com/search", | ||||||
|  | 				"X-Requested-With: XMLHttpRequest", | ||||||
|  | 				"DNT: 1", | ||||||
|  | 				"Sec-GPC: 1", | ||||||
|  | 				"Connection: keep-alive", | ||||||
|  | 				"Sec-Fetch-Dest: empty", | ||||||
|  | 				"Sec-Fetch-Mode: cors", | ||||||
|  | 				"Sec-Fetch-Site: same-origin", | ||||||
|  | 				"Priority: u=4"] | ||||||
|  | 			); | ||||||
|  | 			 | ||||||
|  | 		}else{ | ||||||
|  | 			 | ||||||
|  | 			curl_setopt( | ||||||
|  | 				$curlproc, | ||||||
|  | 				CURLOPT_HTTPHEADER, | ||||||
|  | 				["User-Agent: " . config::USER_AGENT, | ||||||
|  | 				"Accept: application/vnd.vimeo.*+json;version=3.3", | ||||||
|  | 				"Accept-Language: en", | ||||||
|  | 				"Accept-Encoding: gzip, deflate, br, zstd", | ||||||
|  | 				"Referer: https://vimeo.com/", | ||||||
|  | 				"Content-Type: application/json", | ||||||
|  | 				"Authorization: jwt $jwt", | ||||||
|  | 				"Vimeo-Page: /search/[[...slug]]", | ||||||
|  | 				"Origin: https://vimeo.com", | ||||||
|  | 				"DNT: 1", | ||||||
|  | 				"Sec-GPC: 1", | ||||||
|  | 				"Connection: keep-alive", | ||||||
|  | 				"Sec-Fetch-Dest: empty", | ||||||
|  | 				"Sec-Fetch-Mode: cors", | ||||||
|  | 				"Sec-Fetch-Site: same-site", | ||||||
|  | 				"Priority: u=4"] | ||||||
|  | 			); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		 | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_RETURNTRANSFER, true); | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_SSL_VERIFYHOST, 2); | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_SSL_VERIFYPEER, true); | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_CONNECTTIMEOUT, 30); | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_TIMEOUT, 30); | ||||||
|  |  | ||||||
|  | 		$this->backend->assign_proxy($curlproc, $proxy); | ||||||
|  | 		 | ||||||
|  | 		$data = curl_exec($curlproc); | ||||||
|  | 		 | ||||||
|  | 		if(curl_errno($curlproc)){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception(curl_error($curlproc)); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		curl_close($curlproc); | ||||||
|  | 		return $data; | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	public function video($get){ | ||||||
|  | 		 | ||||||
|  | 		// parse shit | ||||||
|  | 		if($get["npt"]){ | ||||||
|  | 			 | ||||||
|  | 			[$npt, $proxy] = | ||||||
|  | 				$this->backend | ||||||
|  | 				->get( | ||||||
|  | 					$get["npt"], | ||||||
|  | 					"videos" | ||||||
|  | 				); | ||||||
|  | 			 | ||||||
|  | 			$npt = json_decode($npt, true); | ||||||
|  | 			$pagetype = $npt["pagetype"]; | ||||||
|  | 			$npt = $npt["npt"]; | ||||||
|  | 			 | ||||||
|  | 			$jwt = $this->get_jwt($proxy); | ||||||
|  | 			 | ||||||
|  | 			try{ | ||||||
|  | 				 | ||||||
|  | 				$json = | ||||||
|  | 					$this->get( | ||||||
|  | 						$proxy, | ||||||
|  | 						"https://api.vimeo.com" . $npt, | ||||||
|  | 						[], | ||||||
|  | 						$jwt | ||||||
|  | 					); | ||||||
|  | 			}catch(Exception $error){ | ||||||
|  | 				 | ||||||
|  | 				throw new Exception("Failed to fetch JSON"); | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 		}else{ | ||||||
|  | 			 | ||||||
|  | 			$proxy = null; | ||||||
|  | 			$jwt = $this->get_jwt($proxy); // this gives us a proxy by reference | ||||||
|  | 			 | ||||||
|  | 			// parse filters | ||||||
|  | 			$npt = [ | ||||||
|  | 				"query" => $get["s"], | ||||||
|  | 				"page" => 1, | ||||||
|  | 				"per_page" => 24, | ||||||
|  | 				"facets" => "type" | ||||||
|  | 			]; | ||||||
|  | 			 | ||||||
|  | 			switch($get["display"]){ | ||||||
|  | 				 | ||||||
|  | 				case "video": | ||||||
|  | 					$npt["filter_type"] = "clip"; | ||||||
|  | 					$npt["fields"] = "clip.name,stats.plays,clip.pictures,clip.user.name,clip.user.link,clip.user.pictures.sizes,clip.uri,clip.stats.plays,clip.duration,clip.created_time,clip.link,clip.description"; | ||||||
|  | 					break; | ||||||
|  | 				 | ||||||
|  | 				case "ondemand": | ||||||
|  | 					$npt["filter_type"] = "ondemand"; | ||||||
|  | 					$npt["sizes"] = "296x744"; | ||||||
|  | 					$npt["fields"] = "ondemand.link,ondemand.name,ondemand.pictures.sizes,ondemand.metadata.interactions.buy,ondemand.metadata.interactions.rent,ondemand.uri"; | ||||||
|  | 					break; | ||||||
|  | 				 | ||||||
|  | 				case "people": | ||||||
|  | 					$npt["filter_type"] = "people"; | ||||||
|  | 					$npt["fetch_user_profile"] = "1"; | ||||||
|  | 					$npt["fields"] = "people.name,people.location_details.formatted_address,people.metadata.public_videos.total,people.pictures.sizes,people.link,people.metadata.connections.followers.total,people.skills.name,people.skills.uri,people.background_video,people.uri"; | ||||||
|  | 					break; | ||||||
|  | 				 | ||||||
|  | 				case "channel": | ||||||
|  | 					$npt["filter_type"] = "channel"; | ||||||
|  | 					$npt["fields"] = "channel.name,channel.metadata.connections.users.total,channel.metadata.connections.videos.total,channel.pictures.sizes,channel.link,channel.uri"; | ||||||
|  | 					break; | ||||||
|  | 				 | ||||||
|  | 				case "group": | ||||||
|  | 					$npt["filter_type"] = "group"; | ||||||
|  | 					$npt["fields"] = "group.name,group.metadata.connections.users.total,group.metadata.connections.videos.total,group.pictures.sizes,group.link,group.uri"; | ||||||
|  | 					break; | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			// only apply filters if we're searching for videos | ||||||
|  | 			if($get["display"] == "video"){ | ||||||
|  | 				 | ||||||
|  | 				switch($get["sort"]){ | ||||||
|  | 					 | ||||||
|  | 					case "relevance": break; // do nothing | ||||||
|  | 					 | ||||||
|  | 					case "recent": | ||||||
|  | 						$npt["sort"] = "latest"; | ||||||
|  | 						$npt["direction"] = "desc"; | ||||||
|  | 						break; | ||||||
|  | 					 | ||||||
|  | 					case "popular": | ||||||
|  | 						$npt["sort"] = "popularity"; | ||||||
|  | 						$npt["direction"] = "desc"; | ||||||
|  | 						break; | ||||||
|  | 					 | ||||||
|  | 					case "a_z": | ||||||
|  | 						$npt["sort"] = "alphabetical"; | ||||||
|  | 						$npt["direction"] = "asc"; | ||||||
|  | 						break; | ||||||
|  | 					 | ||||||
|  | 					case "z_a": | ||||||
|  | 						$npt["sort"] = "alphabetical"; | ||||||
|  | 						$npt["direction"] = "desc"; | ||||||
|  | 						break; | ||||||
|  | 					 | ||||||
|  | 					case "longest": | ||||||
|  | 						$npt["sort"] = "duration"; | ||||||
|  | 						$npt["direction"] = "desc"; | ||||||
|  | 						break; | ||||||
|  | 					 | ||||||
|  | 					case "shortest": | ||||||
|  | 						$npt["sort"] = "duration"; | ||||||
|  | 						$npt["direction"] = "asc"; | ||||||
|  | 						break; | ||||||
|  | 				} | ||||||
|  | 				 | ||||||
|  | 				if($get["time"] != "any"){ | ||||||
|  | 					 | ||||||
|  | 					$npt["filter_uploaded"] = $get["time"]; | ||||||
|  | 				} | ||||||
|  | 				 | ||||||
|  | 				if($get["duration"] != "any"){ | ||||||
|  | 					 | ||||||
|  | 					$npt["filter_duration"] = $get["duration"]; | ||||||
|  | 				} | ||||||
|  | 				 | ||||||
|  | 				if($get["resolution"] != "any"){ | ||||||
|  | 					 | ||||||
|  | 					$npt["filter_resolution"] = $get["resolution"]; | ||||||
|  | 				} | ||||||
|  | 				 | ||||||
|  | 				if($get["category"] != "any"){ | ||||||
|  | 					 | ||||||
|  | 					$npt["filter_category"] = $get["category"]; | ||||||
|  | 				} | ||||||
|  | 				 | ||||||
|  | 				if($get["live"] != "any"){ | ||||||
|  | 					 | ||||||
|  | 					$npt["filter_live"] = "now"; | ||||||
|  | 				} | ||||||
|  | 				 | ||||||
|  | 				if($get["hdr"] != "any"){ | ||||||
|  | 					 | ||||||
|  | 					$npt["filter_hdr"] = $get["hdr"]; | ||||||
|  | 				} | ||||||
|  | 				 | ||||||
|  | 				if($get["vimeo_360"] != "any"){ | ||||||
|  | 					 | ||||||
|  | 					$npt["filter_vimeo_360"] = $get["vimeo_360"]; | ||||||
|  | 				} | ||||||
|  | 				 | ||||||
|  | 				if($get["price"] != "any"){ | ||||||
|  | 					 | ||||||
|  | 					$npt["filter_price"] = $get["price"]; | ||||||
|  | 				} | ||||||
|  | 				 | ||||||
|  | 				if($get["collection"] == "staff_pick"){ | ||||||
|  | 					 | ||||||
|  | 					$npt["filter_staffpicked"] = "true"; | ||||||
|  | 				} | ||||||
|  | 				 | ||||||
|  | 				if($get["license"] != "any"){ | ||||||
|  | 					 | ||||||
|  | 					$npt["filter_license"] = $get["license"]; | ||||||
|  | 				} | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			$pagetype = $npt["filter_type"]; | ||||||
|  | 			 | ||||||
|  | 			try{ | ||||||
|  | 				 | ||||||
|  | 				$json = | ||||||
|  | 					$this->get( | ||||||
|  | 						$proxy, | ||||||
|  | 						"https://api.vimeo.com/search", | ||||||
|  | 						$npt, | ||||||
|  | 						$jwt | ||||||
|  | 					); | ||||||
|  | 			}catch(Exception $error){ | ||||||
|  | 				 | ||||||
|  | 				throw new Exception("Failed to fetch JSON"); | ||||||
|  | 			} | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		$json = json_decode($json, true); | ||||||
|  | 		 | ||||||
|  | 		if($json === null){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("Failed to parse JSON"); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		$out = [ | ||||||
|  | 			"status" => "ok", | ||||||
|  | 			"npt" => null, | ||||||
|  | 			"video" => [], | ||||||
|  | 			"author" => [], | ||||||
|  | 			"livestream" => [], | ||||||
|  | 			"playlist" => [], | ||||||
|  | 			"reel" => [] | ||||||
|  | 		]; | ||||||
|  | 		 | ||||||
|  | 		if(isset($json["error"])){ | ||||||
|  | 			 | ||||||
|  | 			$error = $json["error"]; | ||||||
|  | 			if(isset($json["developer_message"])){ | ||||||
|  | 				 | ||||||
|  | 				$error .= " ({$json["developer_message"]})"; | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("Vimeo returned an error: " . $error); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		if(!isset($json["data"])){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("Vimeo did not return a data object"); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		switch($pagetype){ | ||||||
|  | 			 | ||||||
|  | 			case "clip": | ||||||
|  | 				foreach($json["data"] as $video){ | ||||||
|  | 					 | ||||||
|  | 					$video = $video["clip"]; | ||||||
|  | 					 | ||||||
|  | 					if(isset($video["user"]["pictures"]["sizes"])){ | ||||||
|  | 						 | ||||||
|  | 						$avatar = $video["user"]["pictures"]["sizes"][count($video["user"]["pictures"]["sizes"]) - 1]["link"]; | ||||||
|  | 					}else{ | ||||||
|  | 						 | ||||||
|  | 						$avatar = null; | ||||||
|  | 					} | ||||||
|  | 					 | ||||||
|  | 					$out["video"][] = [ | ||||||
|  | 						"title" => $video["name"], | ||||||
|  | 						"description" => | ||||||
|  | 							$this->limitstrlen( | ||||||
|  | 								$video["description"] | ||||||
|  | 							), | ||||||
|  | 						"author" => [ | ||||||
|  | 							"name" => $video["user"]["name"], | ||||||
|  | 							"url" => $video["user"]["link"], | ||||||
|  | 							"avatar" => $avatar | ||||||
|  | 						], | ||||||
|  | 						"date" => strtotime($video["created_time"]), | ||||||
|  | 						"duration" => (int)$video["duration"], | ||||||
|  | 						"views" => (int)$video["stats"]["plays"], | ||||||
|  | 						"thumb" => [ | ||||||
|  | 							"ratio" => "16:9", | ||||||
|  | 							"url" => $video["pictures"]["base_link"] | ||||||
|  | 						], | ||||||
|  | 						"url" => $video["link"] | ||||||
|  | 					]; | ||||||
|  | 				} | ||||||
|  | 				break; | ||||||
|  | 			 | ||||||
|  | 			case "ondemand": | ||||||
|  | 				foreach($json["data"] as $video){ | ||||||
|  | 					 | ||||||
|  | 					$video = $video["ondemand"]; | ||||||
|  | 					 | ||||||
|  | 					$description = []; | ||||||
|  | 					if(isset($video["metadata"]["interactions"]["rent"]["display_price"])){ | ||||||
|  | 						 | ||||||
|  | 						$description[] = "Rent for " . $video["metadata"]["interactions"]["rent"]["display_price"]; | ||||||
|  | 					} | ||||||
|  | 					 | ||||||
|  | 					if(isset($video["metadata"]["interactions"]["buy"]["display_price"])){ | ||||||
|  | 						 | ||||||
|  | 						$description[] = "Buy for " . $video["metadata"]["interactions"]["buy"]["display_price"]; | ||||||
|  | 					} | ||||||
|  | 					 | ||||||
|  | 					$description = implode(", ", $description); | ||||||
|  | 					 | ||||||
|  | 					$out["video"][] = [ | ||||||
|  | 						"title" => $video["name"], | ||||||
|  | 						"description" => $description, | ||||||
|  | 						"author" => [ | ||||||
|  | 							"name" => null, | ||||||
|  | 							"url" => null, | ||||||
|  | 							"avatar" => null | ||||||
|  | 						], | ||||||
|  | 						"date" => null, | ||||||
|  | 						"duration" => null, | ||||||
|  | 						"views" => null, | ||||||
|  | 						"thumb" => [ | ||||||
|  | 							"ratio" => "9:16", | ||||||
|  | 							"url" => $video["pictures"]["sizes"][0]["link"] | ||||||
|  | 						], | ||||||
|  | 						"url" => $video["link"] | ||||||
|  | 					]; | ||||||
|  | 				} | ||||||
|  | 				break; | ||||||
|  | 			 | ||||||
|  | 			case "people": | ||||||
|  | 				foreach($json["data"] as $user){ | ||||||
|  | 					 | ||||||
|  | 					$user = $user["people"]; | ||||||
|  | 					 | ||||||
|  | 					if( | ||||||
|  | 						isset($user["pictures"]["sizes"]) && | ||||||
|  | 						count($user["pictures"]["sizes"]) !== 0 | ||||||
|  | 					){ | ||||||
|  | 						 | ||||||
|  | 						$thumb = [ | ||||||
|  | 							"ratio" => "1:1", | ||||||
|  | 							"url" => $user["pictures"]["sizes"][count($user["pictures"]["sizes"]) - 1]["link"] | ||||||
|  | 						]; | ||||||
|  | 					}else{ | ||||||
|  | 						 | ||||||
|  | 						$thumb = [ | ||||||
|  | 							"ratio" => null, | ||||||
|  | 							"url" => null | ||||||
|  | 						]; | ||||||
|  | 					} | ||||||
|  | 					 | ||||||
|  | 					$out["author"][] = [ | ||||||
|  | 						"title" => $user["name"], | ||||||
|  | 						"followers" => (int)$user["metadata"]["connections"]["followers"]["total"], | ||||||
|  | 						"description" => $user["metadata"]["public_videos"]["total"] . " videos.", | ||||||
|  | 						"thumb" => $thumb, | ||||||
|  | 						"url" => $user["link"] | ||||||
|  | 					]; | ||||||
|  | 				} | ||||||
|  | 				break; | ||||||
|  | 			 | ||||||
|  | 			case "channel": | ||||||
|  | 			case "group": | ||||||
|  | 				foreach($json["data"] as $channel){ | ||||||
|  | 					 | ||||||
|  | 					$channel = $channel[$npt["filter_type"]]; | ||||||
|  | 					 | ||||||
|  | 					if( | ||||||
|  | 						isset($channel["pictures"]["sizes"]) && | ||||||
|  | 						count($channel["pictures"]["sizes"]) !== 0 | ||||||
|  | 					){ | ||||||
|  | 						 | ||||||
|  | 						$thumb = [ | ||||||
|  | 							"ratio" => "16:9", | ||||||
|  | 							"url" => $channel["pictures"]["sizes"][count($channel["pictures"]["sizes"]) - 1]["link"] | ||||||
|  | 						]; | ||||||
|  | 					}else{ | ||||||
|  | 						 | ||||||
|  | 						$thumb = [ | ||||||
|  | 							"ratio" => null, | ||||||
|  | 							"url" => null | ||||||
|  | 						]; | ||||||
|  | 					} | ||||||
|  | 					 | ||||||
|  | 					$out["author"][] = [ | ||||||
|  | 						"title" => $channel["name"], | ||||||
|  | 						"followers" => (int)$channel["metadata"]["connections"]["users"]["total"], | ||||||
|  | 						"description" => $channel["metadata"]["connections"]["videos"]["total"] . " videos.", | ||||||
|  | 						"thumb" => $thumb, | ||||||
|  | 						"url" => $channel["link"] | ||||||
|  | 					]; | ||||||
|  | 				} | ||||||
|  | 				break; | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		// | ||||||
|  | 		// get next page | ||||||
|  | 		// | ||||||
|  | 		if( | ||||||
|  | 			isset($json["paging"]["next"]) && | ||||||
|  | 			is_string($json["paging"]["next"]) | ||||||
|  | 		){ | ||||||
|  | 			 | ||||||
|  | 			$out["npt"] = | ||||||
|  | 				$this->backend | ||||||
|  | 				->store( | ||||||
|  | 					json_encode([ | ||||||
|  | 						"npt" => $json["paging"]["next"], | ||||||
|  | 						"pagetype" => $pagetype | ||||||
|  | 					]), | ||||||
|  | 					"videos", | ||||||
|  | 					$proxy | ||||||
|  | 				); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		return $out; | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	private function get_jwt(&$proxy){ | ||||||
|  | 		 | ||||||
|  | 		// | ||||||
|  | 		// get jwt token | ||||||
|  | 		// it's probably safe to cache this across proxies, cause the jwt doesnt contain an userID | ||||||
|  | 		// only an appID, whatever shit that is | ||||||
|  | 		// we can only cache it for 5 minutes though, otherwise vimeo cries about it | ||||||
|  | 		// | ||||||
|  | 		if($proxy === null){ | ||||||
|  | 			 | ||||||
|  | 			$proxy = $this->backend->get_ip(); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		$jwt = apcu_fetch("vimeo_jwt"); | ||||||
|  | 		 | ||||||
|  | 		if($jwt === false){ | ||||||
|  | 			/* | ||||||
|  | 			$html = | ||||||
|  | 				$this->get( | ||||||
|  | 					$proxy, | ||||||
|  | 					"https://vimeo.com/search", | ||||||
|  | 					[], | ||||||
|  | 					false | ||||||
|  | 				); | ||||||
|  | 			 | ||||||
|  | 			$this->fuckhtml->load($html); | ||||||
|  | 			 | ||||||
|  | 			$captcha = | ||||||
|  | 				$this->fuckhtml | ||||||
|  | 				->getElementsByTagName( | ||||||
|  | 					"title" | ||||||
|  | 				); | ||||||
|  | 			 | ||||||
|  | 			if( | ||||||
|  | 				count($captcha) !== 0 && | ||||||
|  | 				$this->fuckhtml | ||||||
|  | 				->getTextContent( | ||||||
|  | 					$captcha[0] | ||||||
|  | 				) == "Vimeo / CAPTCHA Challenge" | ||||||
|  | 			){ | ||||||
|  | 				 | ||||||
|  | 				throw new Exception("Vimeo returned a Captcha"); | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			$html = | ||||||
|  | 				explode( | ||||||
|  | 					'<script id="viewer-bootstrap" type="application/json">', | ||||||
|  | 					$html, | ||||||
|  | 					2 | ||||||
|  | 				); | ||||||
|  | 			 | ||||||
|  | 			if(count($html) !== 2){ | ||||||
|  | 				 | ||||||
|  | 				throw new Exception("Failed to find JWT json"); | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			$jwt = | ||||||
|  | 				json_decode( | ||||||
|  | 					$this->fuckhtml | ||||||
|  | 					->extract_json( | ||||||
|  | 						$html[1] | ||||||
|  | 					), | ||||||
|  | 					true | ||||||
|  | 				); | ||||||
|  | 			 | ||||||
|  | 			if($jwt === null){ | ||||||
|  | 				 | ||||||
|  | 				throw new Exception("Failed to decode JWT json"); | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			if(!isset($jwt["jwt"])){ | ||||||
|  | 				 | ||||||
|  | 				throw new Exception("Failed to grep JWT"); | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			$jwt = $jwt["jwt"]; | ||||||
|  | 			*/ | ||||||
|  | 			 | ||||||
|  | 			try{ | ||||||
|  | 				$json = | ||||||
|  | 					$this->get( | ||||||
|  | 						$proxy, | ||||||
|  | 						"https://vimeo.com/_next/jwt", | ||||||
|  | 						[], | ||||||
|  | 						false | ||||||
|  | 					); | ||||||
|  | 			}catch(Exception $error){ | ||||||
|  | 				 | ||||||
|  | 				throw new Exception("Failed to fetch JWT token"); | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			$this->fuckhtml->load($json); | ||||||
|  | 			 | ||||||
|  | 			$captcha = | ||||||
|  | 				$this->fuckhtml | ||||||
|  | 				->getElementsByTagName( | ||||||
|  | 					"title" | ||||||
|  | 				); | ||||||
|  | 			 | ||||||
|  | 			if( | ||||||
|  | 				count($captcha) !== 0 && | ||||||
|  | 				$this->fuckhtml | ||||||
|  | 				->getTextContent( | ||||||
|  | 					$captcha[0] | ||||||
|  | 				) == "Vimeo / CAPTCHA Challenge" | ||||||
|  | 			){ | ||||||
|  | 				 | ||||||
|  | 				throw new Exception("Vimeo returned a Captcha"); | ||||||
|  | 			} | ||||||
|  | 				 | ||||||
|  | 			$json = json_decode($json, true); | ||||||
|  | 			 | ||||||
|  | 			if($json === null){ | ||||||
|  | 				 | ||||||
|  | 				throw new Exception("The JWT object could not be decoded"); | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			if(!isset($json["token"])){ | ||||||
|  | 				 | ||||||
|  | 				throw new Exception("Vimeo did not return a JWT"); | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			$jwt = $json["token"]; | ||||||
|  | 			 | ||||||
|  | 			apcu_store("vimeo_jwt", $jwt, 300); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		return $jwt; | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	private function titledots($title){ | ||||||
|  | 		 | ||||||
|  | 		$substr = substr($title, -3); | ||||||
|  | 		 | ||||||
|  | 		if( | ||||||
|  | 			$substr == "..." || | ||||||
|  | 			$substr == "…" | ||||||
|  | 		){ | ||||||
|  | 			 | ||||||
|  | 			return trim(substr($title, 0, -3), " \n\r\t\v\x00\0\x0B\xc2\xa0"); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		return trim($title, " \n\r\t\v\x00\0\x0B\xc2\xa0"); | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	private function limitstrlen($text){ | ||||||
|  | 		 | ||||||
|  | 		return | ||||||
|  | 			explode( | ||||||
|  | 				"\n", | ||||||
|  | 				wordwrap( | ||||||
|  | 					str_replace( | ||||||
|  | 						["\n\r", "\r\n", "\n", "\r"], | ||||||
|  | 						" ", | ||||||
|  | 						$text | ||||||
|  | 					), | ||||||
|  | 					300, | ||||||
|  | 					"\n" | ||||||
|  | 				), | ||||||
|  | 				2 | ||||||
|  | 			)[0]; | ||||||
|  | 	} | ||||||
|  | } | ||||||
							
								
								
									
										257
									
								
								scraper/vsco.php
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										257
									
								
								scraper/vsco.php
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,257 @@ | |||||||
|  | <?php | ||||||
|  |  | ||||||
|  | class vsco{ | ||||||
|  | 	 | ||||||
|  | 	public function __construct(){ | ||||||
|  | 		 | ||||||
|  | 		include "lib/backend.php"; | ||||||
|  | 		$this->backend = new backend("vsco"); | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	public function getfilters($page){ | ||||||
|  | 		 | ||||||
|  | 		return []; | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	private function get($proxy, $url, $get = [], $bearer = null){ | ||||||
|  | 		 | ||||||
|  | 		$curlproc = curl_init(); | ||||||
|  | 		 | ||||||
|  | 		if($get !== []){ | ||||||
|  | 			$get_tmp = http_build_query($get); | ||||||
|  | 			$url .= "?" . $get_tmp; | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_URL, $url); | ||||||
|  | 		 | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_ENCODING, ""); // default encoding | ||||||
|  | 		 | ||||||
|  | 		if($bearer === null){ | ||||||
|  | 			 | ||||||
|  | 			curl_setopt($curlproc, CURLOPT_HTTPHEADER, | ||||||
|  | 				["User-Agent: " . config::USER_AGENT, | ||||||
|  | 				"Accept: text/html,application/xhtml+xml,application/xml;q=0.9,image/avif,image/webp,*/*;q=0.8", | ||||||
|  | 				"Accept-Language: en-US,en;q=0.5", | ||||||
|  | 				"Accept-Encoding: gzip", | ||||||
|  | 				"DNT: 1", | ||||||
|  | 				"Sec-GPC: 1", | ||||||
|  | 				"Connection: keep-alive", | ||||||
|  | 				"Upgrade-Insecure-Requests: 1", | ||||||
|  | 				"Sec-Fetch-Dest: document", | ||||||
|  | 				"Sec-Fetch-Mode: navigate", | ||||||
|  | 				"Sec-Fetch-Site: same-origin", | ||||||
|  | 				"Sec-Fetch-User: ?1", | ||||||
|  | 				"Priority: u=0, i", | ||||||
|  | 				"TE: trailers"] | ||||||
|  | 			); | ||||||
|  | 		}else{ | ||||||
|  | 			 | ||||||
|  | 			curl_setopt($curlproc, CURLOPT_HTTPHEADER, | ||||||
|  | 				["User-Agent: " . config::USER_AGENT, | ||||||
|  | 				"Accept: */*", | ||||||
|  | 				"Accept-Language: en-US", | ||||||
|  | 				"Accept-Encoding: gzip", | ||||||
|  | 				"Referer: https://vsco.co/search/images/" . urlencode($get["query"]), | ||||||
|  | 				"authorization: Bearer " . $bearer, | ||||||
|  | 				"content-type: application/json", | ||||||
|  | 				"x-client-build: 1", | ||||||
|  | 				"x-client-platform: web", | ||||||
|  | 				"DNT: 1", | ||||||
|  | 				"Sec-GPC: 1", | ||||||
|  | 				"Connection: keep-alive", | ||||||
|  | 				"Sec-Fetch-Dest: empty", | ||||||
|  | 				"Sec-Fetch-Mode: cors", | ||||||
|  | 				"Sec-Fetch-Site: same-origin", | ||||||
|  | 				"Priority: u=0", | ||||||
|  | 				"TE: trailers"] | ||||||
|  | 			); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_RETURNTRANSFER, true); | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_SSL_VERIFYHOST, 2); | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_SSL_VERIFYPEER, true); | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_CONNECTTIMEOUT, 30); | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_TIMEOUT, 30); | ||||||
|  | 		 | ||||||
|  | 		// http2 bypass | ||||||
|  | 		curl_setopt($curlproc, CURLOPT_HTTP_VERSION, CURL_HTTP_VERSION_2_0); | ||||||
|  | 		 | ||||||
|  | 		$this->backend->assign_proxy($curlproc, $proxy); | ||||||
|  | 		 | ||||||
|  | 		$data = curl_exec($curlproc); | ||||||
|  | 		 | ||||||
|  | 		if(curl_errno($curlproc)){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception(curl_error($curlproc)); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		curl_close($curlproc); | ||||||
|  | 		return $data; | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	public function image($get){ | ||||||
|  | 		 | ||||||
|  | 		if($get["npt"]){ | ||||||
|  | 			 | ||||||
|  | 			[$data, $proxy] = | ||||||
|  | 				$this->backend->get( | ||||||
|  | 					$get["npt"], "images" | ||||||
|  | 				); | ||||||
|  | 			 | ||||||
|  | 			$data = json_decode($data, true); | ||||||
|  | 			 | ||||||
|  | 		}else{ | ||||||
|  | 			 | ||||||
|  | 			$search = $get["s"]; | ||||||
|  | 			if(strlen($search) === 0){ | ||||||
|  | 				 | ||||||
|  | 				throw new Exception("Search term is empty!"); | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			$proxy = $this->backend->get_ip(); | ||||||
|  | 			 | ||||||
|  | 			// get bearer token | ||||||
|  | 			try{ | ||||||
|  | 				 | ||||||
|  | 				$html = | ||||||
|  | 					$this->get( | ||||||
|  | 						$proxy, | ||||||
|  | 						"https://vsco.co/feed" | ||||||
|  | 					); | ||||||
|  | 				 | ||||||
|  | 			}catch(Exception $error){ | ||||||
|  | 				 | ||||||
|  | 				throw new Exception("Failed to fetch feed page"); | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			preg_match( | ||||||
|  | 				'/"tkn":"([A-z0-9]+)"/', | ||||||
|  | 				$html, | ||||||
|  | 				$bearer | ||||||
|  | 			); | ||||||
|  | 			 | ||||||
|  | 			if(!isset($bearer[1])){ | ||||||
|  | 				 | ||||||
|  | 				throw new Exception("Failed to grep bearer token"); | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			$data = [ | ||||||
|  | 				"pagination" => [ | ||||||
|  | 					"query" => $search, | ||||||
|  | 					"page" => 0, | ||||||
|  | 					"size" => 100 | ||||||
|  | 				], | ||||||
|  | 				"bearer" => $bearer[1] | ||||||
|  | 			]; | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		try{ | ||||||
|  | 			 | ||||||
|  | 			$json = | ||||||
|  | 				$this->get( | ||||||
|  | 					$proxy, | ||||||
|  | 					"https://vsco.co/api/2.0/search/images", | ||||||
|  | 					$data["pagination"], | ||||||
|  | 					$data["bearer"] | ||||||
|  | 				); | ||||||
|  | 		}catch(Exception $error){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("Failed to fetch JSON"); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		$json = json_decode($json, true); | ||||||
|  | 		 | ||||||
|  | 		if($json === null){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("Failed to decode JSON"); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		$out = [ | ||||||
|  | 			"status" => "ok", | ||||||
|  | 			"npt" => null, | ||||||
|  | 			"image" => [] | ||||||
|  | 		]; | ||||||
|  | 		 | ||||||
|  | 		if(!isset($json["results"])){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("Failed to access results object"); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		foreach($json["results"] as $image){ | ||||||
|  | 			 | ||||||
|  | 			$image_domain = parse_url("https://" . $image["responsive_url"], PHP_URL_HOST); | ||||||
|  | 			$thumbnail = explode($image_domain, $image["responsive_url"], 2)[1]; | ||||||
|  | 			 | ||||||
|  | 			if(substr($thumbnail, 0, 3) != "/1/"){ | ||||||
|  | 				 | ||||||
|  | 				$thumbnail = | ||||||
|  | 					preg_replace( | ||||||
|  | 						'/^\/[^\/]+/', | ||||||
|  | 						"", | ||||||
|  | 						$thumbnail | ||||||
|  | 					); | ||||||
|  | 			} | ||||||
|  | 			 | ||||||
|  | 			$thumbnail = "https://img.vsco.co/cdn-cgi/image/width=480,height=360" . $thumbnail; | ||||||
|  | 			$size = | ||||||
|  | 				$this->image_ratio( | ||||||
|  | 					(int)$image["dimensions"]["width"], | ||||||
|  | 					(int)$image["dimensions"]["height"] | ||||||
|  | 				); | ||||||
|  | 			 | ||||||
|  | 			$out["image"][] = [ | ||||||
|  | 				"title" => $image["description"], | ||||||
|  | 				"source" => [ | ||||||
|  | 					[ | ||||||
|  | 						"url" => "https://" . $image["responsive_url"], | ||||||
|  | 						"width" => (int)$image["dimensions"]["width"], | ||||||
|  | 						"height" => (int)$image["dimensions"]["height"] | ||||||
|  | 					], | ||||||
|  | 					[ | ||||||
|  | 						"url" => $thumbnail, | ||||||
|  | 						"width" => $size[0], | ||||||
|  | 						"height" => $size[1] | ||||||
|  | 					] | ||||||
|  | 				], | ||||||
|  | 				"url" => "https://" . $image["grid"]["domain"] . "/media/" . $image["imageId"] | ||||||
|  | 			]; | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		// get NPT | ||||||
|  | 		$max_page = ceil($json["total"] / 100); | ||||||
|  | 		$data["pagination"]["page"]++; | ||||||
|  | 		 | ||||||
|  | 		if($max_page > $data["pagination"]["page"]){ | ||||||
|  | 			 | ||||||
|  | 			$out["npt"] = | ||||||
|  | 				$this->backend->store( | ||||||
|  | 					json_encode($data), | ||||||
|  | 					"images", | ||||||
|  | 					$proxy | ||||||
|  | 				); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		return $out; | ||||||
|  | 	} | ||||||
|  | 	 | ||||||
|  | 	private function image_ratio($width, $height){ | ||||||
|  | 		 | ||||||
|  | 		$ratio = [ | ||||||
|  | 			480 / $width, | ||||||
|  | 			360 / $height | ||||||
|  | 		]; | ||||||
|  | 		 | ||||||
|  | 		if($ratio[0] < $ratio[1]){ | ||||||
|  | 			 | ||||||
|  | 			$ratio = $ratio[0]; | ||||||
|  | 		}else{ | ||||||
|  | 			 | ||||||
|  | 			$ratio = $ratio[1]; | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
|  | 		return [ | ||||||
|  | 			floor($width * $ratio), | ||||||
|  | 			floor($height * $ratio) | ||||||
|  | 		]; | ||||||
|  | 	} | ||||||
|  | } | ||||||
| @@ -14,7 +14,7 @@ class yandex{ | |||||||
| 		// backend included in the scraper functions | 		// backend included in the scraper functions | ||||||
| 	} | 	} | ||||||
| 	 | 	 | ||||||
| 	private function get($proxy, $url, $get = [], $nsfw){ | 	private function get($proxy, $url, $get = [], $nsfw, $get_cookie = 1){ | ||||||
| 		 | 		 | ||||||
| 		$curlproc = curl_init(); | 		$curlproc = curl_init(); | ||||||
| 		 | 		 | ||||||
| @@ -25,19 +25,55 @@ class yandex{ | |||||||
| 		 | 		 | ||||||
| 		curl_setopt($curlproc, CURLOPT_URL, $url); | 		curl_setopt($curlproc, CURLOPT_URL, $url); | ||||||
| 		 | 		 | ||||||
|  | 		// extract "i" cookie | ||||||
|  | 		if($get_cookie === 0){ | ||||||
|  | 			 | ||||||
|  | 			$cookies_tmp = []; | ||||||
|  | 			curl_setopt($curlproc, CURLOPT_HEADERFUNCTION, function($curlproc, $header) use (&$cookies_tmp){ | ||||||
|  | 				 | ||||||
|  | 				$length = strlen($header); | ||||||
|  | 				 | ||||||
|  | 				$header = explode(":", $header, 2); | ||||||
|  | 				 | ||||||
|  | 				if(trim(strtolower($header[0])) == "set-cookie"){ | ||||||
|  | 					 | ||||||
|  | 					$cookie_tmp = explode("=", trim($header[1]), 2); | ||||||
|  | 					 | ||||||
|  | 					$cookies_tmp[trim($cookie_tmp[0])] = | ||||||
|  | 						explode(";", $cookie_tmp[1], 2)[0]; | ||||||
|  | 				} | ||||||
|  | 				 | ||||||
|  | 				return $length; | ||||||
|  | 			}); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
| 		switch($nsfw){ | 		switch($nsfw){ | ||||||
| 			case "yes": $nsfw = "0"; break; | 			case "yes": $nsfw = "0"; break; | ||||||
| 			case "maybe": $nsfw = "1"; break; | 			case "maybe": $nsfw = "1"; break; | ||||||
| 			case "no": $nsfw = "2"; break; | 			case "no": $nsfw = "2"; break; | ||||||
| 		} | 		} | ||||||
| 		 | 		 | ||||||
|  | 		switch($get_cookie){ | ||||||
|  | 			 | ||||||
|  | 			case 0: | ||||||
|  | 				$cookie = ""; | ||||||
|  | 				break; | ||||||
|  | 			 | ||||||
|  | 			case 1: | ||||||
|  | 				$cookie = "Cookie: yp=" . (time() - 4000033) . ".szm.1:1920x1080:876x1000#" . time() . ".sp.family:" . $nsfw; | ||||||
|  | 				break; | ||||||
|  | 			 | ||||||
|  | 			default: | ||||||
|  | 				$cookie = "Cookie: i=" . $get_cookie; | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
| 		$headers = | 		$headers = | ||||||
| 			["User-Agent: " . config::USER_AGENT, | 			["User-Agent: " . config::USER_AGENT, | ||||||
| 			"Accept: text/html,application/xhtml+xml,application/xml;q=0.9,image/avif,image/webp,*/*;q=0.8", | 			"Accept: text/html,application/xhtml+xml,application/xml;q=0.9,image/avif,image/webp,*/*;q=0.8", | ||||||
| 			"Accept-Encoding: gzip", | 			"Accept-Encoding: gzip", | ||||||
| 			"Accept-Language: en-US,en;q=0.5", | 			"Accept-Language: en-US,en;q=0.5", | ||||||
| 			"DNT: 1", | 			"DNT: 1", | ||||||
| 			"Cookie: yp=1716337604.sp.family%3A{$nsfw}#1685406411.szm.1:1920x1080:1920x999", | 			$cookie, | ||||||
| 			"Referer: https://yandex.com/images/search", | 			"Referer: https://yandex.com/images/search", | ||||||
| 			"Connection: keep-alive", | 			"Connection: keep-alive", | ||||||
| 			"Upgrade-Insecure-Requests: 1", | 			"Upgrade-Insecure-Requests: 1", | ||||||
| @@ -59,6 +95,17 @@ class yandex{ | |||||||
| 		 | 		 | ||||||
| 		$data = curl_exec($curlproc); | 		$data = curl_exec($curlproc); | ||||||
| 		 | 		 | ||||||
|  | 		if($get_cookie === 0){ | ||||||
|  | 			 | ||||||
|  | 			if(isset($cookies_tmp["i"])){ | ||||||
|  | 				 | ||||||
|  | 				return $cookies_tmp["i"]; | ||||||
|  | 			}else{ | ||||||
|  | 				 | ||||||
|  | 				throw new Exception("Failed to get Yandex clearance cookie"); | ||||||
|  | 			} | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
| 		if(curl_errno($curlproc)){ | 		if(curl_errno($curlproc)){ | ||||||
| 			 | 			 | ||||||
| 			throw new Exception(curl_error($curlproc)); | 			throw new Exception(curl_error($curlproc)); | ||||||
| @@ -217,6 +264,23 @@ class yandex{ | |||||||
| 		// https://yandex.com/search/site/?text=minecraft&web=1&frame=1&v=2.0&searchid=3131712 | 		// https://yandex.com/search/site/?text=minecraft&web=1&frame=1&v=2.0&searchid=3131712 | ||||||
| 		// &within=777&from_day=26&from_month=8&from_year=2023&to_day=26&to_month=8&to_year=2023 | 		// &within=777&from_day=26&from_month=8&from_year=2023&to_day=26&to_month=8&to_year=2023 | ||||||
| 		 | 		 | ||||||
|  | 		// get clearance cookie | ||||||
|  | 		if(($cookie = apcu_fetch("yandexweb_cookie")) === false){ | ||||||
|  | 			 | ||||||
|  | 			$proxy = $this->backend->get_ip(); | ||||||
|  | 			 | ||||||
|  | 			$cookie = | ||||||
|  | 				$this->get( | ||||||
|  | 					$proxy, | ||||||
|  | 					"https://yandex.ru/support2/smart-captcha/ru/", | ||||||
|  | 					[], | ||||||
|  | 					false, | ||||||
|  | 					0 | ||||||
|  | 				); | ||||||
|  | 			 | ||||||
|  | 			apcu_store("yandexweb_cookie", $cookie); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
| 		if($get["npt"]){ | 		if($get["npt"]){ | ||||||
| 			 | 			 | ||||||
| 			[$npt, $proxy] = $this->backend->get($get["npt"], "web"); | 			[$npt, $proxy] = $this->backend->get($get["npt"], "web"); | ||||||
| @@ -226,7 +290,8 @@ class yandex{ | |||||||
| 					$proxy, | 					$proxy, | ||||||
| 					"https://yandex.com" . $npt, | 					"https://yandex.com" . $npt, | ||||||
| 					[], | 					[], | ||||||
| 					"yes" | 					"yes", | ||||||
|  | 					$cookie | ||||||
| 				); | 				); | ||||||
| 		}else{ | 		}else{ | ||||||
| 			 | 			 | ||||||
| @@ -236,7 +301,7 @@ class yandex{ | |||||||
| 				throw new Exception("Search term is empty!"); | 				throw new Exception("Search term is empty!"); | ||||||
| 			} | 			} | ||||||
| 			 | 			 | ||||||
| 			$proxy = $this->backend->get_ip(); | 			$proxy = !isset($proxy) ? $this->backend->get_ip() : $proxy; | ||||||
| 			$lang = $get["lang"]; | 			$lang = $get["lang"]; | ||||||
| 			$older = $get["older"]; | 			$older = $get["older"]; | ||||||
| 			$newer = $get["newer"]; | 			$newer = $get["newer"]; | ||||||
| @@ -283,7 +348,8 @@ class yandex{ | |||||||
| 						$proxy, | 						$proxy, | ||||||
| 						"https://yandex.com/search/site/", | 						"https://yandex.com/search/site/", | ||||||
| 						$params, | 						$params, | ||||||
| 						"yes" | 						"yes", | ||||||
|  | 						$cookie | ||||||
| 					); | 					); | ||||||
| 			}catch(Exception $error){ | 			}catch(Exception $error){ | ||||||
| 				 | 				 | ||||||
| @@ -314,6 +380,19 @@ class yandex{ | |||||||
| 		 | 		 | ||||||
| 		$this->fuckhtml->load($html); | 		$this->fuckhtml->load($html); | ||||||
| 		 | 		 | ||||||
|  | 		// Scrape page blocked error | ||||||
|  | 		$title = | ||||||
|  | 			$this->fuckhtml | ||||||
|  | 			->getElementsByTagName("title"); | ||||||
|  | 		 | ||||||
|  | 		if( | ||||||
|  | 			count($title) !== 0 && | ||||||
|  | 			$title[0]["innerHTML"] == "403" | ||||||
|  | 		){ | ||||||
|  | 			 | ||||||
|  | 			throw new Exception("Yandex blocked this proxy or 4get instance."); | ||||||
|  | 		} | ||||||
|  | 		 | ||||||
| 		// get nextpage | 		// get nextpage | ||||||
| 		$npt = | 		$npt = | ||||||
| 			$this->fuckhtml | 			$this->fuckhtml | ||||||
| @@ -668,7 +747,6 @@ class yandex{ | |||||||
| 		foreach($json["blocks"] as $block){ | 		foreach($json["blocks"] as $block){ | ||||||
| 			 | 			 | ||||||
| 			$html .= $block["html"]; | 			$html .= $block["html"]; | ||||||
| 			 |  | ||||||
| 			// get next page | 			// get next page | ||||||
| 			if( | 			if( | ||||||
| 				isset($block["params"]["nextPageUrl"]) && | 				isset($block["params"]["nextPageUrl"]) && | ||||||
|   | |||||||
| @@ -255,13 +255,6 @@ class yep{ | |||||||
| 		// use http2 | 		// use http2 | ||||||
| 		curl_setopt($curlproc, CURLOPT_HTTP_VERSION, CURL_HTTP_VERSION_2_0); | 		curl_setopt($curlproc, CURLOPT_HTTP_VERSION, CURL_HTTP_VERSION_2_0); | ||||||
| 		 | 		 | ||||||
| 		// set ciphers |  | ||||||
| 		curl_setopt( |  | ||||||
| 			$curlproc, |  | ||||||
| 			CURLOPT_SSL_CIPHER_LIST, |  | ||||||
| 			"aes_128_gcm_sha_256,chacha20_poly1305_sha_256,aes_256_gcm_sha_384,ecdhe_ecdsa_aes_128_gcm_sha_256,ecdhe_rsa_aes_128_gcm_sha_256,ecdhe_ecdsa_chacha20_poly1305_sha_256,ecdhe_rsa_chacha20_poly1305_sha_256,ecdhe_ecdsa_aes_256_gcm_sha_384,ecdhe_rsa_aes_256_gcm_sha_384,ecdhe_ecdsa_aes_256_sha,ecdhe_ecdsa_aes_128_sha,ecdhe_rsa_aes_128_sha,ecdhe_rsa_aes_256_sha,rsa_aes_128_gcm_sha_256,rsa_aes_256_gcm_sha_384,rsa_aes_128_sha,rsa_aes_256_sha" |  | ||||||
| 		); |  | ||||||
| 		 |  | ||||||
| 		curl_setopt($curlproc, CURLOPT_ENCODING, ""); // default encoding | 		curl_setopt($curlproc, CURLOPT_ENCODING, ""); // default encoding | ||||||
| 		curl_setopt($curlproc, CURLOPT_HTTPHEADER, | 		curl_setopt($curlproc, CURLOPT_HTTPHEADER, | ||||||
| 			["User-Agent: " . config::USER_AGENT, | 			["User-Agent: " . config::USER_AGENT, | ||||||
| @@ -351,6 +344,7 @@ class yep{ | |||||||
| 						"type" => "web" | 						"type" => "web" | ||||||
| 					] | 					] | ||||||
| 				); | 				); | ||||||
|  | 			 | ||||||
| 		}catch(Exception $error){ | 		}catch(Exception $error){ | ||||||
| 			 | 			 | ||||||
| 			throw new Exception("Failed to fetch JSON"); | 			throw new Exception("Failed to fetch JSON"); | ||||||
|   | |||||||
| @@ -1209,15 +1209,16 @@ class yt{ | |||||||
| 				 | 				 | ||||||
| 				$reel = | 				$reel = | ||||||
| 					$reel | 					$reel | ||||||
| 					->reelItemRenderer; | 					->shortsLockupViewModel; | ||||||
| 				 | 				 | ||||||
| 				array_push( | 				array_push( | ||||||
| 					$this->out["reel"], | 					$this->out["reel"], | ||||||
| 					[ | 					[ | ||||||
| 						"title" => | 						"title" => | ||||||
| 							$reel | 							$reel | ||||||
| 							->headline | 							->overlayMetadata | ||||||
| 							->simpleText, | 							->primaryText | ||||||
|  | 							->content, | ||||||
| 						"description" => null, | 						"description" => null, | ||||||
| 						"author" => [ | 						"author" => [ | ||||||
| 							"name" => null, | 							"name" => null, | ||||||
| @@ -1225,30 +1226,22 @@ class yt{ | |||||||
| 							"avatar" => null | 							"avatar" => null | ||||||
| 						], | 						], | ||||||
| 						"date" => null, | 						"date" => null, | ||||||
| 						"duration" => | 						"duration" => null, | ||||||
| 							$this->textualtime2int( | 						"views" => null, | ||||||
| 								$reel |  | ||||||
| 								->accessibility |  | ||||||
| 								->accessibilityData |  | ||||||
| 								->label |  | ||||||
| 							), |  | ||||||
| 						"views" => |  | ||||||
| 							$this->truncatedcount2int( |  | ||||||
| 								$reel |  | ||||||
| 								->viewCountText |  | ||||||
| 								->simpleText |  | ||||||
| 							), |  | ||||||
| 						"thumb" => [ | 						"thumb" => [ | ||||||
| 							"url" => | 							"url" => | ||||||
| 								$reel | 								$reel | ||||||
| 								->thumbnail | 								->thumbnail | ||||||
| 								->thumbnails[0] | 								->sources[0] | ||||||
| 								->url, | 								->url, | ||||||
| 							"ratio" => "9:16" | 							"ratio" => "9:16" | ||||||
| 						], | 						], | ||||||
| 						"url" => | 						"url" => | ||||||
| 							"https://www.youtube.com/watch?v=" . | 							"https://www.youtube.com/watch?v=" . | ||||||
| 							$reel | 							$reel | ||||||
|  | 							->onTap | ||||||
|  | 							->innertubeCommand | ||||||
|  | 							->reelWatchEndpoint | ||||||
| 							->videoId | 							->videoId | ||||||
| 					] | 					] | ||||||
| 				); | 				); | ||||||
|   | |||||||
							
								
								
									
										64
									
								
								settings.php
									
									
									
									
									
								
							
							
						
						
									
										64
									
								
								settings.php
									
									
									
									
									
								
							| @@ -125,6 +125,10 @@ $settings = [ | |||||||
| 						"value" => "brave", | 						"value" => "brave", | ||||||
| 						"text" => "Brave" | 						"text" => "Brave" | ||||||
| 					], | 					], | ||||||
|  | 					[ | ||||||
|  | 						"value" => "mullvad_brave", | ||||||
|  | 						"text" => "Mullvad (Brave)" | ||||||
|  | 					], | ||||||
| 					[ | 					[ | ||||||
| 						"value" => "yandex", | 						"value" => "yandex", | ||||||
| 						"text" => "Yandex" | 						"text" => "Yandex" | ||||||
| @@ -133,10 +137,18 @@ $settings = [ | |||||||
| 						"value" => "google", | 						"value" => "google", | ||||||
| 						"text" => "Google" | 						"text" => "Google" | ||||||
| 					], | 					], | ||||||
|  | 					[ | ||||||
|  | 						"value" => "google_api", | ||||||
|  | 						"text" => "Google API" | ||||||
|  | 					], | ||||||
| 					[ | 					[ | ||||||
| 						"value" => "google_cse", | 						"value" => "google_cse", | ||||||
| 						"text" => "Google CSE" | 						"text" => "Google CSE" | ||||||
| 					], | 					], | ||||||
|  | 					[ | ||||||
|  | 						"value" => "mullvad_google", | ||||||
|  | 						"text" => "Mullvad (Google)" | ||||||
|  | 					], | ||||||
| 					[ | 					[ | ||||||
| 						"value" => "startpage", | 						"value" => "startpage", | ||||||
| 						"text" => "Startpage" | 						"text" => "Startpage" | ||||||
| @@ -169,6 +181,14 @@ $settings = [ | |||||||
| 						"value" => "mojeek", | 						"value" => "mojeek", | ||||||
| 						"text" => "Mojeek" | 						"text" => "Mojeek" | ||||||
| 					], | 					], | ||||||
|  | 					[ | ||||||
|  | 						"value" => "baidu", | ||||||
|  | 						"text" => "Baidu" | ||||||
|  | 					], | ||||||
|  | 					[ | ||||||
|  | 						"value" => "coccoc", | ||||||
|  | 						"text" => "Cốc Cốc" | ||||||
|  | 					], | ||||||
| 					[ | 					[ | ||||||
| 						"value" => "solofield", | 						"value" => "solofield", | ||||||
| 						"text" => "Solofield" | 						"text" => "Solofield" | ||||||
| @@ -223,14 +243,34 @@ $settings = [ | |||||||
| 						"value" => "yep", | 						"value" => "yep", | ||||||
| 						"text" => "Yep" | 						"text" => "Yep" | ||||||
| 					], | 					], | ||||||
|  | 					[ | ||||||
|  | 						"value" => "baidu", | ||||||
|  | 						"text" => "Baidu" | ||||||
|  | 					], | ||||||
| 					[ | 					[ | ||||||
| 						"value" => "solofield", | 						"value" => "solofield", | ||||||
| 						"text" => "Solofield" | 						"text" => "Solofield" | ||||||
| 					], | 					], | ||||||
| 					/*[ | 					[ | ||||||
| 						"value" => "pinterest", | 						"value" => "pinterest", | ||||||
| 						"text" => "Pinterest" | 						"text" => "Pinterest" | ||||||
| 					],*/ | 					], | ||||||
|  | 					[ | ||||||
|  | 						"value" => "cara", | ||||||
|  | 						"text" => "Cara" | ||||||
|  | 					], | ||||||
|  | 					[ | ||||||
|  | 						"value" => "flickr", | ||||||
|  | 						"text" => "Flickr" | ||||||
|  | 					], | ||||||
|  | 					[ | ||||||
|  | 						"value" => "fivehpx", | ||||||
|  | 						"text" => "500px" | ||||||
|  | 					], | ||||||
|  | 					[ | ||||||
|  | 						"value" => "vsco", | ||||||
|  | 						"text" => "VSCO" | ||||||
|  | 					], | ||||||
| 					[ | 					[ | ||||||
| 						"value" => "imgur", | 						"value" => "imgur", | ||||||
| 						"text" => "Imgur" | 						"text" => "Imgur" | ||||||
| @@ -249,6 +289,14 @@ $settings = [ | |||||||
| 						"value" => "yt", | 						"value" => "yt", | ||||||
| 						"text" => "YouTube" | 						"text" => "YouTube" | ||||||
| 					], | 					], | ||||||
|  | 					[ | ||||||
|  | 						"value" => "vimeo", | ||||||
|  | 						"text" => "Vimeo" | ||||||
|  | 					], | ||||||
|  | 					[ | ||||||
|  | 						"value" => "sepiasearch", | ||||||
|  | 						"text" => "Sepia Search" | ||||||
|  | 					], | ||||||
| 					[ | 					[ | ||||||
| 						"value" => "ddg", | 						"value" => "ddg", | ||||||
| 						"text" => "DuckDuckGo" | 						"text" => "DuckDuckGo" | ||||||
| @@ -273,6 +321,14 @@ $settings = [ | |||||||
| 						"value" => "qwant", | 						"value" => "qwant", | ||||||
| 						"text" => "Qwant" | 						"text" => "Qwant" | ||||||
| 					], | 					], | ||||||
|  | 					[ | ||||||
|  | 						"value" => "baidu", | ||||||
|  | 						"text" => "Baidu" | ||||||
|  | 					], | ||||||
|  | 					[ | ||||||
|  | 						"value" => "coccoc", | ||||||
|  | 						"text" => "Cốc Cốc" | ||||||
|  | 					], | ||||||
| 					[ | 					[ | ||||||
| 						"value" => "solofield", | 						"value" => "solofield", | ||||||
| 						"text" => "Solofield" | 						"text" => "Solofield" | ||||||
| @@ -310,6 +366,10 @@ $settings = [ | |||||||
| 					[ | 					[ | ||||||
| 						"value" => "mojeek", | 						"value" => "mojeek", | ||||||
| 						"text" => "Mojeek" | 						"text" => "Mojeek" | ||||||
|  | 					], | ||||||
|  | 					[ | ||||||
|  | 						"value" => "baidu", | ||||||
|  | 						"text" => "Baidu" | ||||||
| 					] | 					] | ||||||
| 				] | 				] | ||||||
| 			], | 			], | ||||||
|   | |||||||
| @@ -1,31 +1,30 @@ | |||||||
| :root{ | :root{ | ||||||
| 	--1d2021: #1d2021; | 	--1d2021:#1d2021; | ||||||
| 	--282828: #282828; | 	--282828:#282828; | ||||||
| 	--3c3836: #3c3836; | 	--3c3836:#3c3836; | ||||||
| 	--504945: #504945; | 	--504945:#504945; | ||||||
|  |  | ||||||
| 	/* font */ | 	/* font */ | ||||||
| 	--928374: #928374; | 	--928374:#928374; | ||||||
| 	--a89984: #c9c5bf; | 	--a89984:#c9c5bf; | ||||||
| 	--bdae93: #bdae93; | 	--bdae93:#bdae93; | ||||||
| 	--8ec07c: #8ec07c; | 	--8ec07c:#8ec07c; | ||||||
| 	--ebdbb2: #ebdbb2; | 	--ebdbb2:#ebdbb2; | ||||||
| } | } | ||||||
|  |  | ||||||
|  |  | ||||||
|  |  | ||||||
| body{ | body{ | ||||||
| 	padding:15px 4% 40px; | 	padding:15px 4% 40px; | ||||||
|  | 	margin:unset; | ||||||
| } | } | ||||||
|  |  | ||||||
| h1,h2,h3,h4,h5,h6{ | h1, h2, h3, h4, h5, h6{ | ||||||
| 	padding:0; | 	padding:0; | ||||||
| 	margin:0 0 7px 0; | 	margin:0 0 7px 0; | ||||||
| 	line-height:initial; | 	line-height:initial; | ||||||
| 	color:var(--bdae93); | 	color:var(--bdae93); | ||||||
| } | } | ||||||
|  |  | ||||||
| h3,h4,h5,h6{ | h3, h4, h5, h6{ | ||||||
| 	margin-bottom:14px; | 	margin-bottom:14px; | ||||||
| } | } | ||||||
|  |  | ||||||
| @@ -37,11 +36,10 @@ h3,h4,h5,h6{ | |||||||
| 	float:right; | 	float:right; | ||||||
| 	cursor:pointer; | 	cursor:pointer; | ||||||
| 	padding:0 10px; | 	padding:0 10px; | ||||||
|   border-left: 1px solid var(--504945); | 	border-left:1px solid var(--504945); | ||||||
|   background: #723c0b; | 	background:#723c0b; | ||||||
| } | } | ||||||
|  |  | ||||||
|  |  | ||||||
| .searchbox input{ | .searchbox input{ | ||||||
| 	all:unset; | 	all:unset; | ||||||
| 	line-height:36px; | 	line-height:36px; | ||||||
| @@ -96,7 +94,6 @@ h3,h4,h5,h6{ | |||||||
| 	display:inline-block; | 	display:inline-block; | ||||||
| } | } | ||||||
|  |  | ||||||
|  |  | ||||||
| .tabs .tab.selected{ | .tabs .tab.selected{ | ||||||
| 	border-bottom:2px solid #fc92a5; | 	border-bottom:2px solid #fc92a5; | ||||||
| } | } | ||||||
| @@ -106,7 +103,7 @@ h3,h4,h5,h6{ | |||||||
| 	padding-bottom:12px; | 	padding-bottom:12px; | ||||||
| 	padding-top:7px; | 	padding-top:7px; | ||||||
| 	margin-bottom:7px; | 	margin-bottom:7px; | ||||||
| 	background-color:#232525 | 	background-color:#232525; | ||||||
| } | } | ||||||
|  |  | ||||||
| .filters .filter{ | .filters .filter{ | ||||||
| @@ -169,7 +166,6 @@ h3,h4,h5,h6{ | |||||||
| 	font-size:12px; | 	font-size:12px; | ||||||
| } | } | ||||||
|  |  | ||||||
|  |  | ||||||
| .web .hover{ | .web .hover{ | ||||||
| 	display:block; | 	display:block; | ||||||
| 	text-decoration:none; | 	text-decoration:none; | ||||||
| @@ -193,16 +189,13 @@ h3,h4,h5,h6{ | |||||||
| 	color:#9760b1 !important; | 	color:#9760b1 !important; | ||||||
| } | } | ||||||
|  |  | ||||||
|  |  | ||||||
| .web .text-result .greentext{ | .web .text-result .greentext{ | ||||||
| 	font-size:14px; | 	font-size:14px; | ||||||
| 	color:var(--bdae93); | 	color:var(--bdae93); | ||||||
| } | } | ||||||
|  |  | ||||||
|  |  | ||||||
| /* favicon */ | /* favicon */ | ||||||
|  |  | ||||||
|  |  | ||||||
| .favicon-dropdown a{ | .favicon-dropdown a{ | ||||||
| 	text-decoration:none; | 	text-decoration:none; | ||||||
| 	color:#d3d0c1; | 	color:#d3d0c1; | ||||||
| @@ -211,37 +204,31 @@ h3,h4,h5,h6{ | |||||||
| 	font-size:13px; | 	font-size:13px; | ||||||
| } | } | ||||||
|  |  | ||||||
|  | .web .favicon img, .favicon-dropdown img{ | ||||||
| .web .favicon img, |  | ||||||
| .favicon-dropdown img{ |  | ||||||
| 	margin:3px 7px 0 0; | 	margin:3px 7px 0 0; | ||||||
| 	height:16px; | 	height:16px; | ||||||
| 	font-size:12px; | 	font-size:12px; | ||||||
| 	line-height:16px;; | 	line-height:16px; | ||||||
| 	display:block; | 	display:block; | ||||||
| 	text-align:left; | 	text-align:left; | ||||||
| } | } | ||||||
|  |  | ||||||
|  |  | ||||||
| .web .sublinks{ | .web .sublinks{ | ||||||
| 	padding:17px 10px; | 	padding:17px 10px; | ||||||
| 	font-size:15px; | 	font-size:15px; | ||||||
| 	color:var(--#928374); | 	color:var(--#928374); | ||||||
| } | } | ||||||
|  |  | ||||||
|  |  | ||||||
| .web .text-result .sublinks:last-child{ | .web .text-result .sublinks:last-child{ | ||||||
| 	padding-bottom:0; | 	padding-bottom:0; | ||||||
| } | } | ||||||
|  |  | ||||||
|  |  | ||||||
| /* Wikipedia head */ | /* Wikipedia head */ | ||||||
| .wiki-head{ | .wiki-head{ | ||||||
| 	padding:5px; | 	padding:5px; | ||||||
| 	background-color: #322f2b | 	background-color:#322f2b; | ||||||
| } | } | ||||||
|  |  | ||||||
|  |  | ||||||
| /* | /* | ||||||
|   Images tab |   Images tab | ||||||
| */ | */ | ||||||
| @@ -257,8 +244,6 @@ h3,h4,h5,h6{ | |||||||
| 	float:left; | 	float:left; | ||||||
| } | } | ||||||
|  |  | ||||||
|  |  | ||||||
|  |  | ||||||
| #images .image .title{ | #images .image .title{ | ||||||
| 	white-space:nowrap; | 	white-space:nowrap; | ||||||
| 	overflow:hidden; | 	overflow:hidden; | ||||||
| @@ -267,7 +252,6 @@ h3,h4,h5,h6{ | |||||||
| 	color:var(--bdae93); | 	color:var(--bdae93); | ||||||
| } | } | ||||||
|  |  | ||||||
|  |  | ||||||
| #popup-status{ | #popup-status{ | ||||||
| 	display:none; | 	display:none; | ||||||
| 	position:fixed; | 	position:fixed; | ||||||
| @@ -283,40 +267,56 @@ h3,h4,h5,h6{ | |||||||
|   Settings page |   Settings page | ||||||
| */ | */ | ||||||
|  |  | ||||||
|  |  | ||||||
| .web .settings-submit a{ | .web .settings-submit a{ | ||||||
| 	margin-right:17px; | 	margin-right:17px; | ||||||
| 	color:#bdae93; | 	color:#bdae93; | ||||||
| } | } | ||||||
|  |  | ||||||
|  |  | ||||||
| /* | /* | ||||||
|   Responsive image |   Responsive image | ||||||
| */ | */ | ||||||
| @media only screen and (max-width: 1454px){ #images .image-wrapper{ width:25%; } } | @media only screen and (max-width:1454px){ | ||||||
| @media only screen and (max-width: 1161px){ #images .image-wrapper{ width:25%; } } | 	#images .image-wrapper{ | ||||||
| @media only screen and (max-width: 750px){ #images .image-wrapper{ width:50%; } } | 		width:25%; | ||||||
| @media only screen and (max-width: 450px){ #images .image-wrapper{ width:100%; } } | 	} | ||||||
|  | } | ||||||
|  |  | ||||||
|  | @media only screen and (max-width:1161px){ | ||||||
|  | 	#images .image-wrapper{ | ||||||
|  | 		width:25%; | ||||||
|  | 	} | ||||||
|  | } | ||||||
|  |  | ||||||
|  | @media only screen and (max-width:750px){ | ||||||
|  | 	#images .image-wrapper{ | ||||||
|  | 		width:50%; | ||||||
|  | 	} | ||||||
|  | } | ||||||
|  |  | ||||||
|  | @media only screen and (max-width:450px){ | ||||||
|  | 	#images .image-wrapper{ | ||||||
|  | 		width:100%; | ||||||
|  | 	} | ||||||
|  | } | ||||||
|  |  | ||||||
| /* | /* | ||||||
|   Responsive design |   Responsive design | ||||||
| */ | */ | ||||||
| @media only screen and (max-width: 1550px){ |  | ||||||
|  |  | ||||||
| 	 | @media only screen and (max-width:1550px){ | ||||||
| 	.web .left, | .web .left, | ||||||
| 	.searchbox{ | 	.searchbox{ | ||||||
| 		width:60%; | 		width:60%; | ||||||
| 	} | 	} | ||||||
|  |  | ||||||
| } | } | ||||||
|  |  | ||||||
| @media only screen and (max-width: 1000px){ | @media only screen and (max-width:1100px){ | ||||||
|  | .web .left, | ||||||
| } | 	.searchbox{ | ||||||
|  | 		width:100%; | ||||||
|     .type{ |  | ||||||
|     color:var(--bdae93); |  | ||||||
| 	} | 	} | ||||||
| } | } | ||||||
|  |  | ||||||
|  | .type{ | ||||||
|  | 	color:var(--bdae93); | ||||||
|  | } | ||||||
|   | |||||||
							
								
								
									
										17
									
								
								static/themes/Kuuro.css
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										17
									
								
								static/themes/Kuuro.css
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,17 @@ | |||||||
|  | :root{ | ||||||
|  | 	--1d2021: #101010; | ||||||
|  | 	--282828: #1a1a1a; | ||||||
|  | 	--3c3836: #1e1e1e; | ||||||
|  | 	--504945: #232323; | ||||||
|  |  | ||||||
|  | 	--928374: #949494; | ||||||
|  | 	--a89984: #d2d2d2; | ||||||
|  | 	--bdae93: #d2d2d2; | ||||||
|  | 	--8ec07c: #99c794; | ||||||
|  | 	--ebdbb2: #d2d2d2; | ||||||
|  |  | ||||||
|  | 	--comment: #5f6364; | ||||||
|  | 	--default: #cccece; | ||||||
|  | 	--keyword: #c594c5; | ||||||
|  | 	--string:  #99c794; | ||||||
|  | } | ||||||
							
								
								
									
										2
									
								
								web.php
									
									
									
									
									
								
							
							
						
						
									
										2
									
								
								web.php
									
									
									
									
									
								
							| @@ -89,7 +89,7 @@ if($results["spelling"]["type"] != "no_correction"){ | |||||||
| 			'&' . | 			'&' . | ||||||
| 			$frontend->buildquery($get, true) . | 			$frontend->buildquery($get, true) . | ||||||
| 			'&spellcheck=no">' . | 			'&spellcheck=no">' . | ||||||
| 			$results["spelling"]["correction"] . | 			htmlspecialchars($results["spelling"]["correction"]) . | ||||||
| 			'</a>?' . | 			'</a>?' . | ||||||
| 		'</div>'; | 		'</div>'; | ||||||
| } | } | ||||||
|   | |||||||
		Reference in New Issue
	
	Block a user