
- NOTICE: config.default.php has changed, re-create your config.php!! - [fix] No longer caches empty results - [fix] No longer make a request if the search query is empty - [fix] Movie highlight/box office cache now works - [fix] Language selector for Qwant, Wikipedia and Duckduckgo - [fix] Season and Episode filter for tv show searches - [fix] Safe search filter now actually works - [fix] Magnet Search category exclusion filter now actually works - [fix] Image size filter works more reliably - [fix] Handling of doublequotes in search queries - [fix] Search sources now show result amounts accurately - [fix] Old cache files are now actually deleted when expired - [fix] Search tabs not properly centered on smaller screens - [new] Box Office page with latest/new downloads from a few supported torrent websites - [new] News page with the latest news from major outlets - [new] Popup with movie info and download links for YTS Movie Highlights - [new] CSS colorschemes configurable in config.php - [new] Easily share magnet links with other Goosle users - [new] Search results from Quant API - [new] Search results from Brave - [new] Image results from Qwant Image API - [new] News results from Hackernews - [new] News results from Yahoo! News - [new] News results from Brave News - [new] News results from Qwant News API - [new] Magnet results from Sukebei.nyaa.si - [new] Special search for IP Lookups via ipify (Search for "ip" or "myip") - [new] Safe search switch for Yahoo! Images - [new] Image size switch for Qwant Images - [new] Merge missing magnet meta data from duplicate results if it doesn't already exist in the matched previous result - [new] Detect meta data for Magnet Search results such as sound and video quality. - [tweak] Cache ttl is now in hours (was minutes) - [tweak] Optimizations in CSS, HTML separators and more - [tweak] Moved icons into CSS so they can be colored using colorschemes - [tweak] Better handling of image results - [tweak] Better handling of empty/incomplete results for all engines - [tweak] Better handling of empty/missing meta data for all magnet engines - [tweak] Better category detection for Limetorrent magnets - [tweak] Raised Magnet search limit to 200 (was 50) - [tweak] Raised Wikipedia search limit to 20 (was 10) - [tweak] Hide magnet results with 0 seeders by default - [tweak] Uniform array formatting for all engines - [tweak] Consistent use of single-quotes and double-qoutes - [tweak] File size string conversion and formatting for all image and magnet engines - [tweak] Update checks are now done weekly(ish) via the Cron job - [tweak] Updated .htaccess caching rules - [removed] CSS for 320px viewport
131 lines
No EOL
4.6 KiB
PHP
131 lines
No EOL
4.6 KiB
PHP
<?php
|
|
/* ------------------------------------------------------------------------------------
|
|
* Goosle - The fast, privacy oriented search tool that just works.
|
|
*
|
|
* COPYRIGHT NOTICE
|
|
* Copyright 2023-2024 Arnan de Gans. All Rights Reserved.
|
|
*
|
|
* COPYRIGHT NOTICES AND ALL THE COMMENTS SHOULD REMAIN INTACT.
|
|
* By using this code you agree to indemnify Arnan de Gans from any
|
|
* liability that might arise from its use.
|
|
------------------------------------------------------------------------------------ */
|
|
abstract class EngineRequest {
|
|
protected $query, $ch, $mh, $opts, $url, $headers;
|
|
|
|
function __construct($opts, $mh) {
|
|
$this->query = $opts->query;
|
|
$this->mh = $mh;
|
|
// Must be in this order :-/
|
|
$this->opts = $opts;
|
|
$this->url = $this->get_request_url();
|
|
|
|
// No search engine url
|
|
if(!$this->url) return;
|
|
|
|
// Skip if there is a cached result (from earlier search)
|
|
if($this->opts->cache_type !== 'off' && has_cached_results($this->opts->cache_type, $this->opts->hash, $this->url, $this->opts->cache_time)) return;
|
|
|
|
// Default headers for the curl request
|
|
$default_headers = array(
|
|
'Accept' => 'text/html, application/xhtml+xml, application/json;q=0.9, application/xml;q=0.8, */*;q=0.7',
|
|
'Accept-Language' => 'en-US,en;q=0.5',
|
|
'Accept-Encoding' => 'gzip, deflate',
|
|
// 'Connection' => 'keep-alive',
|
|
'Upgrade-Insecure-Requests' => '1',
|
|
'User-Agent' => $this->opts->user_agents[array_rand($this->opts->user_agents)],
|
|
'Sec-Fetch-Dest' => 'document',
|
|
'Sec-Fetch-Mode' => 'navigate',
|
|
'Sec-Fetch-Site' => 'none'
|
|
);
|
|
|
|
// Override or remove headers per curl request
|
|
$extra_headers = $this->get_request_headers();
|
|
if(count($extra_headers) > 0) {
|
|
$headers = array_filter(array_replace($default_headers, $extra_headers));
|
|
|
|
foreach($headers as $key => $value) {
|
|
$this->headers[] = $key.': '.$value;
|
|
}
|
|
|
|
unset($key, $value);
|
|
} else {
|
|
$this->headers = $default_headers;
|
|
}
|
|
|
|
unset($default_headers, $extra_headers);
|
|
|
|
// Curl
|
|
$this->ch = curl_init();
|
|
|
|
curl_setopt($this->ch, CURLOPT_URL, $this->url);
|
|
curl_setopt($this->ch, CURLOPT_HTTPGET, 1); // Redundant? Probably...
|
|
curl_setopt($this->ch, CURLOPT_PROTOCOLS, CURLPROTO_HTTPS | CURLPROTO_HTTP);
|
|
curl_setopt($this->ch, CURLOPT_SSL_VERIFYPEER, false);
|
|
curl_setopt($this->ch, CURLOPT_ENCODING, 'gzip,deflate');
|
|
curl_setopt($this->ch, CURLOPT_HTTPHEADER, $this->headers);
|
|
curl_setopt($this->ch, CURLOPT_RETURNTRANSFER, true);
|
|
curl_setopt($this->ch, CURLOPT_FOLLOWLOCATION, true);
|
|
curl_setopt($this->ch, CURLOPT_MAXREDIRS, 5);
|
|
curl_setopt($this->ch, CURLOPT_REDIR_PROTOCOLS, CURLPROTO_HTTPS | CURLPROTO_HTTP);
|
|
curl_setopt($this->ch, CURLOPT_TIMEOUT, 3);
|
|
curl_setopt($this->ch, CURLOPT_VERBOSE, false);
|
|
|
|
if($mh) curl_multi_add_handle($mh, $this->ch);
|
|
}
|
|
|
|
/*--------------------------------------
|
|
// Get search engine url
|
|
--------------------------------------*/
|
|
public function get_request_url() {
|
|
return '';
|
|
}
|
|
|
|
/*--------------------------------------
|
|
// Check if a request to a search engine was successful
|
|
--------------------------------------*/
|
|
public function request_successful() {
|
|
if((isset($this->ch) && curl_getinfo($this->ch)['http_code'] == '200') || ($this->opts->cache_type !== 'off' && has_cached_results($this->opts->cache_type, $this->opts->hash, $this->url, $this->opts->cache_time))) {
|
|
return true;
|
|
}
|
|
|
|
return false;
|
|
}
|
|
|
|
abstract function parse_results($response);
|
|
|
|
/*--------------------------------------
|
|
// Load search results
|
|
--------------------------------------*/
|
|
public function get_results() {
|
|
if(!isset($this->url)) {
|
|
return $this->parse_results(null);
|
|
}
|
|
|
|
// If there is a cached result from an earlier search use that instead
|
|
if($this->opts->cache_type !== 'off' && has_cached_results($this->opts->cache_type, $this->opts->hash, $this->url, $this->opts->cache_time)) {
|
|
return fetch_cached_results($this->opts->cache_type, $this->opts->hash, $this->url);
|
|
}
|
|
|
|
// Curl request
|
|
if(!isset($this->ch)) {
|
|
return $this->parse_results(null);
|
|
}
|
|
|
|
$response = ($this->mh) ? curl_multi_getcontent($this->ch) : curl_exec($this->ch);
|
|
|
|
$results = $this->parse_results($response) ?? array();
|
|
|
|
// Cache last request if there is something to cache
|
|
if($this->opts->cache_type !== 'off') {
|
|
if(count($results) > 0) store_cached_results($this->opts->cache_type, $this->opts->hash, $this->url, $results, $this->opts->cache_time);
|
|
|
|
// Maybe delete old file cache
|
|
if($this->opts->cache_type == 'file') delete_cached_results($this->opts->cache_time);
|
|
}
|
|
|
|
return $results;
|
|
}
|
|
|
|
public static function print_results($results, $opts) {}
|
|
}
|
|
?>
|