
- NOTICE: config.default.php has changed, re-create your config.php!! - [fix] Footer no longer overlaps results - [fix] Search navigation no longer bunched up on smaller displays - [fix] Double search type when searching from start page - [new] Filter for additional/different headers per cURL request - [new] Image search via Openverse API (Access token and cronjob required, see installation instructions) - [new] Image search via Qwant API - [new] Web (recent news) search via Qwant API - [tweak] Merged 'cache' option into 'cache-type', see config.default.php for details - [tweak] Better filtering for duplicate web results - [tweak] File size formatting for images more uniform - [tweak] Optimized curl_multi_exec handling - [tweak] Improved SEO headers - [tweak] Layout tweaks and optimizations for search results, header and footer - [tweak] Removed redundant HTML, CSS and some PHP - [tweak] MagnetDL search disabled by default because of Cloudflare (Will probably be removed in future version) - [tweak] Removed non-functional magnet trackers - [tweak] Added 15 extra public magnet trackers - [change] Removed Ecosia support - [change] Removed Reddit support - [change] Removed 1337x support - [change] Removed MagnetDL support
137 lines
5.1 KiB
PHP
137 lines
5.1 KiB
PHP
<?php
|
|
/* ------------------------------------------------------------------------------------
|
|
* Goosle - A meta search engine for private and fast internet fun.
|
|
*
|
|
* COPYRIGHT NOTICE
|
|
* Copyright 2023-2024 Arnan de Gans. All Rights Reserved.
|
|
*
|
|
* COPYRIGHT NOTICES AND ALL THE COMMENTS SHOULD REMAIN INTACT.
|
|
* By using this code you agree to indemnify Arnan de Gans from any
|
|
* liability that might arise from its use.
|
|
------------------------------------------------------------------------------------ */
|
|
class YahooImageRequest extends EngineRequest {
|
|
public function get_request_url() {
|
|
// Split the query
|
|
$query_terms = explode(" ", strtolower($this->query));
|
|
|
|
// Size override
|
|
$size = "";
|
|
if($query_terms[0] == 'size') {
|
|
$switch = explode(":", $query_terms[0]);
|
|
|
|
if((strlen($switch[1]) >= 3 && strlen($switch[1]) <= 6) && !is_numeric($switch[1])) {
|
|
if($switch[1] == "med") $switch[1] = "medium";
|
|
if($switch[1] == "lrg") $switch[1] = "large";
|
|
if($switch[1] == "xlrg") $switch[1] = "wallpaper";
|
|
|
|
if($switch[1] == "small" || $switch[1] == "medium" || $switch[1] == "large" || $switch[1] == "wallpaper") {
|
|
$size = $switch[1];
|
|
}
|
|
|
|
$this->query = implode(" ", array_slice($query_terms, 1));
|
|
}
|
|
}
|
|
|
|
// p = query
|
|
// imgsz = Image size (small|medium|large|wallpaper)
|
|
|
|
$args = array("p" => $this->query, "imgsz" => $size);
|
|
$url = "https://images.search.yahoo.com/search/images?".http_build_query($args);
|
|
|
|
unset($query_terms, $switch, $size, $args);
|
|
|
|
return $url;
|
|
}
|
|
|
|
public function get_request_headers() {
|
|
return array(
|
|
'Accept' => 'text/html, application/xhtml+xml, application/xml;q=0.8, */*;q=0.7',
|
|
);
|
|
}
|
|
|
|
public function parse_results($response) {
|
|
$results = array();
|
|
$xpath = get_xpath($response);
|
|
|
|
if(!$xpath) return array();
|
|
|
|
// Scrape recommended
|
|
$didyoumean = $xpath->query(".//section[@class='dym-c']/section/h3/a")[0];
|
|
if(!is_null($didyoumean)) {
|
|
$results['did_you_mean'] = $didyoumean->textContent;
|
|
}
|
|
$search_specific = $xpath->query(".//section[@class='dym-c']/section/h5/a")[0];
|
|
if(!is_null($search_specific)) {
|
|
$results['search_specific'] = $search_specific->textContent;
|
|
}
|
|
|
|
// Scrape the results
|
|
// $scrape = $xpath->query("//li[contains(@class, 'ld') and not(contains(@class, 'slotting'))][position() < 101]");
|
|
$scrape = $xpath->query("//li[contains(@class, 'ld') and not(contains(@class, 'ignore'))][position() < 101]");
|
|
|
|
// Set base rank and result amound
|
|
$rank = $results['amount'] = count($scrape);
|
|
|
|
// Nothing found
|
|
if($results['amount'] == 0) return $results;
|
|
|
|
foreach($scrape as $result) {
|
|
$image_thumb = $xpath->evaluate(".//img/@src", $result)[0];
|
|
if(is_null($image_thumb)) continue;
|
|
|
|
$url_data = $xpath->evaluate(".//a/@href", $result)[0];
|
|
if(is_null($url_data)) continue;
|
|
|
|
// Get and prepare meta data
|
|
// -- Relevant $url_data (there is more, but unused by Goosle)
|
|
// w = Image width (1280)
|
|
// h = Image height (720)
|
|
// imgurl = Actual full size image (Used in Yahoo preview/popup)
|
|
// rurl = Url to page where the image is used
|
|
// size = Image size (413.1KB)
|
|
// tt = Website title (Used for image alt text)
|
|
foreach(explode("&", strstr($url_data->textContent, '?')) as &$meta) {
|
|
if(!is_null($meta) || !empty($meta)) {
|
|
$value = explode("=", trim($meta));
|
|
|
|
if(!empty($value[0]) && !empty($value[1])) {
|
|
$usable_data[$value[0]] = urldecode($value[1]);
|
|
}
|
|
}
|
|
unset($meta, $value);
|
|
}
|
|
|
|
// Deal with optional or missing data
|
|
$dimensions_w = (!array_key_exists('w', $usable_data)) ? "" : sanitize($usable_data['w']);
|
|
$dimensions_h = (!array_key_exists('h', $usable_data)) ? "" : sanitize($usable_data['h']);
|
|
$image_full = (!array_key_exists('imgurl', $usable_data)) ? "" : "//".sanitize($usable_data['imgurl']);
|
|
$link = (!array_key_exists('rurl', $usable_data)) ? "" : sanitize($usable_data['rurl']);
|
|
$filesize = (!array_key_exists('size', $usable_data)) ? "" : sanitize($usable_data['size']);
|
|
$alt = (!array_key_exists('tt', $usable_data)) ? "" : sanitize($usable_data['tt']);
|
|
|
|
// Process result
|
|
$image_thumb = sanitize($image_thumb->textContent);
|
|
$filesize = intval(preg_replace('/[^0-9.]/', '', $filesize) * 1000);
|
|
|
|
// filter duplicate IMAGE urls/results
|
|
if(!empty($results['search'])) {
|
|
if(in_array($image_full, array_column($results['search'], "image_full"))) continue;
|
|
}
|
|
|
|
$results['search'][] = array ("id" => uniqid(rand(0, 9999)), "source" => "Yahoo! Images", "image_thumb" => $image_thumb, "alt" => $alt, "image_full" => $image_full, "width" => $dimensions_w, "height" => $dimensions_h, "filesize" => $filesize, "webpage_url" => $link, "engine_rank" => $rank);
|
|
$rank -= 1;
|
|
unset($url_data, $usable_data, $dimensions_w, $dimensions_h, $filesize, $link, $image_full, $alt, $image_thumb);
|
|
}
|
|
unset($response, $xpath, $scrape, $rank);
|
|
|
|
// Add error if there are no search results
|
|
if(empty($results['search'])) {
|
|
$results['error'] = array(
|
|
"message" => "No results found. Please try with less or different keywords!"
|
|
);
|
|
}
|
|
|
|
return $results;
|
|
}
|
|
}
|
|
?>
|