mirror of
https://git.lolcat.ca/lolcat/4get.git
synced 2024-11-14 03:49:48 +01:00
Compare commits
No commits in common. "9cd369ac08683575784acb5f1563c2698026a838" and "aaa30c79f5a0f971ec60b6829eaddb02d0724304" have entirely different histories.
9cd369ac08
...
aaa30c79f5
|
@ -28,9 +28,6 @@ class ddg{
|
||||||
|
|
||||||
curl_setopt($curlproc, CURLOPT_URL, $url);
|
curl_setopt($curlproc, CURLOPT_URL, $url);
|
||||||
|
|
||||||
// http2 bypass
|
|
||||||
curl_setopt($curlproc, CURLOPT_HTTP_VERSION, CURL_HTTP_VERSION_2_0);
|
|
||||||
|
|
||||||
switch($reqtype){
|
switch($reqtype){
|
||||||
case self::req_web:
|
case self::req_web:
|
||||||
$headers =
|
$headers =
|
||||||
|
@ -39,33 +36,27 @@ class ddg{
|
||||||
"Accept-Encoding: gzip",
|
"Accept-Encoding: gzip",
|
||||||
"Accept-Language: en-US,en;q=0.5",
|
"Accept-Language: en-US,en;q=0.5",
|
||||||
"DNT: 1",
|
"DNT: 1",
|
||||||
"Sec-GPC: 1",
|
|
||||||
"Connection: keep-alive",
|
"Connection: keep-alive",
|
||||||
"Upgrade-Insecure-Requests: 1",
|
"Upgrade-Insecure-Requests: 1",
|
||||||
"Sec-Fetch-Dest: document",
|
"Sec-Fetch-Dest: document",
|
||||||
"Sec-Fetch-Mode: navigate",
|
"Sec-Fetch-Mode: navigate",
|
||||||
"Sec-Fetch-Site: same-origin",
|
"Sec-Fetch-Site: cross-site",
|
||||||
"Sec-Fetch-User: ?1",
|
"Upgrade-Insecure-Requests: 1"];
|
||||||
"Priority: u=0, i",
|
|
||||||
"TE: trailers"];
|
|
||||||
break;
|
break;
|
||||||
|
|
||||||
case self::req_xhr:
|
case self::req_xhr:
|
||||||
$headers =
|
$headers =
|
||||||
["User-Agent: " . config::USER_AGENT,
|
["User-Agent: " . config::USER_AGENT,
|
||||||
"Accept: application/json, text/javascript, */*; q=0.01",
|
"Accept: */*",
|
||||||
"Accept-Encoding: gzip",
|
"Accept-Encoding: gzip",
|
||||||
"Accept-Language: en-US,en;q=0.5",
|
"Accept-Language: en-US,en;q=0.5",
|
||||||
"Connection: keep-alive",
|
"Connection: keep-alive",
|
||||||
"Referer: https://duckduckgo.com/",
|
"Referer: https://duckduckgo.com/",
|
||||||
"X-Requested-With: XMLHttpRequest",
|
"X-Requested-With: XMLHttpRequest",
|
||||||
"DNT: 1",
|
"DNT: 1",
|
||||||
"Sec-GPC: 1",
|
"Sec-Fetch-Dest: script",
|
||||||
"Connection: keep-alive",
|
"Sec-Fetch-Mode: no-cors",
|
||||||
"Sec-Fetch-Dest: empty",
|
"Sec-Fetch-Site: same-site"];
|
||||||
"Sec-Fetch-Mode: cors",
|
|
||||||
"Sec-Fetch-Site: same-origin",
|
|
||||||
"TE: trailers"];
|
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -1898,12 +1889,12 @@ class ddg{
|
||||||
[$npt, $proxy] = $this->backend->get($get["npt"], "images");
|
[$npt, $proxy] = $this->backend->get($get["npt"], "images");
|
||||||
|
|
||||||
try{
|
try{
|
||||||
$json = $this->get(
|
$json = json_decode($this->get(
|
||||||
$proxy,
|
$proxy,
|
||||||
"https://duckduckgo.com/i.js?" . $npt,
|
"https://duckduckgo.com/i.js?" . $npt,
|
||||||
[],
|
[],
|
||||||
ddg::req_xhr
|
ddg::req_xhr
|
||||||
);
|
), true);
|
||||||
|
|
||||||
}catch(Exception $err){
|
}catch(Exception $err){
|
||||||
|
|
||||||
|
@ -1929,7 +1920,6 @@ class ddg{
|
||||||
|
|
||||||
$filter = [];
|
$filter = [];
|
||||||
$get_filters = [
|
$get_filters = [
|
||||||
"hps" => "1",
|
|
||||||
"q" => $search,
|
"q" => $search,
|
||||||
"iax" => "images",
|
"iax" => "images",
|
||||||
"ia" => "images"
|
"ia" => "images"
|
||||||
|
@ -1980,7 +1970,7 @@ class ddg{
|
||||||
}
|
}
|
||||||
|
|
||||||
$vqd = $vqd[1];
|
$vqd = $vqd[1];
|
||||||
|
|
||||||
// @TODO: s param = image offset
|
// @TODO: s param = image offset
|
||||||
$js_params = [
|
$js_params = [
|
||||||
"l" => $country,
|
"l" => $country,
|
||||||
|
@ -2004,12 +1994,12 @@ class ddg{
|
||||||
}
|
}
|
||||||
|
|
||||||
try{
|
try{
|
||||||
$json = $this->get(
|
$json = json_decode($this->get(
|
||||||
$proxy,
|
$proxy,
|
||||||
"https://duckduckgo.com/i.js",
|
"https://duckduckgo.com/i.js",
|
||||||
$js_params,
|
$js_params,
|
||||||
ddg::req_xhr
|
ddg::req_xhr
|
||||||
);
|
), true);
|
||||||
|
|
||||||
}catch(Exception $err){
|
}catch(Exception $err){
|
||||||
|
|
||||||
|
@ -2017,13 +2007,6 @@ class ddg{
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
$json = json_decode($json, true);
|
|
||||||
|
|
||||||
if($json === null){
|
|
||||||
|
|
||||||
throw new Exception("Failed to decode JSON");
|
|
||||||
}
|
|
||||||
|
|
||||||
$out = [
|
$out = [
|
||||||
"status" => "ok",
|
"status" => "ok",
|
||||||
"npt" => null,
|
"npt" => null,
|
||||||
|
|
|
@ -220,7 +220,6 @@ class marginalia{
|
||||||
"related" => []
|
"related" => []
|
||||||
];
|
];
|
||||||
|
|
||||||
// API scraper
|
|
||||||
if(config::MARGINALIA_API_KEY !== null){
|
if(config::MARGINALIA_API_KEY !== null){
|
||||||
|
|
||||||
try{
|
try{
|
||||||
|
@ -264,57 +263,34 @@ class marginalia{
|
||||||
return $out;
|
return $out;
|
||||||
}
|
}
|
||||||
|
|
||||||
// HTML parser
|
// no more cloudflare!! Parse html by default
|
||||||
$proxy = $this->backend->get_ip();
|
$params = [
|
||||||
|
"query" => $search
|
||||||
|
];
|
||||||
|
|
||||||
if($get["npt"]){
|
foreach(["adtech", "recent", "intitle"] as $v){
|
||||||
|
|
||||||
[$params, $proxy] =
|
if($get[$v] == "yes"){
|
||||||
$this->backend->get(
|
|
||||||
$get["npt"],
|
|
||||||
"web"
|
|
||||||
);
|
|
||||||
|
|
||||||
try{
|
|
||||||
$html =
|
|
||||||
$this->get(
|
|
||||||
$proxy,
|
|
||||||
"https://search.marginalia.nu/search?" . $params
|
|
||||||
);
|
|
||||||
}catch(Exception $error){
|
|
||||||
|
|
||||||
throw new Exception("Failed to get HTML");
|
switch($v){
|
||||||
}
|
|
||||||
|
|
||||||
}else{
|
|
||||||
$params = [
|
|
||||||
"query" => $search
|
|
||||||
];
|
|
||||||
|
|
||||||
foreach(["adtech", "recent", "intitle"] as $v){
|
|
||||||
|
|
||||||
if($get[$v] == "yes"){
|
|
||||||
|
|
||||||
switch($v){
|
case "adtech": $params["adtech"] = "reduce"; break;
|
||||||
|
case "recent": $params["recent"] = "recent"; break;
|
||||||
case "adtech": $params["adtech"] = "reduce"; break;
|
case "adtech": $params["searchTitle"] = "title"; break;
|
||||||
case "recent": $params["recent"] = "recent"; break;
|
|
||||||
case "adtech": $params["searchTitle"] = "title"; break;
|
|
||||||
}
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
try{
|
||||||
|
$html =
|
||||||
|
$this->get(
|
||||||
|
$this->backend->get_ip(),
|
||||||
|
"https://search.marginalia.nu/search",
|
||||||
|
$params
|
||||||
|
);
|
||||||
|
}catch(Exception $error){
|
||||||
|
|
||||||
try{
|
throw new Exception("Failed to get HTML");
|
||||||
$html =
|
|
||||||
$this->get(
|
|
||||||
$proxy,
|
|
||||||
"https://search.marginalia.nu/search",
|
|
||||||
$params
|
|
||||||
);
|
|
||||||
}catch(Exception $error){
|
|
||||||
|
|
||||||
throw new Exception("Failed to get HTML");
|
|
||||||
}
|
|
||||||
}
|
}
|
||||||
|
|
||||||
$this->fuckhtml->load($html);
|
$this->fuckhtml->load($html);
|
||||||
|
@ -411,65 +387,6 @@ class marginalia{
|
||||||
];
|
];
|
||||||
}
|
}
|
||||||
|
|
||||||
// get next page
|
|
||||||
$this->fuckhtml->load($html);
|
|
||||||
|
|
||||||
$pagination =
|
|
||||||
$this->fuckhtml
|
|
||||||
->getElementsByAttributeValue(
|
|
||||||
"aria-label",
|
|
||||||
"pagination",
|
|
||||||
"nav"
|
|
||||||
);
|
|
||||||
|
|
||||||
if(count($pagination) === 0){
|
|
||||||
|
|
||||||
// no pagination
|
|
||||||
return $out;
|
|
||||||
}
|
|
||||||
|
|
||||||
$this->fuckhtml->load($pagination[0]);
|
|
||||||
|
|
||||||
$pages =
|
|
||||||
$this->fuckhtml
|
|
||||||
->getElementsByClassName(
|
|
||||||
"page-link",
|
|
||||||
"a"
|
|
||||||
);
|
|
||||||
|
|
||||||
$found_current_page = false;
|
|
||||||
|
|
||||||
foreach($pages as $page){
|
|
||||||
|
|
||||||
if(
|
|
||||||
stripos(
|
|
||||||
$page["attributes"]["class"],
|
|
||||||
"active"
|
|
||||||
) !== false
|
|
||||||
){
|
|
||||||
|
|
||||||
$found_current_page = true;
|
|
||||||
continue;
|
|
||||||
}
|
|
||||||
|
|
||||||
if($found_current_page){
|
|
||||||
|
|
||||||
// we found current page index, and we iterated over
|
|
||||||
// the next page <a>
|
|
||||||
|
|
||||||
$out["npt"] =
|
|
||||||
$this->backend->store(
|
|
||||||
parse_url(
|
|
||||||
$page["attributes"]["href"],
|
|
||||||
PHP_URL_QUERY
|
|
||||||
),
|
|
||||||
"web",
|
|
||||||
$proxy
|
|
||||||
);
|
|
||||||
break;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
return $out;
|
return $out;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
|
@ -701,11 +701,9 @@ class mojeek{
|
||||||
if(count($thumb) === 2){
|
if(count($thumb) === 2){
|
||||||
|
|
||||||
$answer["thumb"] =
|
$answer["thumb"] =
|
||||||
urldecode(
|
$this->fuckhtml
|
||||||
$this->fuckhtml
|
->getTextContent(
|
||||||
->getTextContent(
|
$thumb[1]
|
||||||
$thumb[1]
|
|
||||||
)
|
|
||||||
);
|
);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
Loading…
Reference in a new issue