Compare commits

...

3 Commits

Author SHA1 Message Date
lolcat faece63356 fixed soundcloud, fixed API not working, upgraded browser UA 2024-03-20 11:19:27 -04:00
lolcat 697ef3733d config fuckup 2024-03-20 11:00:38 -04:00
lolcat 635b2386d4 fixed google not working in yurop 2024-03-20 10:59:51 -04:00
7 changed files with 42 additions and 18 deletions

View File

@ -16,9 +16,9 @@ $frontend = new frontend();
/*
Captcha
*/
include "lib/captcha_gen.php";
include "lib/bot_protection.php";
$null = null;
new captcha($null, $null, $null, "images", false);
new bot_protection($null, $null, $null, "images", false);
[$scraper, $filters] = $frontend->getscraperfilters(
"images",

View File

@ -16,9 +16,9 @@ $frontend = new frontend();
/*
Captcha
*/
include "lib/captcha_gen.php";
include "lib/bot_protection.php";
$null = null;
new captcha($null, $null, $null, "music", false);
new bot_protection($null, $null, $null, "music", false);
[$scraper, $filters] = $frontend->getscraperfilters(
"music",

View File

@ -16,9 +16,9 @@ $frontend = new frontend();
/*
Captcha
*/
include "lib/captcha_gen.php";
include "lib/bot_protection.php";
$null = null;
new captcha($null, $null, $null, "news", false);
new bot_protection($null, $null, $null, "news", false);
[$scraper, $filters] = $frontend->getscraperfilters(
"news",

View File

@ -16,9 +16,9 @@ $frontend = new frontend();
/*
Captcha
*/
include "lib/captcha_gen.php";
include "lib/bot_protection.php";
$null = null;
new captcha($null, $null, $null, "videos", false);
new bot_protection($null, $null, $null, "videos", false);
[$scraper, $filters] = $frontend->getscraperfilters(
"videos",

View File

@ -16,9 +16,9 @@ $frontend = new frontend();
/*
Captcha
*/
include "lib/captcha_gen.php";
include "lib/bot_protection.php";
$null = null;
new captcha($null, $null, $null, "web", false);
new bot_protection($null, $null, $null, "web", false);
[$scraper, $filters] = $frontend->getscraperfilters(
"web",

View File

@ -83,7 +83,7 @@ class config{
// Default user agent to use for scraper requests. Sometimes ignored to get specific webpages
// Changing this might break things.
const USER_AGENT = "Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:122.0) Gecko/20100101 Firefox/122.0";
const USER_AGENT = "Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:124.0) Gecko/20100101 Firefox/124.0";
// Proxy pool assignments for each scraper
// false = Use server's raw IP
@ -118,8 +118,8 @@ class config{
// SOUNDCLOUD
// Get these parameters by making a search on SoundCloud with the browser's network
// tab open, then filter URLs using "search?q=". (No need to log in)
const SC_USER_ID = "59333-426459-717969-168008";
const SC_CLIENT_TOKEN = "8BBZpqUP1KSN4W6YB64xog2PX4Dw98b1";
const SC_USER_ID = "447501-577662-794348-352629";
const SC_CLIENT_TOKEN = "VNc62l3wxDWS0Ol62j5UYNc1gsZ3UXPv";
// MARGINALIA
// Get an API key by contacting the Marginalia.nu maintainer. The "public" key

View File

@ -522,6 +522,7 @@ class google{
"Accept-Language: en-US,en;q=0.5",
"Accept-Encoding: gzip",
"DNT: 1",
"Cookie: SOCS=CAESNQgCEitib3FfaWRlbnRpdHlmcm9udGVuZHVpc2VydmVyXzIwMjQwMzE3LjA4X3AwGgJlbiAEGgYIgM7orwY",
"Connection: keep-alive",
"Upgrade-Insecure-Requests: 1",
"Sec-Fetch-Dest: document",
@ -977,9 +978,9 @@ class google{
"related" => []
];
if($this->detect_sorry($html)){
if($error = $this->detect_sorry($html)){
throw new Exception("Google blocked this 4get instance. Please set up a proxy!");
throw new Exception($error);
}
$this->parsejavascript($html);
@ -2813,9 +2814,9 @@ class google{
throw new Exception("Failed to get search page");
}
if($this->detect_sorry($html)){
if($error = $this->detect_sorry($html)){
throw new Exception("Google blocked this 4get instance. Please set up a proxy!");
throw new Exception($error);
}
$out = [
@ -3649,7 +3650,30 @@ class google{
$detect_sorry[0]["innerHTML"] == "302 Moved"
){
return true;
// may be consent.google.com in Europe or the /sorry captcha page
$url =
$this->fuckhtml
->getElementsByTagName("a");
if(
strpos(
parse_url(
$this->fuckhtml
->getTextContent(
$url[0]["attributes"]["href"]
),
PHP_URL_PATH
),
"/sorry"
) === 0
){
// found /sorry
return "Google blocked this 4get instance. Please setup a proxy!";
}
// found consent.google, should not happen anymore
return "Google served a GPDR consent form. This should not happen, please report if you encounter this message";
}
return false;