2023-11-07 14:04:56 +01:00
|
|
|
<?php
|
|
|
|
// Welcome to the 4get configuration file.
//
// Every setting is exposed as a class constant and read as config::NAME.
// When updating your instance, please make sure this file isn't missing
// any parameters.
class config
{
    // 4get version. Please keep this updated.
    public const VERSION = 8;

    // Will be shown pretty much everywhere.
    public const SERVER_NAME = "4get";

    // Will be shown in the <meta> tag on the home page.
    public const SERVER_SHORT_DESCRIPTION = "4get is a proxy search engine that doesn't suck.";

    // Will be shown in the server list ping (null for no description).
    public const SERVER_LONG_DESCRIPTION = null;

    // Add your own themes in "static/themes". Set to "Dark" for the default theme.
    // Eg. to use "static/themes/Cream.css", specify "Cream".
    public const DEFAULT_THEME = "Dark";

    // Enable the API?
    public const API_ENABLED = true;

    //
    // BOT PROTECTION
    //

    // 0 = disabled, 1 = ask for image captcha, @TODO: 2 = invite only (users need a pass)
    // VERY useful against a targeted attack.
    public const BOT_PROTECTION = 0;

    // If BOT_PROTECTION is set to 1, specify the available datasets here.
    // Each entry is [dataset name, number of images].
    // Images should be named from 1.png to X.png, and be 100x100 in size.
    // Eg. data/captcha/birds/1.png up to 2263.png
    public const CAPTCHA_DATASET = [
        // example:
        //["birds", 2263],
        //["fumo_plushies", 1006],
        //["minecraft", 848]
    ];

    // If this regular expression matches the user agent, the request is blocked.
    // Not useful at all against a targeted attack.
    public const HEADER_REGEX = '/bot|wget|curl|python-requests|scrapy|go-http-client|ruby|yahoo|spider|qwant/i';

    // Block clients who present any of the following headers in their request (SPECIFY IN !!lowercase!!)
    // Eg: ["x-forwarded-for", "x-via", "forwarded-for", "via"];
    // Useful for blocking *some* proxies used for botting.
    public const FILTERED_HEADER_KEYS = [
        //"x-forwarded-for",
        //"x-cluster-client-ip",
        //"x-client-ip",
        //"x-real-ip",
        //"client-ip",
        //"real-ip",
        //"forwarded-for",
        //"forwarded-for-ip",
        //"forwarded",
        //"proxy-connection",
        //"remote-addr",
        //"via"
    ];

    // Block SSL ciphers used by CLI tools used for botting.
    // Basically a primitive version of Cloudflare's browser integrity check.
    // ** If curl can still access the site (with spoofed headers), please make sure you use the new apache2 config **
    // https://git.lolcat.ca/lolcat/4get/docs/apache2.md
    public const DISALLOWED_SSL = [
        // "TLS_AES_256_GCM_SHA384" // used by WGET and CURL
    ];

    // Maximum number of searches per captcha key/pass issued. The counter gets
    // reset on every APCu cache clear (should happen once a day).
    // Only useful when BOT_PROTECTION is NOT set to 0.
    public const MAX_SEARCHES = 100;

    // List of domains that point to your servers. Include your tor/i2p
    // addresses here! Each entry must be a valid URL. Won't affect links
    // placed on the homepage.
    public const ALT_ADDRESSES = [
        //"https://4get.alt-tld",
        //"http://4getwebfrq5zr4sxugk6htxvawqehxtdgjrbcn2oslllcol2vepa23yd.onion"
    ];

    // Known 4get instances. MUST use the https protocol if your instance uses
    // it. Is used to generate a distributed list of instances.
    // To appear in the list of an instance, contact the host; once everyone
    // has added each other, your server should appear everywhere.
    public const INSTANCES = [
        "https://4get.ca",
        "https://4get.zzls.xyz",
        "https://4getus.zzls.xyz",
        "https://4get.silly.computer",
        "https://4get.konakona.moe",
        "https://4get.lvkaszus.pl",
        "https://4g.ggtyler.dev",
        "https://4get.perennialte.ch",
        "https://4get.sijh.net",
        "https://4get.hbubli.cc",
        "https://4get.plunked.party",
        "https://4get.seitan-ayoub.lol",
        "https://4get.etenie.pl",
        "https://4get.lunar.icu",
        "https://4get.dcs0.hu",
        "https://4get.kizuki.lol",
        "https://4get.psily.garden",
        "https://search.milivojevic.in.rs",
        "https://4get.snine.nl",
        "https://4get.datura.network",
        "https://4get.neco.lol",
        "https://4get.lol",
        "https://4get.ch",
        "https://4get.edmateo.site",
        "https://4get.sudovanilla.org",
        "https://search.mint.lgbt",
    ];

    // Default user agent to use for scraper requests. Sometimes ignored to get specific webpages.
    // Changing this might break things.
    public const USER_AGENT = "Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:129.0) Gecko/20100101 Firefox/129.0";

    // Proxy pool assignments for each scraper
    // false = Use server's raw IP
    // string = will load a proxy list from data/proxies
    // Eg. "onion" will load data/proxies/onion.txt
    public const PROXY_DDG = false; // duckduckgo
    public const PROXY_BRAVE = false;
    public const PROXY_FB = false; // facebook
    public const PROXY_GOOGLE = false;
    public const PROXY_STARTPAGE = false;
    public const PROXY_QWANT = false;
    public const PROXY_GHOSTERY = false;
    public const PROXY_MARGINALIA = false;
    public const PROXY_MOJEEK = false;
    public const PROXY_SC = false; // soundcloud
    public const PROXY_SPOTIFY = false;
    public const PROXY_WIBY = false;
    public const PROXY_CURLIE = false;
    public const PROXY_YT = false; // youtube
    public const PROXY_YEP = false;
    public const PROXY_PINTEREST = false;
    public const PROXY_SEZNAM = false;
    public const PROXY_NAVER = false;
    public const PROXY_GREPPR = false;
    public const PROXY_CROWDVIEW = false;
    public const PROXY_MWMBL = false;
    public const PROXY_FTM = false; // findthatmeme
    public const PROXY_IMGUR = false;
    public const PROXY_YANDEX_W = false; // yandex web
    public const PROXY_YANDEX_I = false; // yandex images
    public const PROXY_YANDEX_V = false; // yandex videos

    //
    // Scraper-specific parameters
    //

    // MARGINALIA
    // Use "null" to fall back to HTML scraping OR specify a string to
    // use the API (Eg: "public"). The API has fewer filters.
    public const MARGINALIA_API_KEY = null;
}
|