2024-12-21 01:02:14 +00:00
|
|
|
[http.middlewares]
|
|
|
|
|
[http.middlewares.bad_bot_block]
|
|
|
|
|
[http.middlewares.bad_bot_block.plugin.badbot]
|
|
|
|
|
userAgent = [
|
2024-12-29 23:20:18 +00:00
|
|
|
"(^| )PTST\/",
|
|
|
|
|
"(^| )sentry\/",
|
|
|
|
|
"(sistrix|SISTRIX) [cC]rawler",
|
|
|
|
|
"007ac9 Crawler",
|
|
|
|
|
"2ip bot",
|
|
|
|
|
"2ip\.ru",
|
2024-12-21 01:02:14 +00:00
|
|
|
"360Spider",
|
2024-12-29 23:20:18 +00:00
|
|
|
"<li>Mozilla/5.0 (compatible; Ask Jeeves/Teoma; +http://about.ask.com/en/docs/about/webmasters.shtml)</li>",
|
|
|
|
|
"A Patent Crawler",
|
|
|
|
|
"A6-Indexer",
|
2024-12-21 01:02:14 +00:00
|
|
|
"ADmantX",
|
2024-12-29 23:20:18 +00:00
|
|
|
"AHC\/",
|
|
|
|
|
"AISearchBot",
|
|
|
|
|
"APIs-Google",
|
2024-12-21 01:02:14 +00:00
|
|
|
"Aboundex",
|
2024-12-29 23:20:18 +00:00
|
|
|
"AcademicBotRTU",
|
|
|
|
|
"AddSearchBot",
|
|
|
|
|
"AddThis",
|
|
|
|
|
"Adidxbot",
|
|
|
|
|
"AdsBot-Google([^-]|$)",
|
|
|
|
|
"AdsBot-Google-Mobile",
|
|
|
|
|
"AdsTxtCrawler",
|
|
|
|
|
"AdvBot",
|
|
|
|
|
"Ahrefs(Bot|SiteAudit)",
|
|
|
|
|
"AlexandriaOrgBot",
|
2024-12-21 01:02:14 +00:00
|
|
|
"AlphaBot",
|
2024-12-29 23:20:18 +00:00
|
|
|
"Amazon CloudFront",
|
|
|
|
|
"Amazonbot",
|
|
|
|
|
"AndersPinkBot",
|
|
|
|
|
"AnyEvent",
|
|
|
|
|
"Apercite",
|
|
|
|
|
"AppEngine-Google",
|
|
|
|
|
"AppInsights",
|
|
|
|
|
"Applebot",
|
|
|
|
|
"ArchiveBot",
|
|
|
|
|
"AspiegelBot",
|
|
|
|
|
"Atom Feed Robot",
|
|
|
|
|
"Audisto Crawler",
|
2024-12-21 01:02:14 +00:00
|
|
|
"AwarioBot",
|
|
|
|
|
"AwarioRssBot",
|
|
|
|
|
"AwarioSmartBot",
|
2024-12-29 23:20:18 +00:00
|
|
|
"B2B Bot",
|
2024-12-21 01:02:14 +00:00
|
|
|
"BDCbot",
|
2024-12-29 23:20:18 +00:00
|
|
|
"BIGLOTRON",
|
|
|
|
|
"BLEXBot\/",
|
|
|
|
|
"BLP_bbot",
|
|
|
|
|
"BTWebClient",
|
|
|
|
|
"BUbiNG",
|
|
|
|
|
"Baidu-YunGuanCe",
|
|
|
|
|
"Baiduspider",
|
|
|
|
|
"Bark[rR]owler",
|
|
|
|
|
"BazQux",
|
|
|
|
|
"BehloolBot",
|
|
|
|
|
"Better Uptime Bot",
|
|
|
|
|
"BingPreview\/",
|
|
|
|
|
"BitBot",
|
|
|
|
|
"BitSightBot\/",
|
2024-12-21 01:02:14 +00:00
|
|
|
"Blackboard",
|
2024-12-29 23:20:18 +00:00
|
|
|
"BlogTraffic\/\d\.\d+ Feed-Fetcher",
|
|
|
|
|
"BomboraBot",
|
|
|
|
|
"Bot\.AraTurka\.com",
|
|
|
|
|
"BoxcarBot",
|
|
|
|
|
"BrandONbot",
|
|
|
|
|
"BrandVerity",
|
|
|
|
|
"BrightEdge Crawler",
|
|
|
|
|
"BublupBot",
|
|
|
|
|
"Buck\/",
|
2024-12-21 01:02:14 +00:00
|
|
|
"Bytespider",
|
2024-12-29 23:20:18 +00:00
|
|
|
"CC Metadata Scaper",
|
2024-12-21 01:02:14 +00:00
|
|
|
"CCBot",
|
2024-12-29 23:20:18 +00:00
|
|
|
"CISPA Webcrawler",
|
|
|
|
|
"Caliperbot",
|
|
|
|
|
"CapsuleChecker",
|
2024-12-21 01:02:14 +00:00
|
|
|
"ChatGPT-User",
|
2024-12-29 23:20:18 +00:00
|
|
|
"CheckMarkNetwork\/",
|
|
|
|
|
"Chrome-Lighthouse",
|
|
|
|
|
"Cincraw",
|
|
|
|
|
"Clickagy",
|
|
|
|
|
"Cliqzbot\/",
|
|
|
|
|
"CloudFlare-AlwaysOnline",
|
|
|
|
|
"CloudFlare-Prefetch",
|
|
|
|
|
"Cloudflare-Healthchecks",
|
|
|
|
|
"Cloudflare-SSLDetector",
|
|
|
|
|
"Cloudflare-Traffic-Manager",
|
2024-12-21 01:02:14 +00:00
|
|
|
"Cocolyzebot",
|
2024-12-29 23:20:18 +00:00
|
|
|
"Companybook-Crawler",
|
|
|
|
|
"ContextAd Bot",
|
|
|
|
|
"CookieHubScan",
|
|
|
|
|
"Cookiebot",
|
|
|
|
|
"CrawlyProjectCrawler",
|
|
|
|
|
"CriteoBot",
|
2024-12-21 01:02:14 +00:00
|
|
|
"CrunchBot",
|
2024-12-29 23:20:18 +00:00
|
|
|
"CrystalSemanticsBot",
|
|
|
|
|
"Cutbot",
|
|
|
|
|
"CyberPatrol",
|
|
|
|
|
"DareBoost",
|
|
|
|
|
"DataForSeoBot",
|
|
|
|
|
"Datafeedwatch",
|
|
|
|
|
"Datanyze",
|
|
|
|
|
"Dataprovider\.com",
|
|
|
|
|
"Daum\/",
|
|
|
|
|
"DeuSu\/",
|
|
|
|
|
"Diffbot\/",
|
|
|
|
|
"Digg Deeper",
|
|
|
|
|
"Digincore bot",
|
|
|
|
|
"Discordbot",
|
|
|
|
|
"Disqus",
|
2024-12-21 01:02:14 +00:00
|
|
|
"DnyzBot",
|
2024-12-29 23:20:18 +00:00
|
|
|
"Domain Re-Animator Bot",
|
2024-12-21 01:02:14 +00:00
|
|
|
"DomainStatsBot",
|
2024-12-29 23:20:18 +00:00
|
|
|
"Domains Project\/",
|
|
|
|
|
"Dragonbot",
|
|
|
|
|
"Dubbotbot",
|
|
|
|
|
"DuckDuckBot",
|
|
|
|
|
"DuckDuckGo-Favicons-Bot",
|
|
|
|
|
"EZID",
|
|
|
|
|
"Embedly",
|
|
|
|
|
"EveryoneSocialBot",
|
|
|
|
|
"Expanse",
|
|
|
|
|
"Experibot",
|
2024-12-21 01:02:14 +00:00
|
|
|
"ExtLinksBot",
|
2024-12-29 23:20:18 +00:00
|
|
|
"Eyeotabot",
|
|
|
|
|
"FAST Enterprise Crawler",
|
|
|
|
|
"FAST-WebCrawler",
|
|
|
|
|
"Facebot",
|
|
|
|
|
"FeedValidator",
|
|
|
|
|
"Feedbin",
|
|
|
|
|
"Feedfetcher-Google",
|
|
|
|
|
"Feedly",
|
|
|
|
|
"Feedspot",
|
2024-12-21 01:02:14 +00:00
|
|
|
"FemtosearchBot",
|
2024-12-29 23:20:18 +00:00
|
|
|
"Fetch\/",
|
|
|
|
|
"Fever",
|
|
|
|
|
"FindITAnswersbot",
|
|
|
|
|
"Flamingo_SearchEngine",
|
|
|
|
|
"FlipboardProxy",
|
|
|
|
|
"FreeWebMonitoring SiteChecker",
|
|
|
|
|
"FreshRSS",
|
|
|
|
|
"FreshpingBot",
|
|
|
|
|
"Friendica",
|
2024-12-21 01:02:14 +00:00
|
|
|
"Fyrebot",
|
2024-12-29 23:20:18 +00:00
|
|
|
"G2 Web Services",
|
2024-12-21 01:02:14 +00:00
|
|
|
"GPTBot",
|
2024-12-29 23:20:18 +00:00
|
|
|
"GarlikCrawler",
|
|
|
|
|
"GeedoBot",
|
2024-12-21 01:02:14 +00:00
|
|
|
"Genieo",
|
2024-12-29 23:20:18 +00:00
|
|
|
"Gigablast",
|
2024-12-21 01:02:14 +00:00
|
|
|
"Gigabot",
|
2024-12-29 23:20:18 +00:00
|
|
|
"GingerCrawler",
|
|
|
|
|
"Gluten Free Crawler\/",
|
|
|
|
|
"GnowitNewsbot",
|
|
|
|
|
"Go-http-client",
|
|
|
|
|
"Google Favicon",
|
|
|
|
|
"Google Web Preview",
|
|
|
|
|
"Google-Adwords-Instant",
|
|
|
|
|
"Google-Certificates-Bridge",
|
|
|
|
|
"Google-InspectionTool",
|
|
|
|
|
"Google-PhysicalWeb",
|
|
|
|
|
"Google-Read-Aloud",
|
|
|
|
|
"Google-Safety",
|
|
|
|
|
"Google-Site-Verification",
|
|
|
|
|
"Google-Structured-Data-Testing-Tool",
|
|
|
|
|
"GoogleOther",
|
|
|
|
|
"Googlebot-Image",
|
|
|
|
|
"Googlebot-Mobile",
|
|
|
|
|
"Googlebot-News",
|
|
|
|
|
"Googlebot-Video",
|
|
|
|
|
"Googlebot\/",
|
|
|
|
|
"Gowikibot",
|
2024-12-21 01:02:14 +00:00
|
|
|
"GrapeshotCrawler",
|
2024-12-29 23:20:18 +00:00
|
|
|
"Grobbot",
|
|
|
|
|
"GroupHigh\/",
|
|
|
|
|
"GroupMeBot",
|
|
|
|
|
"Gwene",
|
2024-12-21 01:02:14 +00:00
|
|
|
"HTTrack",
|
2024-12-29 23:20:18 +00:00
|
|
|
"Hatena",
|
|
|
|
|
"HeadlessChrome",
|
|
|
|
|
"HttpUrlConnection",
|
|
|
|
|
"HubSpot",
|
|
|
|
|
"IAS crawler",
|
|
|
|
|
"ICBot\/",
|
|
|
|
|
"ICC-Crawler",
|
|
|
|
|
"INETDEX-BOT",
|
|
|
|
|
"Iframely",
|
2024-12-21 01:02:14 +00:00
|
|
|
"ImagesiftBot",
|
|
|
|
|
"IndeedBot",
|
2024-12-29 23:20:18 +00:00
|
|
|
"InterfaxScanBot",
|
2024-12-21 01:02:14 +00:00
|
|
|
"InternetMeasurement",
|
2024-12-29 23:20:18 +00:00
|
|
|
"IonCrawl",
|
2024-12-21 01:02:14 +00:00
|
|
|
"IstellaBot",
|
2024-12-29 23:20:18 +00:00
|
|
|
"James BOT",
|
|
|
|
|
"Jamie's Spider",
|
|
|
|
|
"Jetslide",
|
2024-12-21 01:02:14 +00:00
|
|
|
"Jetty",
|
2024-12-29 23:20:18 +00:00
|
|
|
"JobboerseBot",
|
|
|
|
|
"Jooblebot",
|
|
|
|
|
"Jugendschutzprogramm-Crawler",
|
|
|
|
|
"K7MLWCBot",
|
|
|
|
|
"KStandBot",
|
|
|
|
|
"Kemvibot",
|
|
|
|
|
"KeybaseBot",
|
|
|
|
|
"KomodiaBot",
|
|
|
|
|
"KosmioBot",
|
|
|
|
|
"Landau-Media-Spider",
|
|
|
|
|
"Laserlikebot",
|
|
|
|
|
"Leikibot",
|
|
|
|
|
"LightspeedSystemsCrawler",
|
|
|
|
|
"Linespider",
|
|
|
|
|
"Linguee Bot",
|
|
|
|
|
"LinkArchiver",
|
|
|
|
|
"LinkedInBot",
|
|
|
|
|
"LinkisBot",
|
|
|
|
|
"Livelap[bB]ot",
|
|
|
|
|
"Luminator-robots",
|
|
|
|
|
"MBCrawler",
|
2024-12-21 01:02:14 +00:00
|
|
|
"MJ12bot",
|
|
|
|
|
"MTRobot",
|
2024-12-29 23:20:18 +00:00
|
|
|
"MaCoCu",
|
|
|
|
|
"Mail\.RU_Bot",
|
|
|
|
|
"Mastodon",
|
2024-12-21 01:02:14 +00:00
|
|
|
"MauiBot",
|
2024-12-29 23:20:18 +00:00
|
|
|
"Mediapartners \(Googlebot\)",
|
|
|
|
|
"Mediapartners-Google",
|
2024-12-21 01:02:14 +00:00
|
|
|
"Mediatoolkitbot",
|
2024-12-29 23:20:18 +00:00
|
|
|
"MegaIndex",
|
|
|
|
|
"MeltwaterNews",
|
|
|
|
|
"MetaInspector",
|
|
|
|
|
"MetaJobBot",
|
|
|
|
|
"MetaURI",
|
|
|
|
|
"Miniflux\/",
|
|
|
|
|
"MixnodeCache\/",
|
|
|
|
|
"MojeekBot\/",
|
|
|
|
|
"Monsidobot",
|
|
|
|
|
"MoodleBot",
|
|
|
|
|
"Moreover",
|
|
|
|
|
"MuckRack",
|
|
|
|
|
"Multiviewbot",
|
|
|
|
|
"NAVER Blog Rssbot",
|
|
|
|
|
"NING\/",
|
|
|
|
|
"NINJA bot",
|
|
|
|
|
"NIXStatsbot",
|
|
|
|
|
"NTENTbot",
|
|
|
|
|
"Neevabot",
|
|
|
|
|
"NerdByNature\.Bot",
|
|
|
|
|
"NetSystemsResearch",
|
|
|
|
|
"NetcraftSurveyAgent",
|
|
|
|
|
"Neticle Crawler",
|
2024-12-21 01:02:14 +00:00
|
|
|
"Netvibes",
|
2024-12-29 23:20:18 +00:00
|
|
|
"NewsBlur",
|
|
|
|
|
"NextCloud",
|
|
|
|
|
"Nicecrawler",
|
|
|
|
|
"Nimbostratus-Bot",
|
|
|
|
|
"Nmap Scripting Engine",
|
2024-12-21 01:02:14 +00:00
|
|
|
"Nutch",
|
2024-12-29 23:20:18 +00:00
|
|
|
"Nuzzel",
|
|
|
|
|
"OAI-SearchBot",
|
|
|
|
|
"Ocarinabot",
|
|
|
|
|
"OdklBot\/",
|
|
|
|
|
"OpenGraphCheck",
|
|
|
|
|
"OpenHoseBot",
|
|
|
|
|
"OrangeBot\/",
|
2024-12-21 01:02:14 +00:00
|
|
|
"OutclicksBot",
|
2024-12-29 23:20:18 +00:00
|
|
|
"PR-CY\.RU",
|
|
|
|
|
"PagePeeker\/",
|
|
|
|
|
"PageThing",
|
2024-12-21 01:02:14 +00:00
|
|
|
"Pandalytics",
|
2024-12-29 23:20:18 +00:00
|
|
|
"PaperLiBot",
|
|
|
|
|
"Pcore-HTTP",
|
|
|
|
|
"PerplexityBot\/",
|
|
|
|
|
"PetalBot",
|
|
|
|
|
"PhantomJS",
|
|
|
|
|
"PhxBot",
|
|
|
|
|
"PiplBot",
|
|
|
|
|
"PocketParser",
|
|
|
|
|
"Primalbot",
|
|
|
|
|
"PrivacyAwareBot",
|
|
|
|
|
"Pulsepoint",
|
|
|
|
|
"Python-urllib",
|
|
|
|
|
"Qwantify",
|
2024-12-21 01:02:14 +00:00
|
|
|
"RSSingBot",
|
|
|
|
|
"RankActiveLinkBot",
|
2024-12-29 23:20:18 +00:00
|
|
|
"Refindbot",
|
|
|
|
|
"RegionStuttgartBot",
|
|
|
|
|
"RetrevoPageAnalyzer",
|
|
|
|
|
"ReverseEngineeringBot",
|
|
|
|
|
"RewriteCond %{HTTP_USER_AGENT} ^$|\<|\>|\'|\%|\_iRc|\_Works|\@\$x|\<\?|\$x0e|\+select\+|\+union\+|1\,\1\,1\,|2icommerce|3GSE|4all|59\.64\.153\.|88\.0\.106\.|98|85\.17\.|A\_Browser|ABAC|Abont|abot|Accept|Access|Accoo|AceFTP|Acme|ActiveTouristBot|Address|Adopt|adress|adressendeutschland|ADSARobot|agent|ah\-ha|Ahead|AESOP\_com\_SpiderMan|aipbot|Alarm|Albert|Alek|Alexibot|Alligator|AllSubmitter|alma|almaden|ALot|Alpha|aktuelles|Akregat|Amfi|amzn\_assoc|Anal|Anarchie|andit|Anon|AnotherBot|Ansearch|AnswerBus|antivirx|Apexoo|appie|Aqua_Products|Arachmo|archive|arian|ASPSe|ASSORT|aster|Atari|ATHENS|AtHome|Atlocal|Atomic_Email_Hunter|Atomz|Atrop|^attach|attrib|autoemailspider|autohttp|axod|batch|b2w|Back|BackDoorBot|BackStreet|BackWeb|Badass|Baid|Bali|Bandit|Baidu|Barry|BasicHTTP|BatchFTP|bdfetch|beat|Become|Beij|BenchMark|berts|bew|big.brother|Bigfoot|Bilgi|Bison|Bitacle|Biz360|Black|Black.Hole|BlackWidow|bladder.fusion|Blaiz|Blog.Checker|Blogl|BlogPeople|Blogshares.Spiders|Bloodhound|Blow|bmclient|Board|BOI|boitho|Bond|Bookmark.search.tool|boris|Bost|Boston.Project|BotRightHere|Bot.mailto:craftbot@yahoo.com|BotALot|botpaidtoclick|botw|brandwatch|BravoBrian|Brok|Bropwers|Broth|browseabit|BrowseX|Browsezilla|Bruin|bsalsa|Buddy|Build|Built|Bulls|bumblebee|Bunny|Busca|Busi|Buy|bwh3|c\-spider|CafeK|Cafi|camel|Cand|captu|Catch|cd34|Ceg|CFNetwork|cgichk|Cha0s|Chang|chaos|Char|char\(32\,35\)|charlotte|CheeseBot|Chek|CherryPicker|chill|ChinaClaw|CICC|Cisco|Cita|Clam|Claw|Click.Bot|clipping|clshttp|Clush|COAST|ColdFusion|Coll|Comb|commentreader|Compan|contact|Control|contype|Conc|Conv|Copernic|Copi|Copy|Coral|Corn|core-project|cosmos|costa|cr4nk|crank|craft|Crap|Crawler0|Crazy|Cres|cs\-CZ|cuill|Curl|Custo|Cute|CSHttp|Cyber|cyberalert|^DA$|daoBot|DARK|Data|Daten|Daum|dcbot|dcs|Deep|DepS|Detect|Deweb|Diam|Digger|Digimarc|digout4uagent|DIIbot|Dillo|Ding|DISC|discobot|Disp|Ditto|DLC|DnloadMage|DotBot|Doubanbot|Download|Download.Demon|Download.Devil|Download.Wonder|Downloader|drag|DreamPassport|Drec|Drip|dsdl|dsok|DSurf|DTAAgent|DTS|Dual|dumb|DynaWeb|e\-collector|eag|earn|EARTHCOM|EasyDL|ebin|EBM-APPLE|EBrowse|eCatch|echo|ecollector|Edco|edgeio|efp\@gmx\.net|EirGrabber|email|Email.Extractor|EmailCollector|EmailSearch|EmailSiphon|EmailWolf|Emer|empas|Enfi|Enhan|Enterprise\_Search|envolk|erck|EroCr|ESurf|Eval|Evil|Evere|EWH|Exabot|Exact|EXPLOITER|Expre|Extra|ExtractorPro|EyeN|FairAd|Fake|FANG|FAST|fastlwspider|FavOrg|Favorites.Sweeper|Faxo|FDM\_1|FDSE|fetch|FEZhead|Filan|FileHound|find|Firebat|Firefox.2\.0|Firs|Flam|Flash|FlickBot|Flip|fluffy|flunky|focus|Foob|Fooky|Forex|Forum|ForV|Fost|Foto|Foun|Franklin.Locator|freefind|FreshDownload|FrontPage|FSurf|Fuck|Fuer|futile|Fyber|Gais|GalaxyBot|Galbot|Gamespy\_Arcade|GbPl|Gener|geni|Geona|Get|gigabaz|Gira|Ginxbot|gluc|glx.?v|gnome|Go.Zilla|Goldfire|Google.Wireless.Transcoder|Googlebot\-Image|Got\-It|GOFORIT|gonzo|GornKer|GoSearch|^gotit$|gozilla|grab|Grabber|GrabNet|Grub|Grup|Graf|Green.Research|grub|grub\-client|gsa\-cra|GSearch|GT\:\:WWW|GuideBot|guruji|gvfs|Gyps|hack|haha|hailo|Harv|Hatena|Hax|Head|Helm|herit|hgre|hhjhj\@yahoo|Hippo|hloader|HMView|holm|holy|HomePageSearch|HooWWWer|HouxouCrawler|HMSE|HPPrint|htdig|HTTPConnect|httpdown|http.generic|HTTPGet|httplib|HTTPRetriever|HTTrack|human|Huron|hverify|Hybrid|Hyper|ia\_archiver|iaskspi|IBM\_Planetwide|iCCra|ichiro|ID\-Search|IDA|IDBot|IEAuto|IEMPT|iexplore\.exe|iGetter|Ilse|Iltrov|Image|Image.Stripper|Image.Sucker|imagefetch|iimds\_monitor|Incutio|IncyWincy|Indexer|Industry.Program|Indy|InetURL|informant|InfoNav|InfoTekies|Ingelin|Innerpr|Inspect|InstallShield.DigitalWizard|Insuran\.|Intellig|Intelliseek|InterGET|Internet.Ninja|Internet.x|Internet\_Explorer|InternetLinkagent|InternetSeer.com|Intraf|IP2|Ipsel|Iria|IRLbot|Iron33|Irvine|ISC\_Sys|iSilo|ISRCCrawler|ISSpi|IUPUI.Research.Bot|Jady|Jaka|Jam|^Java|java\/|Java\(tm\)|JBH.agent|Jenny|JetB|JetC|jeteye|jiro|JoBo|JOC|jupit|Just|Jyx|Kapere|kash|Kazo|KBee|Kenjin|Kernel|Keywo|KFSW|KKma|Know|kosmix|KRAE|KRetrieve|Krug|ksibot|ksoap|Kum|KWebGet|Lachesis|lanshan|Lapo|larbin|leach
|
|
|
|
|
"RidderBot",
|
|
|
|
|
"Rivva",
|
|
|
|
|
"RuxitSynthetic",
|
|
|
|
|
"RyteBot",
|
|
|
|
|
"SBL-BOT",
|
2024-12-21 01:02:14 +00:00
|
|
|
"SEOkicks",
|
2024-12-29 23:20:18 +00:00
|
|
|
"SEOlizer",
|
|
|
|
|
"SWIMGBot",
|
|
|
|
|
"S[eE][mM]rushBot",
|
|
|
|
|
"SafeDNSBot",
|
|
|
|
|
"SafeSearch microdata crawler",
|
2024-12-21 01:02:14 +00:00
|
|
|
"ScoutJet",
|
|
|
|
|
"Scrapy",
|
2024-12-29 23:20:18 +00:00
|
|
|
"Screaming Frog SEO Spider",
|
|
|
|
|
"SearchAtlas",
|
2024-12-21 01:02:14 +00:00
|
|
|
"Seekport",
|
2024-12-29 23:20:18 +00:00
|
|
|
"SemanticScholarBot",
|
2024-12-21 01:02:14 +00:00
|
|
|
"SentiBot",
|
|
|
|
|
"SenutoBot",
|
|
|
|
|
"SeobilityBot",
|
2024-12-29 23:20:18 +00:00
|
|
|
"SerendeputyBot",
|
|
|
|
|
"SeznamBot",
|
|
|
|
|
"SimpleCrawler",
|
|
|
|
|
"SimplePie",
|
|
|
|
|
"SimpleScraper",
|
2024-12-21 01:02:14 +00:00
|
|
|
"SiteCheckerBotCrawler",
|
2024-12-29 23:20:18 +00:00
|
|
|
"Siteimprove\.com",
|
|
|
|
|
"SkypeUriPreview",
|
|
|
|
|
"Slack-ImgProxy",
|
|
|
|
|
"Slackbot",
|
|
|
|
|
"Slurp",
|
|
|
|
|
"Snacktory",
|
|
|
|
|
"Snap URL Preview Service",
|
2024-12-21 01:02:14 +00:00
|
|
|
"SocialRankIOBot",
|
2024-12-29 23:20:18 +00:00
|
|
|
"Sogou",
|
|
|
|
|
"Sonic",
|
|
|
|
|
"Storebot-Google",
|
|
|
|
|
"StorygizeBot",
|
|
|
|
|
"StractBot",
|
|
|
|
|
"Streamline3Bot\/",
|
|
|
|
|
"Superfeedr",
|
|
|
|
|
"SurdotlyBot",
|
2024-12-21 01:02:14 +00:00
|
|
|
"SurveyBot",
|
2024-12-29 23:20:18 +00:00
|
|
|
"Synapse",
|
|
|
|
|
"Sysomos",
|
|
|
|
|
"Taboolabot",
|
|
|
|
|
"TangibleeBot",
|
|
|
|
|
"TelegramBot",
|
|
|
|
|
"Teoma",
|
|
|
|
|
"Thinklab",
|
|
|
|
|
"TinEye",
|
|
|
|
|
"Tiny Tiny RSS",
|
|
|
|
|
"TombaPublicWebCrawler",
|
|
|
|
|
"ToutiaoSpider",
|
|
|
|
|
"Traackr\.com",
|
|
|
|
|
"TrendsmapResolver",
|
|
|
|
|
"Trove",
|
2024-12-21 01:02:14 +00:00
|
|
|
"Turnitin",
|
2024-12-29 23:20:18 +00:00
|
|
|
"TweetmemeBot",
|
|
|
|
|
"Twingly",
|
|
|
|
|
"Twitterbot",
|
|
|
|
|
"Twurly",
|
|
|
|
|
"UT-Dorkbot",
|
2024-12-21 01:02:14 +00:00
|
|
|
"Upflow",
|
2024-12-29 23:20:18 +00:00
|
|
|
"Uptime-Kuma",
|
|
|
|
|
"UptimeRobot",
|
|
|
|
|
"Uptimebot\.org",
|
|
|
|
|
"UsineNouvelleCrawler",
|
|
|
|
|
"VKRobot",
|
|
|
|
|
"Validator\.nu",
|
|
|
|
|
"Valve\/Steam",
|
2024-12-21 01:02:14 +00:00
|
|
|
"VelenPublicWebCrawler",
|
2024-12-29 23:20:18 +00:00
|
|
|
"Veoozbot",
|
|
|
|
|
"Vercelbot",
|
|
|
|
|
"Viber",
|
|
|
|
|
"Vigil\/",
|
|
|
|
|
"VoluumDSP-content-bot",
|
|
|
|
|
"W3C-checklink",
|
|
|
|
|
"W3C-mobileOK",
|
|
|
|
|
"W3C_CSS_Validator",
|
|
|
|
|
"W3C_I18n-Checker",
|
|
|
|
|
"W3C_Unicorn",
|
|
|
|
|
"W3C_Validator",
|
|
|
|
|
"WeSEE:Search",
|
|
|
|
|
"WebDataStats",
|
|
|
|
|
"WellKnownBot",
|
|
|
|
|
"WhatsApp",
|
|
|
|
|
"WordPress\/",
|
|
|
|
|
"WordupInfoSearch",
|
|
|
|
|
"Xenu Link Sleuth",
|
|
|
|
|
"Y!J",
|
|
|
|
|
"YaK\/",
|
|
|
|
|
"Yahoo Link Preview",
|
|
|
|
|
"YandexRenderResourcesBot\/",
|
|
|
|
|
"Yellowbrandprotectionbot",
|
|
|
|
|
"Yeti",
|
|
|
|
|
"YisouSpider",
|
|
|
|
|
"YouBot",
|
|
|
|
|
"Zabbix",
|
2024-12-21 01:02:14 +00:00
|
|
|
"ZoomBot",
|
|
|
|
|
"ZoominfoBot",
|
|
|
|
|
"ZumBot",
|
2024-12-29 23:20:18 +00:00
|
|
|
"ZuperlistBot\/",
|
|
|
|
|
"[Cc]urebot",
|
|
|
|
|
"[cC]laude[bB]ot",
|
|
|
|
|
"[pP]ingdom",
|
|
|
|
|
"[wW]get",
|
|
|
|
|
"^Apache-HttpClient",
|
|
|
|
|
"^BW\/",
|
|
|
|
|
"^LCC ",
|
|
|
|
|
"^PHP-Curl-Class",
|
|
|
|
|
"^curl",
|
|
|
|
|
"acapbot",
|
|
|
|
|
"acoonbot",
|
|
|
|
|
"adbeat_bot",
|
2024-12-21 01:02:14 +00:00
|
|
|
"adscanner",
|
2024-12-29 23:20:18 +00:00
|
|
|
"aiHitBot",
|
|
|
|
|
"aiohttp",
|
|
|
|
|
"antibot",
|
|
|
|
|
"arabot",
|
|
|
|
|
"archive\.org_bot",
|
|
|
|
|
"awesomecrawler",
|
|
|
|
|
"axios",
|
|
|
|
|
"backlinkcrawler",
|
|
|
|
|
"betaBot",
|
|
|
|
|
"bidswitchbot",
|
|
|
|
|
"bingbot",
|
|
|
|
|
"binlar",
|
|
|
|
|
"bitlybot",
|
|
|
|
|
"blogmuraBot",
|
|
|
|
|
"bnf\.fr_bot",
|
|
|
|
|
"bot-pge\.chlooe\.com",
|
|
|
|
|
"botify",
|
|
|
|
|
"brainobot",
|
|
|
|
|
"buzzbot",
|
|
|
|
|
"cXensebot",
|
|
|
|
|
"careerbot",
|
|
|
|
|
"centurybot",
|
|
|
|
|
"changedetection",
|
|
|
|
|
"check_http",
|
|
|
|
|
"citeseerxbot",
|
|
|
|
|
"coccoc",
|
|
|
|
|
"collection@infegy\.com",
|
|
|
|
|
"content crawler spider",
|
|
|
|
|
"contxbot",
|
|
|
|
|
"convera",
|
2024-12-21 01:02:14 +00:00
|
|
|
"crawler4j",
|
2024-12-29 23:20:18 +00:00
|
|
|
"datagnionbot",
|
|
|
|
|
"dcrawl",
|
|
|
|
|
"deadlinkchecker",
|
|
|
|
|
"deepnoc",
|
|
|
|
|
"developers\.google\.com\/\+\/web\/snippet",
|
|
|
|
|
"discobot",
|
|
|
|
|
"domaincrawler",
|
|
|
|
|
"dotbot",
|
|
|
|
|
"drupact",
|
|
|
|
|
"e\.ventures Investment Crawler",
|
|
|
|
|
"ec2linkfinder",
|
|
|
|
|
"edisterbot",
|
|
|
|
|
"electricmonk",
|
|
|
|
|
"elisabot",
|
|
|
|
|
"epicbot",
|
|
|
|
|
"eright",
|
|
|
|
|
"europarchive\.org",
|
|
|
|
|
"ev-crawler\/",
|
2024-12-21 01:02:14 +00:00
|
|
|
"evc-batch",
|
2024-12-29 23:20:18 +00:00
|
|
|
"exabot",
|
|
|
|
|
"ezooms",
|
|
|
|
|
"facebookcatalog\/",
|
|
|
|
|
"facebookexternalhit",
|
|
|
|
|
"fedoraplanet",
|
|
|
|
|
"feedbot",
|
|
|
|
|
"filterdb\.iss\.net\/crawler",
|
|
|
|
|
"findlink",
|
|
|
|
|
"findthatfile",
|
|
|
|
|
"findxbot",
|
|
|
|
|
"fluffy",
|
|
|
|
|
"fr-crawler",
|
|
|
|
|
"fuelbot",
|
|
|
|
|
"g00g1e\.net",
|
|
|
|
|
"g2reader-bot",
|
|
|
|
|
"gnam gnam spider",
|
|
|
|
|
"google-xrawler",
|
|
|
|
|
"grub\.org",
|
|
|
|
|
"gslfbot",
|
2024-12-21 01:02:14 +00:00
|
|
|
"heritrix",
|
2024-12-29 23:20:18 +00:00
|
|
|
"http_get",
|
|
|
|
|
"https:\/\/developers\.cloudflare\.com\/security-center\/",
|
|
|
|
|
"httpunit",
|
|
|
|
|
"httpx",
|
|
|
|
|
"hypestat",
|
|
|
|
|
"hyscore\.io",
|
|
|
|
|
"ia_archiver",
|
|
|
|
|
"ichiro",
|
|
|
|
|
"imrbot",
|
|
|
|
|
"infoobot",
|
|
|
|
|
"inoreader",
|
|
|
|
|
"integromedb",
|
|
|
|
|
"intelium_bot",
|
|
|
|
|
"ip-web-crawler\.com",
|
2024-12-21 01:02:14 +00:00
|
|
|
"ips-agent",
|
2024-12-29 23:20:18 +00:00
|
|
|
"iskanie",
|
|
|
|
|
"it2media-domain-crawler",
|
|
|
|
|
"jpg-newsbot",
|
|
|
|
|
"jyxobot",
|
|
|
|
|
"lb-spider",
|
|
|
|
|
"libwww-perl",
|
|
|
|
|
"linkapediabot",
|
|
|
|
|
"linkdex",
|
|
|
|
|
"lipperhey",
|
|
|
|
|
"lkxscan",
|
|
|
|
|
"lssbot",
|
|
|
|
|
"lssrocketcrawler",
|
|
|
|
|
"ltx71",
|
2024-12-21 01:02:14 +00:00
|
|
|
"magpie-crawler",
|
2024-12-29 23:20:18 +00:00
|
|
|
"mappydata",
|
|
|
|
|
"memorybot",
|
|
|
|
|
"meta-externalagent\/",
|
|
|
|
|
"meta-externalfetcher\/",
|
|
|
|
|
"mindUpBot",
|
|
|
|
|
"minicrawler",
|
|
|
|
|
"mlbot",
|
|
|
|
|
"moatbot",
|
|
|
|
|
"msnbot",
|
|
|
|
|
"msrbot",
|
|
|
|
|
"nerdybot",
|
|
|
|
|
"netEstate NE Crawler",
|
|
|
|
|
"netresearchserver",
|
|
|
|
|
"newsharecounts",
|
|
|
|
|
"newspaper\/",
|
|
|
|
|
"niki-bot",
|
|
|
|
|
"node-fetch",
|
|
|
|
|
"officestorebot",
|
|
|
|
|
"okhttp",
|
2024-12-21 01:02:14 +00:00
|
|
|
"omgili",
|
2024-12-29 23:20:18 +00:00
|
|
|
"online-webceo-bot",
|
|
|
|
|
"openindexspider",
|
|
|
|
|
"outbrain",
|
|
|
|
|
"page2rss",
|
|
|
|
|
"panscient",
|
|
|
|
|
"phpcrawl",
|
|
|
|
|
"pinterest\.com\/bot",
|
|
|
|
|
"postrank",
|
|
|
|
|
"proximic",
|
|
|
|
|
"psbot",
|
|
|
|
|
"purebot",
|
|
|
|
|
"python-opengraph",
|
|
|
|
|
"python-requests",
|
|
|
|
|
"redditbot",
|
|
|
|
|
"rogerbot",
|
|
|
|
|
"rssbot\/",
|
|
|
|
|
"scribdbot",
|
|
|
|
|
"search\.marginalia\.nu",
|
|
|
|
|
"seekbot",
|
|
|
|
|
"seewithkids",
|
|
|
|
|
"semanticbot",
|
|
|
|
|
"sempi\.tech",
|
2024-12-21 01:02:14 +00:00
|
|
|
"seoscanners",
|
2024-12-29 23:20:18 +00:00
|
|
|
"seostar\.co",
|
|
|
|
|
"serpstatbot\/",
|
|
|
|
|
"sitebot",
|
|
|
|
|
"siteexplorer\.info",
|
|
|
|
|
"smtbot",
|
|
|
|
|
"spbot",
|
|
|
|
|
"speedy",
|
|
|
|
|
"startmebot\/",
|
|
|
|
|
"summify",
|
|
|
|
|
"t3versionsBot",
|
|
|
|
|
"tagoobot",
|
|
|
|
|
"theoldreader\.com",
|
|
|
|
|
"tigerbot",
|
|
|
|
|
"toplistbot",
|
|
|
|
|
"tracemyfile",
|
|
|
|
|
"trendictionbot",
|
|
|
|
|
"trovitBot",
|
|
|
|
|
"tweetedtimes",
|
|
|
|
|
"twengabot",
|
|
|
|
|
"um-LN",
|
|
|
|
|
"urlappendbot",
|
|
|
|
|
"vebidoobot",
|
|
|
|
|
"vercel-screenshot",
|
|
|
|
|
"virustotal",
|
|
|
|
|
"vkShare",
|
|
|
|
|
"voilabot",
|
|
|
|
|
"vuhuvBot",
|
|
|
|
|
"wbsearchbot",
|
|
|
|
|
"web-archive-net\.com\.bot",
|
|
|
|
|
"webcompanycrawler",
|
|
|
|
|
"webmon ",
|
|
|
|
|
"wocbot",
|
|
|
|
|
"woobot",
|
|
|
|
|
"woorankreview\/",
|
|
|
|
|
"woriobot",
|
|
|
|
|
"wotbox",
|
|
|
|
|
"www\.uptime\.com",
|
2024-12-21 01:02:14 +00:00
|
|
|
"x09Mozilla",
|
|
|
|
|
"x22Mozilla",
|
2024-12-29 23:20:18 +00:00
|
|
|
"xovibot",
|
|
|
|
|
"yacybot",
|
|
|
|
|
"yandex\.com\/bots",
|
|
|
|
|
"yanga",
|
|
|
|
|
"yoozBot",
|
|
|
|
|
"zenback bot",
|
2024-12-21 01:02:14 +00:00
|
|
|
"zgrab",
|
|
|
|
|
]
|