Archivo para controlar robots abusivos
This commit is contained in:
parent
396801615e
commit
96ee88de82
270
robots.txt
Normal file
270
robots.txt
Normal file
@ -0,0 +1,270 @@
|
|||||||
|
User-agent: MJ12bot
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
User-agent: Vagabondo
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
User-agent: BaiDuSpider
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
User-agent: Exabot
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
User-agent: Yandex
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
User-agent: BSpider
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
User-agent: MegaIndex
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
User-agent: AhrefsBot
|
||||||
|
Crawl-Delay: 3600
|
||||||
|
|
||||||
|
# Slow down bots
|
||||||
|
User-agent: *
|
||||||
|
Crawl-delay: 10
|
||||||
|
|
||||||
|
# Disallow: Sistrix
|
||||||
|
User-agent: sistrix
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# Disallow: Sistrix
|
||||||
|
User-agent: SISTRIX Crawler
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# Disallow: Sistrix
|
||||||
|
User-agent: SISTRIX
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# Disallow: SEOkicks-Robot
|
||||||
|
User-agent: SEOkicks-Robot
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# Disallow: jobs.de-Robot
|
||||||
|
User-agent: jobs.de-Robot
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# Backlink Analysis
|
||||||
|
user-agent: AhrefsBot
|
||||||
|
disallow: /
|
||||||
|
|
||||||
|
# Bot der Leipziger Unister Holding GmbH
|
||||||
|
user-agent: UnisterBot
|
||||||
|
disallow: /
|
||||||
|
|
||||||
|
# http://moz.com/products
|
||||||
|
User-agent: dotbot
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# http://www.searchmetrics.com
|
||||||
|
User-agent: SearchmetricsBot
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# http://www.majestic12.co.uk/projects/dsearch/mj12bot.php
|
||||||
|
User-agent: MJ12bot
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# http://www.domaintools.com/webmasters/surveybot.php
|
||||||
|
User-agent: SurveyBot
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# http://www.seodiver.com/bot
|
||||||
|
user-agent: SEOdiver
|
||||||
|
disallow: /
|
||||||
|
|
||||||
|
# http://openlinkprofiler.org/bot
|
||||||
|
User-agent: spbot
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# http://www.wotbox.com/bot/
|
||||||
|
User-agent: wotbox
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# http://www.opensiteexplorer.org/dotbot
|
||||||
|
# http://moz.com/researchtools/ose/dotbot
|
||||||
|
User-agent: dotbot
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# http://www.meanpath.com/meanpathbot.html
|
||||||
|
User-agent: meanpathbot
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# http://www.backlinktest.com/crawler.html
|
||||||
|
User-agent: BacklinkCrawler
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# http://www.brandwatch.com/magpie-crawler/
|
||||||
|
User-agent: magpie-crawler
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# http://filterdb.iss.net/crawler/
|
||||||
|
User-agent: oBot
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
User-agent: fr-crawler
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# http://webmeup-crawler.com
|
||||||
|
User-agent: BLEXBot
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# https://megaindex.com/crawler
|
||||||
|
User-agent: MegaIndex.ru
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
User-agent: megaindex.com
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# http://www.cloudservermarket.com
|
||||||
|
User-Agent: CloudServerMarketSpider
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# http://www.trendiction.de/de/publisher/bot
|
||||||
|
User-Agent: trendictionbot
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# http://www.exalead.com
|
||||||
|
User-agent: Exabot
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# http://www.career-x.de/bot.html
|
||||||
|
User-agent: careerbot
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# https://www.lipperhey.com/en/about/
|
||||||
|
User-agent: Lipperhey-Kaus-Australis
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
User-agent: seoscanners.net
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
User-agent: MetaJobBot
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
User-agent: Spiderbot
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
User-agent: LinkStats
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
User-agent: JobboerseBot
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
User-agent: ICCrawler
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
User-agent: Plista
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
User-agent: Domain Re-Animator Bot
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# https://www.lipperhey.com/en/about/
|
||||||
|
User-agent: Lipperhey-Kaus-Australis
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# https://turnitin.com/robot/crawlerinfo.html
|
||||||
|
User-agent: turnitinbot
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# http://help.coccoc.com/
|
||||||
|
User-agent: coccoc
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# ubermetrics-technologies.com
|
||||||
|
User-agent: um-IC
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# datenbutler.de
|
||||||
|
User-agent: mindUpBot
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# http://searchgears.de/uber-uns/crawling-faq.html
|
||||||
|
User-agent: sg-Orbiter
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# http://commoncrawl.org/faq/
|
||||||
|
User-agent: CCBot
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# https://www.qwant.com/
|
||||||
|
User-agent: Qwantify
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# http://linkfluence.net/
|
||||||
|
User-agent: Kraken
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# http://www.botje.com/plukkie.htm
|
||||||
|
User-agent: plukkie
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# https://www.safedns.com/searchbot
|
||||||
|
User-agent: SafeDNSBot
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# http://www.haosou.com/help/help_3_2.html
|
||||||
|
User-agent: 360Spider
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# http://www.haosou.com/help/help_3_2.html
|
||||||
|
User-agent: HaosouSpider
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# http://www.moz.com/dp/rogerbot
|
||||||
|
User-agent: rogerbot
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# http://www.openhose.org/bot.html
|
||||||
|
User-agent: OpenHoseBot
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# http://www.screamingfrog.co.uk/seo-spider/
|
||||||
|
User-agent: Screaming Frog SEO Spider
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# http://thumbsniper.com
|
||||||
|
User-agent: ThumbSniper
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# http://www.radian6.com/crawler
|
||||||
|
User-agent: R6_CommentReader
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
User-agent: ImplisenseBot
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# http://cliqz.com/company/cliqzbot
|
||||||
|
User-agent: Cliqzbot
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# https://www.aihitdata.com/about
|
||||||
|
User-agent: aiHitBot
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# http://www.trendiction.com/en/publisher/bot
|
||||||
|
User-Agent: trendictionbot
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# http://warebay.com/bot.html
|
||||||
|
User-agent: WBSearchBot
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
# Block MegaIndex.ru
|
||||||
|
User-agent: MegaIndex.ru/2.0
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
User-agent: MegaIndex.ru
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
User-agent: megaIndex.ru
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
User-agent: Slurp
|
||||||
|
Disallow: /
|
||||||
|
|
||||||
|
User-agent: MJ12bot
|
||||||
|
Disallow: /
|
||||||
|
|
Loading…
Reference in New Issue
Block a user