diff --git a/robots.txt b/robots.txt
new file mode 100644
index 0000000..8ab5dd5
--- /dev/null
+++ b/robots.txt
@@ -0,0 +1,56 @@
+# Default policy for every crawler: everything is allowed except /misc/.
+User-agent: *
+Disallow: /misc/
+
+# TOTAL COPYRIGHT DEATH
+# IP VIOLATION SCANNERS GTFO
+#
+# Each group below bans one named crawler from the entire site. User-agent
+# values are bare product tokens (no version or URL) so that parsers which
+# compare tokens, as RFC 9309 describes, actually match them.
+
+# "This robot collects content from the Internet for the sole purpose of
+# helping educational institutions prevent plagiarism. [...] we compare student
+# papers against the content we find on the Internet to see if we can find
+# similarities." (https://www.turnitin.com/robot/crawlerinfo.html)
+User-agent: TurnitinBot
+Disallow: /
+
+# "NameProtect engages in crawling activity in search of a wide range of brand
+# and other intellectual property violations that may be of interest to our
+# clients." (https://www.nameprotect.com/botinfo.html)
+User-agent: NPBot
+Disallow: /
+
+# "iThenticate is a new service we have developed to combat the piracy of
+# intellectual property and ensure the originality of written work for
+# publishers, non-profit agencies, corporations, and newspapers."
+# (https://www.slysearch.com/)
+User-agent: SlySearch
+Disallow: /
+
+# "BLEXBot assists internet marketers to get information on the link structure
+# of sites and their interlinking on the web, to avoid any technical and
+# possible legal issues and improve overall online experience."
+# (http://webmeup-crawler.com/)
+User-agent: BLEXBot
+Disallow: /
+
+# "Providing Intellectual Property professionals with superior brand protection
+# services by artfully merging the latest technology with expert analysis."
+# (https://www.checkmarknetwork.com/spider.html/)
+# "The Internet is just way to big to effectively police alone." (ACTUAL quote)
+# Full UA string this rule was written for:
+#   CheckMarkNetwork/1.0 (+https://www.checkmarknetwork.com/spider.html)
+User-agent: CheckMarkNetwork
+Disallow: /
+
+# "Stop trademark violations and affiliate non-compliance in paid search.
+# Automatically monitor your partner and affiliates’ online marketing to
+# protect yourself from harmful brand violations and regulatory risks. We
+# regularly crawl websites on behalf of our clients to ensure content
+# compliance with brand and regulatory guidelines."
+# (https://www.brandverity.com/why-is-brandverity-visiting-me)
+# Full UA string this rule was written for: BrandVerity/1.0
+User-agent: BrandVerity
+Disallow: /