seirdy.one/static/robots.txt

User-agent: *
Disallow: /noindex/
Disallow: /misc/
Disallow: /webmentions/

# "This robot collects content from the Internet for the sole purpose of helping educational institutions prevent plagiarism. [...] we compare student papers against the content we find on the Internet to see if we can find similarities." (http://www.turnitin.com/robot/crawlerinfo.html)
#  --> fuck off.
User-Agent: TurnitinBot
Disallow: /

# "NameProtect engages in crawling activity in search of a wide range of
# brand and other intellectual property violations that may be of interest
# to our clients." (http://www.nameprotect.com/botinfo.html)
#  --> fuck off.
User-Agent: NPBot
Disallow: /

# "iThenticate is a new service we have developed to combat the piracy of intellectual property and ensure the originality of written work for publishers, non-profit agencies, corporations, and newspapers." (http://www.slysearch.com/)
#  --> fuck off.
User-Agent: SlySearch
Disallow: /

# "BLEXBot assists internet marketers to get information on the link structure of sites and their interlinking on the web, to avoid any technical and possible legal issues and improve overall online experience." (http://webmeup-crawler.com/)
# --> fuck off.
User-Agent: BLEXBot
Disallow: /

User-Agent: Adsbot
Disallow: /

User-Agent: AdsBot
Disallow: /

Sitemap: https://seirdy.one/sitemap.xml
Fix robots.txt 2020-11-30 21:06:44 +00:00			`User-agent: *`
Update robots.txt 2021-01-23 20:47:50 +00:00			`Disallow: /noindex/`
Update robots.txt 2021-06-11 22:09:43 +00:00			`Disallow: /misc/`
Update robots.txt 2021-01-23 20:47:50 +00:00			`Disallow: /webmentions/`
robots: disallow some toxic bs 2022-04-23 04:45:15 +00:00
Kang VLC's robots.txt commentary 2022-06-13 04:52:28 +00:00			`# "This robot collects content from the Internet for the sole purpose of helping educational institutions prevent plagiarism. [...] we compare student papers against the content we find on the Internet to see if we can find similarities." (http://www.turnitin.com/robot/crawlerinfo.html)`
			`# --> fuck off.`
robots: disallow some toxic bs 2022-04-23 04:45:15 +00:00			`User-Agent: TurnitinBot`
			`Disallow: /`

Kang VLC's robots.txt commentary 2022-06-13 04:52:28 +00:00			`# "NameProtect engages in crawling activity in search of a wide range of`
			`# brand and other intellectual property violations that may be of interest`
			`# to our clients." (http://www.nameprotect.com/botinfo.html)`
			`# --> fuck off.`
robots: disallow some toxic bs 2022-04-23 04:45:15 +00:00			`User-Agent: NPBot`
			`Disallow: /`

Kang VLC's robots.txt commentary 2022-06-13 04:52:28 +00:00			`# "iThenticate is a new service we have developed to combat the piracy of intellectual property and ensure the originality of written work for publishers, non-profit agencies, corporations, and newspapers." (http://www.slysearch.com/)`
			`# --> fuck off.`
robots: disallow some toxic bs 2022-04-23 04:45:15 +00:00			`User-Agent: SlySearch`
			`Disallow: /`

Kang VLC's robots.txt commentary 2022-06-13 04:52:28 +00:00			`# "BLEXBot assists internet marketers to get information on the link structure of sites and their interlinking on the web, to avoid any technical and possible legal issues and improve overall online experience." (http://webmeup-crawler.com/)`
			`# --> fuck off.`
			`User-Agent: BLEXBot`
			`Disallow: /`

robots: disallow some toxic bs 2022-04-23 04:45:15 +00:00			`User-Agent: Adsbot`
			`Disallow: /`

			`User-Agent: AdsBot`
			`Disallow: /`

			`Sitemap: https://seirdy.one/sitemap.xml`