2021-11-13 02:02:11 +00:00
|
|
|
User-agent: webproxy-mozz
|
2023-11-01 14:32:02 +00:00
|
|
|
Disallow: /
|
2021-11-13 02:02:11 +00:00
|
|
|
|
|
|
|
User-agent: serpstatbot
|
|
|
|
Disallow: /
|
|
|
|
|
|
|
|
User-agent: ltx71
|
|
|
|
Disallow: /
|
|
|
|
|
|
|
|
User-agent: oBot
|
|
|
|
Disallow: /
|
|
|
|
|
|
|
|
User-agent: DuckDuckBot
|
|
|
|
Disallow:
|
|
|
|
|
|
|
|
User-agent: ia_archiver
|
|
|
|
Disallow: /
|
|
|
|
|
|
|
|
User-agent: ltx71 - (http://ltx71.com/)
|
|
|
|
Disallow: /
|
|
|
|
|
|
|
|
User-agent: BLEXBot
|
|
|
|
Disallow: /
|
|
|
|
|
|
|
|
User-agent: Twingly Recon
|
|
|
|
Disallow: /
|
|
|
|
|
|
|
|
User-agent: Googlebot
|
|
|
|
Disallow: /identity/
|
|
|
|
Disallow: /webring.html
|
|
|
|
Disallow: /blog/
|
|
|
|
|
|
|
|
User-agent: Googlebot-Image
|
|
|
|
Disallow: /
|
|
|
|
|
2024-01-30 13:55:30 +00:00
|
|
|
User-agent: Google-Extended
|
|
|
|
Disallow: /
|
|
|
|
|
2021-11-13 02:02:11 +00:00
|
|
|
User-agent: PageThing
|
|
|
|
Disallow: /
|
|
|
|
|
|
|
|
User-agent: adsbot
|
|
|
|
Disallow: /
|
|
|
|
|
|
|
|
User-agent: SurdotlyBot
|
|
|
|
Disallow: /
|
|
|
|
|
|
|
|
User-agent: DataForSeoBot
|
|
|
|
Disallow: /
|
|
|
|
|
2022-08-28 18:27:28 +00:00
|
|
|
User-agent: SpiderLing
|
|
|
|
Disallow: /
|
|
|
|
|
2024-02-19 02:40:16 +00:00
|
|
|
# Fuck your AI and fuck your scraping: the groups below deny all access to AI-training and data-scraping crawlers
|
|
|
|
|
|
|
|
User-agent: CCBot
|
|
|
|
Disallow: /
|
|
|
|
|
|
|
|
User-agent: ChatGPT-User
|
|
|
|
Disallow: /
|
|
|
|
|
2023-09-01 12:16:19 +00:00
|
|
|
User-agent: GPTBot
|
|
|
|
Disallow: /
|
|
|
|
|
2024-02-19 02:40:16 +00:00
|
|
|
User-agent: Google-Extended
|
|
|
|
Disallow: /
|
|
|
|
|
|
|
|
User-agent: anthropic-ai
|
|
|
|
Disallow: /
|
|
|
|
|
|
|
|
User-agent: Omgilibot
|
|
|
|
Disallow: /
|
|
|
|
|
|
|
|
User-agent: Omgili
|
|
|
|
Disallow: /
|
|
|
|
|
|
|
|
User-agent: FacebookBot
|
|
|
|
Disallow: /
|
|
|
|
|
|
|
|
User-agent: Bytespider
|
|
|
|
Disallow: /
|
|
|
|
|
2021-11-13 02:02:11 +00:00
|
|
|
User-agent: *
|
|
|
|
Disallow: /
|
2023-11-01 14:32:02 +00:00
|
|
|
|