-
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathrobots.txt
72 lines (64 loc) · 1.62 KB
/
robots.txt
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
---
# Front matter for the Liquid template below, which renders robots.txt.
# `bots.allow` and `bots.disallow` are read by the template as
# `page.bots.allow` / `page.bots.disallow`, so both lists MUST stay nested
# under `bots:`; at column 0 they become unrelated top-level keys and the
# template loops render nothing.
vim: filetype=liquid.robots expandtab
# No layout: the rendered output must be plain robots.txt text.
layout: null
# Read by jekyll-sitemap (see attributions): keeps this page out of sitemap.xml.
sitemap: false
attributions:
  - https://github.com/ai-robots-txt/ai.robots.txt/blob/main/robots.txt
  - https://github.com/dmitrizzle/disallow-ai/blob/main/src/robots.txt
  - https://github.com/jekyll/jekyll-sitemap
  - https://michaelcurrin.github.io/code-cookbook/recipes/web/seo/robots/jekyll.html
  - https://neil-clarke.com/block-the-bots-that-feed-ai-models-by-scraping-your-website/
  - https://rknight.me/blog/perplexity-ai-is-lying-about-its-user-agent/
  - https://search.google.com/search-console/about
  - https://www.cyberciti.biz/robots.txt
  - https://www.cyberciti.biz/web-developer/block-openai-bard-bing-ai-crawler-bots-using-robots-txt-file/
  - https://www.robotstxt.org/robotstxt.html
bots:
  # Each entry is rendered as its own group with `Allow: /`.
  allow:
    - Mediapartners-Google
  # Each entry is rendered as its own group with `Disallow: /`.
  # One user-agent token per entry; keep the list free of exact duplicates.
  disallow:
    - AdsBot-Google
    - AhrefsBot
    - Amazonbot
    - Applebot-Extended
    - Bytespider
    - CCBot
    - ChatGPT-User
    - Claude-Web
    - ClaudeBot
    - Diffbot
    - FacebookBot
    - FriendlyCrawler
    - GPTBot
    - Google-Extended
    - GoogleOther
    - ImagesiftBot
    - Omgili
    - Omgilibot
    - PerplexityBot
    - Pinterestbot
    - Semrush
    - SemrushBot
    - YouBot
    - anthropic-ai
    - cohere-ai
    - dotbot
    - img2dataset
    # Lower-case variants are kept on purpose in case a crawler compares
    # its token case-sensitively (spec-compliant parsers ignore case).
    - omgili
    - omgilibot
    - peer39_crawler
    - peer39_crawler/1.0
---
{%- comment -%}
  Renders robots.txt from this page's front matter:
    1. one "User-agent / Allow: /" group per entry in page.bots.allow;
    2. one "User-agent / Disallow: /" group per entry in page.bots.disallow;
    3. a catch-all "User-agent: *" group that disallows only the two
       bait.zip paths (NOTE(review): presumably a trap for crawlers that
       ignore robots.txt; confirm intent);
    4. a Sitemap line built from "sitemap.xml" with the absolute_url filter.
  The tags below deliberately use no whitespace control: the newline left by
  each tag line is what separates the rendered groups. This comment uses
  trimmed tags so that it contributes nothing to the rendered output.
{%- endcomment -%}
{% for bot in page.bots.allow %}
User-agent: {{ bot }}
Allow: /
{% endfor %}
{% for bot in page.bots.disallow %}
User-agent: {{ bot }}
Disallow: /
{% endfor %}
User-agent: *
Disallow: /assets/ai/bait.zip
Disallow: /ai-bait/assets/ai/bait.zip
Sitemap: {{ "sitemap.xml" | absolute_url }}