-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathrobots.txt
More file actions
120 lines (90 loc) · 1.85 KB
/
robots.txt
File metadata and controls
120 lines (90 loc) · 1.85 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
# Robots.txt for Orthonode Infrastructure Labs
# Domain: https://orthonode.xyz
# Last Updated: 2026-03-06
# Default group: used by any crawler that is not named in a more specific
# User-agent group later in this file. Crawlers that have their own named
# group do NOT inherit the rules in this group.
User-agent: *
# Block admin/development areas if they exist.
# These come before the Allow rules so that parsers using first-match
# ordering honour them too; longest-match (RFC 9309) parsers are unaffected
# by rule order.
# NOTE: robots.txt is public and advisory only. These paths still need
# server-side access control.
Disallow: /portal/
Disallow: /admin/
Disallow: /.git/
Disallow: /node_modules/
# Everything else may be crawled. The per-page entries below are already
# covered by "Allow: /" and are kept only as an explicit inventory.
Allow: /
Allow: /index.html
Allow: /sha.html
Allow: /oap.html
Allow: /nexus.html
Allow: /ton-sha.html
Allow: /invariant.html
Allow: /tix-dao.html
Allow: /iotex-research.html
Allow: /site-index.html
Allow: /terms.html
Allow: /privacy.html
# Allow all media assets
Allow: /logo.png
Allow: /banner.png
Allow: /orthonode-banner.png
Allow: /og-image.png
Allow: /twitter-card.png
Allow: /logo-512.png
Allow: /site-logo.png
# Legacy domain (coreframe.systems):
# A "Noarchive: https://coreframe.systems/" line used to sit here. It was
# removed because "Noarchive" is not a robots.txt directive and robots.txt
# rules only apply to paths on the host that serves the file, so crawlers
# ignored it. To control archiving or indexing of the legacy domain, send an
# "X-Robots-Tag: noarchive" header (or a robots meta tag) from that host, or
# redirect it to this domain.
# Crawl-delay for respectful bot behavior.
# Non-standard directive (not part of RFC 9309): some crawlers honour it,
# others ignore it.
Crawl-delay: 1
# Sitemap Location (applies to the whole file, independent of any group)
Sitemap: https://orthonode.xyz/sitemap.xml
# Special Instructions for AI/LLM Crawlers
# A crawler obeys only the most specific group that names it and ignores the
# "User-agent: *" group entirely. The private-path rules are therefore
# repeated here; with a bare "Allow: /" these bots would be permitted to
# crawl /portal/, /admin/, /.git/ and /node_modules/.
# Several User-agent lines followed by one rule set form a single shared group.
User-agent: GPTBot
User-agent: ChatGPT-User
User-agent: ClaudeBot
User-agent: anthropic-ai
User-agent: Google-Extended
User-agent: CCBot
User-agent: PerplexityBot
Disallow: /portal/
Disallow: /admin/
Disallow: /.git/
Disallow: /node_modules/
Allow: /
# Search Engine Specific Rules
# A named group replaces (does not extend) the "User-agent: *" group for the
# crawler it names, so the private-path rules are repeated in each group
# below. Otherwise these crawlers would be allowed into /portal/, /admin/,
# /.git/ and /node_modules/.
#
# Group 1: engines that were given an explicit crawl delay.
# Crawl-delay is non-standard (not in RFC 9309); Google documents that it
# does not support it, so it only has an effect for crawlers that honour it.
User-agent: Googlebot
User-agent: Bingbot
Disallow: /portal/
Disallow: /admin/
Disallow: /.git/
Disallow: /node_modules/
Allow: /
Crawl-delay: 1
# Group 2: engines with no crawl delay.
User-agent: Googlebot-Image
User-agent: Slurp
User-agent: DuckDuckBot
User-agent: Baiduspider
User-agent: YandexBot
Disallow: /portal/
Disallow: /admin/
Disallow: /.git/
Disallow: /node_modules/
Allow: /
# Social Media Crawlers
# These crawlers match this group instead of "User-agent: *", so the
# private-path rules are repeated here rather than relying on the default
# group. Several User-agent lines followed by one rule set form a single
# shared group.
User-agent: facebookexternalhit
User-agent: Twitterbot
User-agent: LinkedInBot
User-agent: Discordbot
User-agent: TelegramBot
Disallow: /portal/
Disallow: /admin/
Disallow: /.git/
Disallow: /node_modules/
Allow: /
# Blocked crawlers: the user agents listed here are denied the entire site.
# They share one group; each name below receives the same "Disallow: /" rule.
# robots.txt is advisory, so this only stops crawlers that choose to obey it.
User-agent: SemrushBot
User-agent: AhrefsBot
User-agent: MJ12bot
User-agent: dotbot
User-agent: BLEXBot
Disallow: /