-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathrobots.txt
49 lines (45 loc) · 1.2 KB
/
robots.txt
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
---
# Jekyll front matter. These YAML comments are not written to the generated file.
# "layout: null" renders the template body without wrapping it in a site layout;
# "permalink" publishes the rendered result as robots.txt.
layout: null
permalink: robots.txt
# Crawlers that are denied access to the whole site. The Liquid loop below emits one
# "User-agent: <name>" / "Disallow: /" group per entry. Each generated group ends with
# a blank line, because the original robots exclusion standard separates records with
# blank lines and older parsers may otherwise merge consecutive groups.
badagents:
- "Sogou web spider"
- "Sogou inst spider"
- "Sogou spider2"
- "Sogou blog"
- "Sogou News Spider"
- "Sogou Orion spider"
- "Sosospider"
---
{% for agent in page.badagents %}User-agent: {{ agent }}
Disallow: /

{% endfor %}
# These URIs will cause unnecessary traffic with ANY bot.
# Default group ("*") for crawlers that match no more specific group in this file;
# archive.org_bot and ia_archiver are additionally named explicitly.
# Groups are separated by blank lines so that parsers following the original
# robots exclusion standard (blank-line-delimited records) keep them apart.
User-agent: *
User-agent: archive.org_bot
User-agent: ia_archiver
Disallow: /releases/release0.1/doc
Disallow: /releases/release0.5.0~beta1/doc
Disallow: /releases/release0.5.0~beta2/doc
Disallow: /releases/release0.6.0~beta1/doc
Disallow: /releases/release0.6.0~beta2/doc
Disallow: /releases/release0.6.5~20140718/doc
Disallow: /releases/release0.6.5~20140721/doc
Disallow: /releases/release0.6.5~20141030/doc
# "*" is a path wildcard: this blocks index.html?de/lmu/... under the doc directory
# of any release, for crawlers that support wildcard matching.
Disallow: /releases/*/doc/index.html?de/lmu/

# The following spiders were found to misbehave and are no longer welcome:
User-agent: YoudaoBot
User-agent: HaoSouSpider
User-agent: 360Spider
User-agent: MegaIndex
Disallow: /
# Crawl-Delay is a non-standard directive that only some crawlers honor.
# NOTE(review): presumably kept as an extra throttle next to "Disallow: /" - confirm.
Crawl-Delay: 360000

# The following spiders are just unnecessary traffic
# All agents listed below share the single "Disallow: /" rule that ends the group.
User-agent: BLEXBot
User-agent: dotbot
User-agent: AhrefsBot
User-agent: SMTBot
User-agent: SemrushBot
User-agent: SemrushBot-SA
User-agent: WeSEE_Bot
User-agent: ltx71
Disallow: /