File: groups.google.com

package info (click to toggle)
python-protego 0.5.0%2Bdfsg-1
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid
  • size: 30,052 kB
  • sloc: python: 1,579; perl: 190; cpp: 33; sh: 4; makefile: 3
file content (65 lines) | stat: -rw-r--r-- 1,529 bytes parent folder | download | duplicates (4)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
# robots.txt for Google Groups.  See this URL for documentation on robots.txt:
# https://developers.google.com/webmasters/control-crawl-index/docs/robots_txt
# Note in particular that "the most specific rule based on the length of the
# [path] entry will trump the less specific (shorter) rule."
# The only rule group in this file; "*" addresses every crawler.
# NOTE(review): parsers that treat a blank line as a record separator may
# not attach the rules below to this User-agent line -- confirm against the
# parser in use.
User-agent: *

# Search and directory-query URLs. The /a/*.*/ forms repeat each rule under
# an /a/<something.something>/ prefix (presumably per-domain hosted groups --
# confirm).
Disallow: /groups/search
Disallow: /groups/dir?*q=
Disallow: /a/*.*/groups/search
Disallow: /a/*.*/groups/dir?*q=

# Search URLs under /d/. These are longer than the "Allow: /d/" and
# "Allow: /a/*.*/d/" rules further down, so under the longest-match rule
# quoted in the file header they take precedence over those Allows.
Disallow: /d/search*
Disallow: /d/topicsearch*
Disallow: /a/*.*/d/search*
Disallow: /a/*.*/d/topicsearch*

# Explicitly disallow indexing of pages that do not have valuable
# crawlable views (see b/21331185).
# The leading "/*" lets each pattern match the _escaped_fragment_ parameter
# anywhere in the URL (presumably the AJAX-crawling query parameter --
# confirm).
Disallow: /*_escaped_fragment_=aboutgroup
Disallow: /*_escaped_fragment_=forumsearch
Disallow: /*_escaped_fragment_=myforums
Disallow: /*_escaped_fragment_=newtopic
Disallow: /*_escaped_fragment_=search
Disallow: /*_escaped_fragment_=searchin
Disallow: /*_escaped_fragment_=starred

# Allow-list of path prefixes exempted from the catch-all "Disallow: /" at
# the end of the file. A trailing "$" anchors the end of the URL, so "/$"
# matches the site root only. Entries without "$" are prefix matches.
Allow: /$
Allow: /a/
Allow: /a/*.*/about
Allow: /a/*.*/browse_
Allow: /a/*.*/group
Allow: /a/*.*/groups
Allow: /a/*.*/images
Allow: /a/*.*/index
Allow: /a/*.*/messages
Allow: /a/*.*/msg/
Allow: /a/*.*/threads
Allow: /a/*.*/topics
Allow: /a/*.*/tree
Allow: /about
Allow: /browse_
Allow: /finance
Allow: /group
Allow: /groups
Allow: /images
Allow: /index
Allow: /messages
Allow: /msg/
Allow: /support
Allow: /threads
Allow: /topics
Allow: /tree
Allow: /googlegroups/

# /d/ and /forum paths. "/forum$" matches exactly "/forum", while "/forum/"
# matches anything beneath it; a bare "/forum" prefix rule is deliberately
# not present, so e.g. "/forumfoo" is not allowed by these lines.
Allow: /a/*.*/d/
Allow: /a/*.*/forum$
Allow: /a/*.*/forum/
Allow: /d/
Allow: /forum$
Allow: /forum/

# The root URL with an "hl" query parameter is allowed (presumably the
# interface-language parameter -- confirm), but not once a further
# parameter follows it: the longer "/?hl=*&" pattern matches any such URL
# containing "&".
Allow: /?hl=
Disallow: /?hl=*&

# Catch-all: anything not matched by a longer rule above is disallowed.
Disallow: /