Skip to content

HTTPS clone URL

Subversion checkout URL

You can clone with
or
.
Download ZIP
Newer
Older
100644 139 lines (103 sloc) 4.768 kb
1155b9a @runpaint Rakefile: Generate a Sitemap, ping search engines.
authored
1 <?xml version="1.0" encoding="UTF-8"?>
2 <!--
3 sitemap_gen.py example configuration script
4
5 This file specifies a set of sample input parameters for the
6 sitemap_gen.py client.
7
8 You should copy this file into "config.xml" and modify it for
9 your server.
10
11
12 ********************************************************* -->
13
14
15 <!-- ** MODIFY **
16 The "site" node describes your basic web site.
17
18 Required attributes:
19 base_url - the top-level URL of the site being mapped
20 store_into - the webserver path to the desired output file.
21 This should end in '.xml' or '.xml.gz'
22 (the script will create this file)
23
24 Optional attributes:
25 verbose - an integer from 0 (quiet) to 3 (noisy) for
26 how much diagnostic output the script gives
27 suppress_search_engine_notify="1"
28 - disables notifying search engines about the new map
29 (same as the "testing" command-line argument.)
30 default_encoding
31 - names a character encoding to use for URLs and
32 file paths. (Example: "UTF-8")
33 sitemap_type
34 - declares the Sitemap type. Common values are
35 web, mobile and news. The "web" Sitemap type is the default.
36 (Example: sitemap_type="news")
37 -->
38 <site
39 base_url="http://vim.runpaint.org/"
a5f23a7 @runpaint Rakefile: Create offline versions, refactor.
authored
40 store_into="output/www/sitemap.xml"
1155b9a @runpaint Rakefile: Generate a Sitemap, ping search engines.
authored
41 verbose="1"
42 sitemap_type="web">
43
44
45
46 <!-- ********************************************************
47 INPUTS
48
49 All the various nodes in this section control where the script
50 looks to find URLs.
51
52 MODIFY or DELETE these entries as appropriate for your server.
53 ********************************************************* -->
54
55 <!-- ** MODIFY or DELETE **
56 "url" nodes specify individual URLs to include in the map.
57
58 Required attributes:
59 href - the URL
60
61 Optional attributes:
62 lastmod - timestamp of last modification (ISO 8601 format)
63 changefreq - how often content at this URL is usually updated
64 priority - value 0.0 to 1.0 of relative importance in your site
65 -->
66
67 <url href="http://vim.runpaint.org/vim-recipes.pdf" priority="0.9"/>
68 <url href="http://vim.runpaint.org/toc/" priority="0.9"/>
69
70
71 <!-- ** MODIFY or DELETE **
72 "directory" nodes tell the script to walk the file system
73 and include all files and directories in the Sitemap.
74
75 Required attributes:
76 path - path to begin walking from
77 url - URL equivalent of that path
78
79 Optional attributes:
80 default_file - name of the index or default file for directory URLs
81 remove_empty_directories - Values are true or false. Default is false.
82 true=remove empty directories
83 -->
84
85 <directory
a1f9c4b @runpaint Sitemap: Update for new www directory.
authored
86 path="output/www/"
1155b9a @runpaint Rakefile: Generate a Sitemap, ping search engines.
authored
87 url="http://vim.runpaint.org/"
3f2f585 @runpaint Don't include *.en/*.en.gz files in sitemap
authored
88 default_file="index.html.en"
1155b9a @runpaint Rakefile: Generate a Sitemap, ping search engines.
authored
89 remove_empty_directories="true"/>
90
91 <!-- ********************************************************
92 FILTERS
93
94 Filters specify wild-card patterns that the script compares
95 against all URLs it finds. Filters can be used to exclude
96 certain URLs from your Sitemap, for instance if you have
97 hidden content that you hope the search engines don't find.
98
99 Filters can be either type="wildcard", which means standard
100 path wildcards (* and ?) are used to compare against URLs,
101 or type="regexp", which means regular expressions are used
102 to compare.
103
104 Filters are applied in the order specified in this file.
105
106 An action="drop" filter causes exclusion of matching URLs.
107 An action="pass" filter causes inclusion of matching URLs,
108 short-circuiting any later filters that might also match.
109 If no filter at all matches a URL, the URL will be included.
110 Together you can build up fairly complex rules.
111
112 The default action is "drop".
113 The default type is "wildcard".
114
115 You can MODIFY or DELETE these entries as appropriate for
116 your site. However, unlike above, the example entries in
117 this section are not contrived and may be useful to you as
118 they are.
119 ********************************************************* -->
120
121 <!-- Exclude URLs that end with a '~' (e.g. Emacs backup files) -->
122 <filter action="drop" type="wildcard" pattern="*~" />
123
124 <!-- Exclude URLs within UNIX-style hidden files or directories -->
125 <filter action="drop" type="regexp" pattern="/\.[^/]*" />
126
127 <!-- Exclude stylesheets -->
128 <filter action="drop" type="wildcard" pattern="*/css/*" />
f8e8525 @runpaint Sitemap: Exclude output/all.html.
authored
129
130 <!-- Exclude output/all.html -->
131 <filter action="drop" type="wildcard" pattern="*/all.html" />
3f2f585 @runpaint Don't include *.en/*.en.gz files in sitemap
authored
132
133 <!-- Exclude *.gz files -->
134 <filter action="drop" type="wildcard" pattern="*.gz" />
135
136 <!-- Exclude *.en files -->
137 <filter action="drop" type="wildcard" pattern="*.en" />
1155b9a @runpaint Rakefile: Generate a Sitemap, ping search engines.
authored
138 </site>
Something went wrong with that request. Please try again.