[root]# tar ztvf sitemap_gen-1.3.tar.gz
drwxr-xr-x opensource/opensource 0 2005-09-08 06:44:40 sitemap_gen-1.3/
-r--r----- opensource/opensource 22 2005-06-17 04:41:30 sitemap_gen-1.3/AUTHORS
-r--r----- opensource/opensource 1754 2005-06-17 04:41:30 sitemap_gen-1.3/COPYING
-r--r--r-- opensource/opensource 2003 2005-09-08 06:35:41 sitemap_gen-1.3/ChangeLog
-r--r--r-- opensource/opensource 1094 2005-09-08 06:35:41 sitemap_gen-1.3/README
-r--r--r-- opensource/opensource 5498 2005-09-08 06:35:41 sitemap_gen-1.3/example_config.xml
-r--r----- opensource/opensource 975 2005-06-17 04:41:30 sitemap_gen-1.3/example_urllist.txt
-r-xr-xr-x opensource/opensource 70647 2005-09-08 06:35:41 sitemap_gen-1.3/sitemap_gen.py
-r-xr-xr-x opensource/opensource 27786 2005-09-08 06:35:41 sitemap_gen-1.3/test_sitemap_gen.py
-r-xr-xr-x opensource/opensource 305 2005-09-08 06:35:41 sitemap_gen-1.3/setup.py
-rw-r--r-- opensource/opensource 248 2005-09-08 06:44:40 sitemap_gen-1.3/PKG-INFO
|
<?xml version="1.0" encoding="UTF-8"?>
<site
base_url="http://legacy-b4.dyndns.org/"
store_into="/home/localhost/legacy-b4/sitemap.xml"
verbose="1"
default_encoding="EUC-JP"
>
<directory
path="/home/localhost/legacy-b4/"
url="http://legacy-b4.dyndns.org/"
default_file="index.html"
/>
<filter action="drop" type="wildcard" pattern="*/wp/*" />
</site>
|
crawl-66-249-65-199.googlebot.com - - [26/Nov/2005:13:40:56 +0900] "HEAD /sitemap.xml HTTP/1.1" 200 - 283 "-" "Mozilla/5.0 (compatible; Googlebot/2.1; +http://www.google.com/bot.html)"
crawl-66-249-65-199.googlebot.com - - [26/Nov/2005:14:01:56 +0900] "GET /sitemap.xml HTTP/1.1" 200 285995 286278 "-" "Mozilla/5.0 (compatible; Googlebot/2.1; +http://www.google.com/bot.html)"
|

[root]# python sitemap_gen.py --config=config2.xml
Reading configuration file: config2.xml
Walking DIRECTORY "/home/localhost/legacy-b4/"
Sorting and normalizing collected URLs.
Writing Sitemap file "sitemap.xml" with 702 URLs
Notifying search engines.
[ERROR] When attempting to access our generated Sitemap at the following URL:
http://legacy-b4.dyndns.org/sitemap.xml
we failed to read it. Please verify the store_into path you specified in
your configuration file is web-accessable. Consult the FAQ for more
information.
[WARNING] Proceeding to notify with an unverifyable URL.
Notifying: www.google.com
Count of file extensions on URLs:
134 .gif
1 .gz
82 .html
1 .ico
352 .jpg
1 .lzh
59 .png
15 .txt
57 /
Number of errors: 1
Number of warnings: 1
|
192.168.24.5 legacy-b4.dyndns.org |