[root]# tar ztvf sitemap_gen-1.3.tar.gz
drwxr-xr-x opensource/opensource 0 2005-09-08 06:44:40 sitemap_gen-1.3/
-r--r----- opensource/opensource 22 2005-06-17 04:41:30 sitemap_gen-1.3/AUTHORS
-r--r----- opensource/opensource 1754 2005-06-17 04:41:30 sitemap_gen-1.3/COPYING
-r--r--r-- opensource/opensource 2003 2005-09-08 06:35:41 sitemap_gen-1.3/ChangeLog
-r--r--r-- opensource/opensource 1094 2005-09-08 06:35:41 sitemap_gen-1.3/README
-r--r--r-- opensource/opensource 5498 2005-09-08 06:35:41 sitemap_gen-1.3/example_config.xml
-r--r----- opensource/opensource 975 2005-06-17 04:41:30 sitemap_gen-1.3/example_urllist.txt
-r-xr-xr-x opensource/opensource 70647 2005-09-08 06:35:41 sitemap_gen-1.3/sitemap_gen.py
-r-xr-xr-x opensource/opensource 27786 2005-09-08 06:35:41 sitemap_gen-1.3/test_sitemap_gen.py
-r-xr-xr-x opensource/opensource 305 2005-09-08 06:35:41 sitemap_gen-1.3/setup.py
-rw-r--r-- opensource/opensource 248 2005-09-08 06:44:40 sitemap_gen-1.3/PKG-INFO |
<?xml version="1.0" encoding="UTF-8"?>
<site
  base_url="http://legacy-b4.dyndns.org/"
  store_into="/home/localhost/legacy-b4/sitemap.xml"
  verbose="1"
  default_encoding="EUC-JP"
  >
  <directory
    path="/home/localhost/legacy-b4/"
    url="http://legacy-b4.dyndns.org/"
    default_file="index.html"
  />
  <filter action="drop" type="wildcard" pattern="*/wp/*" />
</site> |
crawl-66-249-65-199.googlebot.com - - [26/Nov/2005:13:40:56 +0900] "HEAD /sitemap.xml HTTP/1.1" 200 - 283 "-" "Mozilla/5.0 (compatible; Googlebot/2.1; +http://www.google.com/bot.html)"
crawl-66-249-65-199.googlebot.com - - [26/Nov/2005:14:01:56 +0900] "GET /sitemap.xml HTTP/1.1" 200 285995 286278 "-" "Mozilla/5.0 (compatible; Googlebot/2.1; +http://www.google.com/bot.html)" |
[root]# python sitemap_gen.py --config=config2.xml
Reading configuration file: config2.xml
Walking DIRECTORY "/home/localhost/legacy-b4/"
Sorting and normalizing collected URLs.
Writing Sitemap file "sitemap.xml" with 702 URLs
Notifying search engines.
[ERROR] When attempting to access our generated Sitemap at the following URL:
http://legacy-b4.dyndns.org/sitemap.xml
we failed to read it. Please verify the store_into path you specified in your configuration file is web-accessable. Consult the FAQ for more information.
[WARNING] Proceeding to notify with an unverifyable URL.
Notifying: www.google.com
Count of file extensions on URLs:
134 .gif
1 .gz
82 .html
1 .ico
352 .jpg
1 .lzh
59 .png
15 .txt
57 /
Number of errors: 1
Number of warnings: 1 |
192.168.24.5 legacy-b4.dyndns.org |