# robots.txt
# Patrick Vande Walle 22/02/2005
# for http://blog.isoc.lu
# Updated 29/5/2007 included reference to sitemap.xml
#
# Format reminders for maintainers:
#   - One directive per line; everything after '#' on a line is a comment.
#   - Rules are grouped under the User-agent line(s) that precede them.
#   - A crawler obeys only the most specific group that names it; it does
#     NOT additionally inherit the rules of the "User-agent: *" group.
#   - Rule paths must begin with "/". "*" matches any run of characters and
#     "$" anchors the end of the URL (wildcard extensions, honoured by the
#     major search engines).

Sitemap: http://patrick.vande-walle.eu/sitemap.xml

# ---------------------------------------------------------------------------
# Default rules: all spiders that have no dedicated group below.
# ---------------------------------------------------------------------------
User-agent: *
# disallow all files in these directories
Disallow: /cgi-bin/
Disallow: /wp-admin/
Disallow: /wp-includes/
Disallow: /tag/
# Prefix matches: everything under /wp-content/ whose name starts with
# "b" or "p" respectively.
Disallow: /wp-content/b
Disallow: /wp-content/p
# Trackback URLs, at the site root and below any other path.
Disallow: /trackback/
Disallow: /*/trackback/
# Disallow: /*?*
Disallow: /wp-images/
# No trailing slash: the rule has to match the file itself.
Disallow: /wp-config.php
# Paths under /zen/ (previously listed in a second "User-agent: *" group;
# merged here so that parsers which only read the first group see them).
Disallow: /zen/albums
Disallow: /zen/cache
Disallow: /zen/themes
Disallow: /zen/zp-core
Disallow: /zen/rss.php
Disallow: /zen/rss-comments.php
Disallow: /zen/page/search

# ---------------------------------------------------------------------------
# Googlebot: uses ONLY this group.
# NOTE(review): /cgi-bin/, /tag/ and the /zen/ paths from the default group
# are therefore not blocked for Googlebot - confirm that this is intended.
# ---------------------------------------------------------------------------
User-agent: Googlebot
# disallow all files ending with these extensions
#Disallow: /*.php$
Disallow: /*.js$
Disallow: /*.inc$
Disallow: /*.css$
#Disallow: /*.gz$
Disallow: /*.cgi$
Disallow: /*.wmv$
Disallow: /*.xhtml$
#Disallow: /*.php*
# Any URL containing "/trackback", at the root or deeper.
Disallow: /trackback
Disallow: /*/trackback
# Disallow: /*?*
# Prefix match: every top-level path beginning with "wp-".
Disallow: /wp-

# Block the Spock crawler from the whole site.
User-agent: Spock
Disallow: /

# allow google image bot to search all images
User-agent: Googlebot-Image
Allow: /

# disallow archiving site
#User-agent: ia_archiver
#Disallow: /

# disable duggmirror
User-agent: duggmirror
Disallow: /

# NOTE(review): two sitemap URLs are declared in this file (sitemap.xml at
# the top and sitemap.xml.gz below) - confirm that both exist and are current.
# BEGIN XML-SITEMAP-PLUGIN
Sitemap: http://patrick.vande-walle.eu/sitemap.xml.gz
# END XML-SITEMAP-PLUGIN