# robots.txt for http://www.opsisltd.info/
# See notes at end.
#
# Format reminder: robots.txt is line-oriented. Each directive must sit on
# its own line, and a "#" comments out everything up to the end of that line.
# Groups are separated by blank lines; no blank lines appear inside a group
# so that older parsers do not end the group early.

# Google, Microsoft, Yahoo and Ask support sitemap auto-discovery
Sitemap: http://www.opsisltd.info/sitemap.xml
Sitemap: http://www.opsisltd.info/wordpress/sitemap.xml
Sitemap: http://www.opsisltd.info/wordpress/sitemap.xml.gz

# Google
User-agent: Googlebot
Disallow: /aspnet_client/
Disallow: /ccp/
Disallow: /css/
Disallow: /custom/
#Disallow: /design/
Disallow: /gallery/
Disallow: /HDWForm2Mail/
Disallow: /HDWFormCaptcha/
Disallow: /home_intro/
Disallow: /picture_library/
Disallow: /wordpress/wp-*
Disallow: /wordpress/author/
Disallow: /wordpress/tags/
Disallow: /wordpress/feed/
Disallow: /wordpress/comments/feed
Disallow: /wordpress/category/*/*
Disallow: /wordpress/*/trackback/
Disallow: /wordpress/*/email/
Disallow: /wordpress/*/print/
Disallow: /wordpress/2007/
Disallow: /wordpress/2008/
Disallow: /wordpress/2009/
Disallow: /wordpress/2010/
Disallow: /wordpress/2011/
Disallow: /wordpress/2012/
# Disallow URLs that include ? except those that end with ?
Allow: /wordpress/*?$
Disallow: /wordpress/*?
# Block all files ending with these extensions
Disallow: /*.css$
Disallow: /*.js$

# MSN - Allow not supported
User-agent: msnbot
Disallow: /aspnet_client/
Disallow: /ccp/
Disallow: /css/
Disallow: /custom/
#Disallow: /design/
Disallow: /gallery/
Disallow: /HDWForm2Mail/
Disallow: /HDWFormCaptcha/
Disallow: /home_intro/
Disallow: /picture_library/
Disallow: /wordpress/wp-*
Disallow: /wordpress/author/
Disallow: /wordpress/tags/
Disallow: /wordpress/feed/
Disallow: /wordpress/comments/feed
Disallow: /wordpress/category/*/*
Disallow: /wordpress/*/trackback/
Disallow: /wordpress/*/email/
Disallow: /wordpress/*/print/
Disallow: /wordpress/2007/
Disallow: /wordpress/2008/
Disallow: /wordpress/2009/
Disallow: /wordpress/2010/
Disallow: /wordpress/2011/
Disallow: /wordpress/2012/
# Disallow every URL that includes ? (no "ends with ?" exception here,
# because this group cannot use Allow)
Disallow: /wordpress/*?
# Block all files ending with these extensions
Disallow: /*.css$
Disallow: /*.js$
Crawl-delay: 10

# Yahoo!
User-agent: Slurp
Disallow: /aspnet_client/
Disallow: /ccp/
Disallow: /css/
Disallow: /custom/
#Disallow: /design/
Disallow: /gallery/
Disallow: /HDWForm2Mail/
Disallow: /HDWFormCaptcha/
Disallow: /home_intro/
Disallow: /picture_library/
Disallow: /wordpress/wp-*
Disallow: /wordpress/author/
Disallow: /wordpress/tags/
Disallow: /wordpress/feed/
Disallow: /wordpress/comments/feed
Disallow: /wordpress/category/*/*
Disallow: /wordpress/*/trackback/
Disallow: /wordpress/*/email/
Disallow: /wordpress/*/print/
Disallow: /wordpress/2007/
Disallow: /wordpress/2008/
Disallow: /wordpress/2009/
Disallow: /wordpress/2010/
Disallow: /wordpress/2011/
Disallow: /wordpress/2012/
# Disallow URLs that include ? except those that end with ?
Allow: /wordpress/*?$
Disallow: /wordpress/*?
# Block all files ending with these extensions
Disallow: /*.css$
Disallow: /*.js$
Crawl-delay: 10

# Ask - no wildcards
User-agent: Teoma
Disallow: /aspnet_client/
Disallow: /ccp/
Disallow: /css/
Disallow: /custom/
#Disallow: /design/
Disallow: /gallery/
Disallow: /HDWForm2Mail/
Disallow: /HDWFormCaptcha/
Disallow: /home_intro/
Disallow: /picture_library/
Disallow: /wordpress/wp-admin
Disallow: /wordpress/wp-content/plugins
Disallow: /wordpress/wp-content/cache
Disallow: /wordpress/wp-content/themes
Disallow: /wordpress/wp-includes
Disallow: /wordpress/author/
Disallow: /wordpress/tags/
Disallow: /wordpress/feed/
Disallow: /wordpress/comments/feed
Disallow: /wordpress/category/
Disallow: /wordpress/2007/
Disallow: /wordpress/2008/
Disallow: /wordpress/2009/
Disallow: /wordpress/2010/
Disallow: /wordpress/2011/
Disallow: /wordpress/2012/
Crawl-delay: 10

# Catch-all for other agents
# Carries both the wildcard rules and their plain-prefix equivalents, so
# agents without wildcard support still honour the wp-* exclusions.
User-agent: *
Disallow: /aspnet_client/
Disallow: /ccp/
Disallow: /css/
Disallow: /custom/
#Disallow: /design/
Disallow: /gallery/
Disallow: /HDWForm2Mail/
Disallow: /HDWFormCaptcha/
Disallow: /home_intro/
Disallow: /picture_library/
Disallow: /wordpress/wp-*
Disallow: /wordpress/wp-admin
Disallow: /wordpress/wp-content/plugins
Disallow: /wordpress/wp-content/cache
Disallow: /wordpress/wp-content/themes
Disallow: /wordpress/wp-includes
Disallow: /wordpress/author/
Disallow: /wordpress/tags/
Disallow: /wordpress/feed/
Disallow: /wordpress/comments/feed
Disallow: /wordpress/category/*/*
Disallow: /wordpress/*/trackback/
Disallow: /wordpress/*/email/
Disallow: /wordpress/*/print/
Disallow: /wordpress/2007/
Disallow: /wordpress/2008/
Disallow: /wordpress/2009/
Disallow: /wordpress/2010/
Disallow: /wordpress/2011/
Disallow: /wordpress/2012/
# Disallow URLs that include ? except those that end with ?
Allow: /wordpress/*?$
Disallow: /wordpress/*?
# Block all files ending with these extensions
Disallow: /*.css$
Disallow: /*.js$

# Google AdSense
# The product token is written without a trailing "*"; "*" is only valid as
# the standalone catch-all user-agent value.
User-agent: Mediapartners-Google
Disallow:
Allow: /*

# Google Image
User-agent: Googlebot-Image
Disallow:
Allow: /*

# Internet Archiver Wayback Machine
User-agent: ia_archiver
Disallow: /

# digg mirror
User-agent: duggmirror
Disallow: /

User-agent: Adsbot-Google
Allow: /

User-agent: Googlebot-Mobile
Allow: /

User-agent: aipbot
Disallow: /

User-agent: BecomeBot
Disallow: /

User-agent: psbot
Disallow: /

# Only Googlebot, Yahoo! (Slurp) and Ask (Teoma) support Allow
# Only Googlebot, MSNbot and Yahoo! (Slurp) support wildcards
# Only Ask (Teoma), MSNbot and Yahoo! (Slurp) support crawl delays
#
# The opsisltd.info Windows server with IIS6 does NOT support mod-rewrite (does now 16/10/08 using IIS Mod-Rewrite program),
# only PATHINFO "Almost pretty" Wordpress Permalinks with "/index.php/" in them.
# http://codex.wordpress.org/Permalinks#Permalinks_without_mod_rewrite
# So Disallow: /wordpress/*? (ie. *?* prevent indexing of any links containing a question mark)
# Normally robots.txt disallows *?* to prevent content duplication from the permalink
# rewrites of blog posts.
#
# Disallow: The value of this field specifies a partial URL that is not to be visited.
# This can be a full path, or a partial path; any URL that starts with this value will not be retrieved.
# For example, Disallow: /help disallows both /help.html and /help/index.html,
# whereas Disallow: /help/ would disallow /help/index.html but allow /help.html
#
# Some major crawlers support an Allow directive which can counteract a following Disallow directive.
# This is useful when you disallow an entire directory but still want some HTML documents in that
# directory crawled and indexed. It should be noted that while by standard the first matching robots.txt
# pattern always wins, Google's implementation differs in that it first evaluates all Allow patterns
# and only then all Disallow patterns. Yet, in order to be compatible with all robots, if you want to allow
# single files inside an otherwise disallowed directory, you need to place the Allow directive(s) first,
# followed by the Disallow.
# Update: under RFC 9309 (and Google's current documentation) the most specific rule, i.e. the one with
# the longest matching path, wins regardless of order, and Allow wins a tie. Keeping Allow before
# Disallow remains harmless and still helps first-match parsers.
# http://en.wikipedia.org/wiki/Robots.txt
# http://www.google.com/support/webmasters/bin/answer.py?answer=40367
# http://searchengineland.com/070305-204850.php
#
# NOTE(review): the /css/, /*.css$ and /*.js$ rules stop Googlebot from fetching stylesheets and scripts.
# Google's guidance is to leave such resources crawlable so pages can be rendered - confirm whether
# these rules are still wanted.
#
# URLs are case-sensitive.
#User-agent: *
#Disallow: /