# robots.txt file for http://www.risva.org/
#
# Format notes:
#   * One directive per line; "#" starts a comment that runs to end of line.
#   * A crawler obeys only the most specific User-agent group that matches
#     it. Googlebot therefore reads ONLY the Googlebot group below and never
#     falls through to the "*" group, so the shared rules are repeated there.
#   * Paths are prefix matches: "/seo" also covers "/seo1", "/seo2", and
#     anything else whose path starts with "/seo".

# ---------------------------------------------------------------------------
# Rules for Google
# ---------------------------------------------------------------------------
User-agent: Googlebot
# Google-only: skip these file types ("*" and "$" are pattern extensions;
# "$" anchors the match to the end of the URL).
Disallow: /*.gif$
Disallow: /*.jpg$
Disallow: /*.doc$
Disallow: /*.db$
Disallow: /*.asp$
Disallow: /*.ico$
# Shared rules, duplicated from the "*" group because Googlebot ignores that
# group once it has its own. Keep the two lists in sync.
# (Crawl-delay is intentionally not repeated: Google does not support it.)
Disallow: /sitemap.htm
Disallow: /featureref.htm
Disallow: /featurevol.htm
Disallow: /household-items.htm
Disallow: /issues.htm
Disallow: /thank.htm
Disallow: /_db_backups
Disallow: /_private
Disallow: /seo
Disallow: /seo1
Disallow: /seo2
Disallow: /_vti_log
Disallow: /aspnet_client
Disallow: /Copy%20of%20news_files
Disallow: /images
Disallow: /interpret_files
Disallow: /media
Disallow: /news_files
Disallow: /PSDs
Disallow: /stats
Disallow: /robots.txt
Allow: /newsletters/fall2009.htm
Allow: /newsletters/mar2008.htm
Allow: /newsletters/jun2008.htm
Allow: /newsletters/jul2008.htm
Allow: /volunteer-opportunities.htm

# ---------------------------------------------------------------------------
# Rules for all other robots
# ---------------------------------------------------------------------------
User-agent: *
# Ask crawlers to wait 30 seconds between requests (non-standard directive;
# honored by some crawlers, ignored by others).
Crawl-delay: 30

# Do not index these pages
Disallow: /sitemap.htm
Disallow: /featureref.htm
Disallow: /featurevol.htm
Disallow: /household-items.htm
Disallow: /issues.htm
Disallow: /thank.htm

# Disallow all files in these directories and any sub-directories
Disallow: /_db_backups
Disallow: /_private
Disallow: /seo
Disallow: /seo1
Disallow: /seo2
Disallow: /_vti_log
Disallow: /aspnet_client
# Spaces must be percent-encoded; a raw space never matches the request path
# and some parsers truncate the rule at the first space.
Disallow: /Copy%20of%20news_files
Disallow: /images
Disallow: /interpret_files
Disallow: /media
Disallow: /news_files
Disallow: /PSDs
Disallow: /stats

# Pay attention to robots.txt, just don't index it
Disallow: /robots.txt

# Pages explicitly allowed
Allow: /newsletters/fall2009.htm
Allow: /newsletters/mar2008.htm
Allow: /newsletters/jun2008.htm
Allow: /newsletters/jul2008.htm
Allow: /volunteer-opportunities.htm

# Sitemap location (applies to all crawlers, independent of any group)
Sitemap: http://www.risva.org/sitemap.xml