# robots.txt for http://www.thecapitalideas.com
#
# Format notes:
#   - One directive per line; a "#" starts a comment that runs to end of line.
#   - Groups are separated by blank lines; each group starts with User-agent.
#   - An empty "Disallow:" value means nothing is disallowed for that agent.

# Allow S&P
User-agent: Atomz/1.0
Disallow:

# To enable Twitter and LinkedIn access
User-agent: Twitterbot
Disallow:

User-agent: LinkedInBot
Disallow:

# Exclude ia_archiver, VisWeb robots, and Ultraseek from the whole site
User-agent: ia_archiver
Disallow: /

User-agent: VisWeb
Disallow: /

User-agent: Ultraseek
Disallow: /

# Exclude directories for every other crawler
User-agent: *
Disallow: /errors
Disallow: /pardons
Disallow: /us/search
Disallow: /design
Disallow: /content
# Exceptions under /content: image folders plus JS/JSON resources stay
# crawlable (the longer, more specific Allow patterns take precedence over
# the shorter "Disallow: /content" in longest-match parsers).
Allow: /content/dam/*/Images/*
Allow: /content/dam/*/images/*
Allow: /content/*.js
Allow: /content/*.json
Disallow: /global-errors/*
Disallow: /*/_jcr_content/*
# Index exclusion for all PDF files.
# Path patterns must begin with "/", so this is written "/*.pdf" rather
# than "*.pdf".
Disallow: /*.pdf