#
# robots.txt for http://drmor.com
#
# Layout: one record per line. Each "User-agent" line opens a group and the
# "Disallow" lines that follow it belong to that group. Lines starting with
# "#" are comments.
#

# Sitemap location. This record is independent of any user-agent group, so it
# is kept outside the groups below.
Sitemap: http://drmor.com/sitemap.xml

# Default rules for every crawler that has no more specific group below.
User-agent: *
Disallow: /4/
# The space in this directory name is percent-encoded so that parsers do not
# truncate the rule at the whitespace.
Disallow: /AP%20articles/
Disallow: /css/
Disallow: /errorpages/
Disallow: /giu/
Disallow: /img/
Disallow: /images/
Disallow: /images_notused/
Disallow: /inframe/
Disallow: /Knowhow/
Disallow: /m1/old/
Disallow: /m1/sitemap/
Disallow: /old_index/
Disallow: /oldpages/
Disallow: /p/
Disallow: /per/
Disallow: /person/
Disallow: /pg/
Disallow: /scripts/
Disallow: /script/
Disallow: /secure/
Disallow: /st/
Disallow: /temp/
Disallow: /x/

# Advertising-related bots.
# The user-agent value is the bare product token: "*" is only meaningful as a
# stand-alone value, not as a suffix.
User-agent: Mediapartners-Google
Disallow: /

# Crawlers that are kind enough to obey, but which we'd rather not have
# unless they're feeding search engines.
User-agent: UbiCrawler
Disallow: /

User-agent: DOC
Disallow: /

User-agent: Zao
Disallow: /

#
# The 'grub' distributed client has been *very* poorly behaved.
#
User-agent: grub-client
Disallow: /

#
# Doesn't follow robots.txt anyway, but...
#
User-agent: k2spider
Disallow: /

#
# Hits many times per second, not acceptable.
# http://www.nameprotect.com/botinfo.html
#
User-agent: NPBot
Disallow: /

#
# A capture bot, downloads gazillions of pages with no public benefit.
# http://www.webreaper.net/
#
User-agent: WebReaper
Disallow: /