# robots.txt for http://www.nanog.org
#
# Format: one directive per line, groups separated by a blank line.
# A '#' starts a comment that runs to the end of the line, so directives
# must never share a line with a comment that precedes them.

# Default rules: apply to any crawler not matched by a more specific group.
User-agent: *
Disallow: /errorpages/
Disallow: /icons/
Disallow: /images/
Disallow: /includes/
Disallow: /mtg-0002/
Disallow: /mtg-0006/
Disallow: /mtg-0010/
Disallow: /mtg-0102/
Disallow: /mtg-0105/
Disallow: /mtg-0110/
Disallow: /mtg-0202/
Disallow: /mtg-0206/
Disallow: /mtg-0210/
Disallow: /mtg-0302/
Disallow: /mtg-0306/
Disallow: /mtg-0310/
Disallow: /mtg-0402/
Disallow: /mtg-0405/
Disallow: /mtg-0410/
Disallow: /mtg-0501/
Disallow: /mtg-0505/
Disallow: /mtg-0510/
Disallow: /mtg-0602/
Disallow: /mtg-0606/
Disallow: /mtg-0610/
Disallow: /mtg-0702/
Disallow: /mtg-0706/
Disallow: /mtg-0710/
Disallow: /mtg-0802/
Disallow: /mtg-0806/
Disallow: /mtg-0810/
Disallow: /mtg-9410/
Disallow: /mtg-9502/
Disallow: /mtg-9505/
Disallow: /mtg-9509/
Disallow: /mtg-9602/
Disallow: /mtg-9605/
Disallow: /mtg-9610/
Disallow: /mtg-9702/
Disallow: /mtg-9706/
Disallow: /mtg-9710/
Disallow: /mtg-9802/
Disallow: /mtg-9806/
Disallow: /mtg-9811/
Disallow: /mtg-9901/
Disallow: /mtg-9905/
Disallow: /RealMedia/ARIN
Disallow: /sendthis/

# Crawlers that are kind enough to obey, but which we'd rather not have
# unless they're feeding search engines.
User-agent: UbiCrawler
Disallow: /

User-agent: DOC
Disallow: /

User-agent: Zao
Disallow: /

# Some bots are known to be trouble, particularly those designed to copy
# entire sites. Please obey robots.txt.
# Each group below names one crawler and denies it the entire site.
User-agent: sitecheck.internetseer.com
Disallow: /

User-agent: Zealbot
Disallow: /

User-agent: MSIECrawler
Disallow: /

User-agent: SiteSnagger
Disallow: /

User-agent: WebStripper
Disallow: /

User-agent: WebCopier
Disallow: /

User-agent: Fetch
Disallow: /

User-agent: Offline Explorer
Disallow: /

User-agent: Teleport
Disallow: /

User-agent: TeleportPro
Disallow: /

User-agent: WebZIP
Disallow: /

User-agent: linko
Disallow: /

User-agent: HTTrack
Disallow: /

User-agent: Microsoft.URL.Control
Disallow: /

User-agent: Xenu
Disallow: /

User-agent: larbin
Disallow: /

User-agent: libwww
Disallow: /

User-agent: ZyBORG
Disallow: /

User-agent: Download Ninja
Disallow: /

#
# The 'grub' distributed client has been *very* poorly behaved.
#
User-agent: grub-client
Disallow: /

#
# Doesn't follow robots.txt anyway, but...
#
User-agent: k2spider
Disallow: /

#
# Hits many times per second, not acceptable
# http://www.nameprotect.com/botinfo.html
User-agent: NPBot
Disallow: /

# A capture bot, downloads gazillions of pages with no public benefit
# http://www.webreaper.net/
User-agent: WebReaper
Disallow: /