#
# robots.txt
#
# Layout: one directive per line. Each group is a run of "User-agent:" lines
# followed by the rule that applies to all of them; groups are separated by a
# blank line. A "#" starts a comment that runs to the end of the line, so
# directives must never share a line with a preceding comment.
#
# Every group in this file ends in "Disallow: /", i.e. the listed agents are
# denied the whole site.
#

# Specific bots settings
User-agent: AhrefsBot
User-agent: AhrefsSiteAudit
User-agent: adbeat_bot
User-agent: Alexibot
User-agent: AppEngine
User-agent: Aqua_Products
User-agent: asterias
User-agent: b2w/0.1
User-agent: BackDoorBot/1.0
User-agent: BecomeBot
User-agent: BlekkoBot
User-agent: Blexbot
User-agent: BlowFish/1.0
User-agent: Bookmark search tool
User-agent: BotALot
User-agent: BuiltBotTough
User-agent: Bullseye/1.0
User-agent: BunnySlippers
User-agent: CCBot
User-agent: CheeseBot
User-agent: CherryPicker
User-agent: CherryPickerElite/1.0
User-agent: CherryPickerSE/1.0
User-agent: chroot
User-agent: Copernic
User-agent: CopyRightCheck
User-agent: cosmos
User-agent: Crescent
User-agent: Crescent Internet ToolPak HTTP OLE Control v.1.0
User-agent: DittoSpyder
User-agent: dotbot
User-agent: dumbot
User-agent: EmailCollector
User-agent: EmailSiphon
User-agent: EmailWolf
User-agent: Enterprise_Search
User-agent: Enterprise_Search/1.0
User-agent: EroCrawler
User-agent: es
User-agent: exabot
User-agent: ExtractorPro
User-agent: FairAd Client
User-agent: Flaming AttackBot
User-agent: Foobot
User-agent: Gaisbot
User-agent: GetRight/4.2
User-agent: gigabot
User-agent: grub
User-agent: grub-client
User-agent: Go-http-client
User-agent: Harvest/1.5
User-agent: Hatena Antenna
User-agent: hloader
User-agent: http://www.SearchEngineWorld.com bot
User-agent: http://www.WebmasterWorld.com bot
User-agent: httplib
User-agent: humanlinks
User-agent: InfoNaviRobot
User-agent: Iron33/1.0.2
User-agent: JamesBOT
User-agent: JennyBot
User-agent: Jetbot
User-agent: Jetbot/1.0
User-agent: Jorgee
User-agent: Kenjin Spider
User-agent: Keyword Density/0.9
User-agent: LexiBot
User-agent: libWeb/clsHTTP
User-agent: LinkextractorPro
User-agent: LinkpadBot
User-agent: LinkScan/8.1a Unix
User-agent: LinkWalker
User-agent: LNSpiderguy
User-agent: looksmart
User-agent: lwp-trivial
User-agent: lwp-trivial/1.34
User-agent: Mata Hari
User-agent: Megalodon
User-agent: Microsoft URL Control
User-agent: Microsoft URL Control - 5.01.4511
User-agent: Microsoft URL Control - 6.00.8169
User-agent: MIIxpc
User-agent: MIIxpc/4.2
User-agent: Mister PiX
User-agent: moget
User-agent: moget/2.1
User-agent: naver
User-agent: NerdyBot
User-agent: NetAnts
User-agent: NetMechanic
User-agent: NICErsPRO
User-agent: Nutch
User-agent: Openbot
User-agent: Openfind
User-agent: Openfind data gathere
User-agent: Oracle Ultra Search
User-agent: PerMan
User-agent: ProPowerBot/2.14
User-agent: ProWebWalker
User-agent: psbot
User-agent: Python-urllib
User-agent: QueryN Metasearch
User-agent: Radiation Retriever 1.1
User-agent: RepoMonkey
User-agent: RepoMonkey Bait & Tackle/v1.01
User-agent: RMA
User-agent: rogerbot
User-agent: scooter
User-agent: searchpreview
User-agent: SEMrushBot
User-agent: SemrushBot
User-agent: SemrushBot-SA
User-agent: SEOkicks-Robot
User-agent: sootle
User-agent: SpankBot
User-agent: spanner
User-agent: spbot
User-agent: Stanford
User-agent: Stanford Comp Sci
User-agent: Stanford CompClub
User-agent: Stanford CompSciClub
User-agent: Stanford Spiderboys
User-agent: SurveyBot
User-agent: SurveyBot_IgnoreIP
User-agent: suzuran
User-agent: Szukacz/1.4
User-agent: Telesoft
User-agent: Teoma
User-agent: The Intraformant
User-agent: TheNomad
User-agent: toCrawl/UrlDispatcher
User-agent: True_Robot
User-agent: True_Robot/1.0
User-agent: turingos
User-agent: Typhoeus
User-agent: URL Control
User-agent: URL_Spider_Pro
User-agent: URLy Warning
User-agent: VCI
User-agent: VCI WebViewer VCI WebViewer Win32
User-agent: Web Image Collector
User-agent: WebAuto
User-agent: WebBandit
User-agent: WebBandit/3.50
User-agent: WebEnhancer
User-agent: WebmasterWorld Extractor
User-agent: WebmasterWorldForumBot
User-agent: WebSauger
User-agent: Website Quester
User-agent: Webster Pro
User-agent: WebVac
User-agent: WWW-Collector-E
User-agent: Zeus
User-agent: Zeus 32297 Webster Pro V2.9 Win32
User-agent: Zeus Link Scout
Disallow: /

# Crawlers that are kind enough to obey, but which we'd rather not have
# unless they're feeding search engines.
User-agent: UbiCrawler
User-agent: DOC
User-agent: Zao
User-agent: gsa-crawler
Disallow: /

# Some bots are known to be trouble, particularly those designed to copy
# entire sites.
User-agent: sitecheck.internetseer.com
User-agent: Zealbot
User-agent: MSIECrawler
User-agent: SiteSnagger
User-agent: WebStripper
User-agent: WebCopier
User-agent: Fetch
User-agent: Offline Explorer
User-agent: Teleport
User-agent: TeleportPro
User-agent: WebZip
User-agent: WebZip/4.0
User-agent: linko
User-agent: HTTrack
User-agent: Microsoft.URL.Control
User-agent: Xenu
User-agent: Xenu's
User-agent: Xenu's Link Sleuth 1.1c
User-agent: larbin
User-agent: libwww
User-agent: ZyBORG
User-agent: Download Ninja
Disallow: /

# wget in its recursive mode is a frequent problem.
# There is a wait option you can use to set the delay between hits, for
# instance.
User-agent: wget
User-agent: Wget/1.11.4
User-agent: Wget/1.13.4
User-agent: Wget/1.12
User-agent: Wget/1.5.3
User-agent: Wget/1.6
Disallow: /

# A capture bot, downloads gazillions of pages with no public benefit.
# NOTE(review): the description above is singular, but this group lists
# several agents, some of which (e.g. Slurp, Maxthon) look like they may be
# a search-engine crawler / a regular browser rather than capture bots --
# confirm that blocking each of them is intended.
User-agent: WebReaper
User-agent: CNCDialer
User-agent: Maxthon
User-agent: MJ12bot
User-agent: Slurp
User-agent: Screaming Frog SEO Spider
Disallow: /