# $Id: robots.txt,v 1.9.2.1 2008/12/10 20:12:19 goba Exp $
#
# robots.txt
#
# This file is to prevent the crawling and indexing of certain parts
# of your site by web crawlers and spiders run by sites like Yahoo!
# and Google. By telling these "robots" where not to go on your site,
# you save bandwidth and server resources.
#
# This file will be ignored unless it is at the root of your host:
# Used:    http://example.com/robots.txt
# Ignored: http://example.com/site/robots.txt
#
# For more information about the robots.txt standard, see:
# http://www.robotstxt.org/wc/robots.html
#
# For syntax checking, see:
# http://www.sxw.org.uk/computing/robots/check.html
#
# Formatting notes for maintainers:
# - One directive per line. A "#" comments out the rest of its line, so
#   directives must never share a line with a preceding comment.
# - Do not put blank lines inside a group: some parsers treat a blank
#   line as the end of the group. Blank lines only separate groups.

# Group 1: rules for every crawler not matched by a more specific group.
User-agent: *
Crawl-delay: 1
#Disallow: /
# Allow
# These exceptions to "Disallow: /sites/" are listed first on purpose:
# parsers that apply the first matching rule would otherwise never reach
# them. Parsers that apply the longest matching rule are unaffected by
# the order.
Allow: /sites/default/files/photos/
Allow: /sites/default/files/imagecache/media_node_photo/photos/
Allow: /sites/default/files/external_files/
Allow: /sites/default/files/image_contrib/
Allow: /sites/default/files/imagecache/
Allow: /sites/default/files/imagefield_thumbs/
Allow: /sites/default/files/partner_logo/
Allow: /sites/default/files/pictures/
Allow: /sites/default/files/portraits/
Allow: /sites/default/files/push/
# Directories
Disallow: /includes/
Disallow: /misc/
Disallow: /modules/
Disallow: /profiles/
Disallow: /scripts/
Disallow: /sites/
Disallow: /themes/
# Files
Disallow: /CHANGELOG.txt
Disallow: /cron.php
Disallow: /INSTALL.mysql.txt
Disallow: /INSTALL.pgsql.txt
Disallow: /install.php
Disallow: /INSTALL.txt
Disallow: /LICENSE.txt
Disallow: /MAINTAINERS.txt
Disallow: /update.php
Disallow: /UPGRADE.txt
Disallow: /xmlrpc.php
# Paths (clean URLs)
Disallow: /admin/
Disallow: /comment/reply/
Disallow: /contact/
Disallow: /logout/
Disallow: /node/add/
Disallow: /search/
Disallow: /user/register/
Disallow: /user/password/
Disallow: /user/login/
Disallow: /node/
# Paths (no clean URLs)
Disallow: /?q=admin/
Disallow: /?q=comment/reply/
Disallow: /?q=contact/
Disallow: /?q=logout/
Disallow: /?q=node/add/
Disallow: /?q=search/
Disallow: /?q=user/password/
Disallow: /?q=user/register/
Disallow: /?q=user/login/

# Group 2: crawlers that are denied the entire site. Every User-agent
# line below belongs to the same group and shares the single
# "Disallow: /" rule at the end of the list.
User-agent: Alexibot
User-agent: ApocalXExplorerBot
User-agent: asterias
User-agent: BackDoorBot/1.0
User-agent: Black Hole
User-agent: BlowFish/1.0
User-agent: BotALot
User-agent: BuiltBotTough
User-agent: Bullseye/1.0
User-agent: BunnySlippers
User-agent: Cegbfeieh
User-agent: CheeseBot
User-agent: CherryPicker
User-agent: CherryPickerElite/1.0
User-agent: CherryPickerSE/1.0
User-agent: ConveraCrawler
User-agent: CopyRightCheck
User-agent: cosmos
User-agent: Crescent
User-agent: Crescent Internet ToolPak HTTP OLE Control v.1.0
User-agent: DISCo Pump 3.1
User-agent: DittoSpyder
User-agent: DOC
User-agent: Download Ninja
User-agent: EmailCollector
User-agent: EmailSiphon
User-agent: EmailWolf
User-agent: EroCrawler
User-agent: ExtractorPro
User-agent: Fetch
User-agent: Foobot
User-agent: Harvest/1.5
User-agent: hloader
User-agent: httplib
User-agent: HTTrack
User-agent: HTTrack 3.0
User-agent: humanlinks
User-agent: Igentia
User-agent: InfoNaviRobot
User-agent: JennyBot
User-agent: Jetbot
User-agent: Kenjin Spider
User-agent: larbin
User-agent: LexiBot
User-agent: libWeb/clsHTTP
User-agent: libwww
User-agent: LinkextractorPro
User-agent: linko
User-agent: LinkScan/8.1a Unix
User-agent: LinkWalker
User-agent: lwp-trivial
User-agent: lwp-trivial/1.34
User-agent: Mata Hari
User-agent: Microsoft URL Control - 5.01.4511
User-agent: Microsoft URL Control - 6.00.8169
User-agent: Microsoft.URL.Control
User-agent: MIIxpc
User-agent: MIIxpc/4.2
User-agent: Mister PiX
User-agent: MJ12bot
User-agent: moget
User-agent: moget/2.1
User-agent: MSIECrawler
User-agent: NetAnts
User-agent: NetAttache
User-agent: NetAttache Light 1.1
User-agent: NetMechanic
User-agent: NICErsPRO
User-agent: NPBot
User-agent: Offline Explorer
User-agent: Openfind
User-agent: Openfind data gathere
User-agent: ProPowerBot/2.14
User-agent: ProWebWalker
User-agent: psbot
User-agent: QuepasaCreep
User-agent: QueryN Metasearch
User-agent: RepoMonkey
User-agent: RepoMonkey Bait & Tackle/v1.01
User-agent: RMA
User-agent: sitecheck.internetseer.com
User-agent: SiteSnagger
User-agent: SpankBot
User-agent: spanner
User-agent: SuperBot
User-agent: SuperBot/2.6
User-agent: suzuran
User-agent: Szukacz/1.4
User-agent: Teleport
User-agent: TeleportPro
User-agent: Telesoft
User-agent: The Intraformant
User-agent: TheNomad
User-agent: TightTwatBot
User-agent: Titan
User-agent: toCrawl/UrlDispatcher
User-agent: True_Robot
User-agent: True_Robot/1.0
User-agent: turingos
User-agent: TurnitinBot
User-agent: UbiCrawler
User-agent: URLy Warning
User-agent: VCI
User-agent: VCI WebViewer VCI WebViewer Win32
User-agent: Web Image Collector
User-agent: WebAuto
User-agent: WebBandit
User-agent: WebBandit/3.50
User-agent: WebCopier
User-agent: webcopy
User-agent: WebEnhancer
User-agent: WebmasterWorldForumBot
User-agent: webmirror
User-agent: WebReaper
User-agent: WebSauger
User-agent: website extractor
User-agent: Website Quester
User-agent: Webster Pro
User-agent: WebStripper
User-agent: WebStripper/2.02
User-agent: WebZip
User-agent: WebZip/4.0
User-agent: Wget
User-agent: Wget/1.5.3
User-agent: Wget/1.6
User-agent: WinHTTrack
User-agent: WWW-Collector-E
User-agent: Xenu
User-agent: Xenu's
User-agent: Xenu's Link Sleuth 1.1c
User-agent: Zao
User-agent: Zealbot
User-agent: Zeus
User-agent: Zeus 32297 Webster Pro V2.9 Win32
User-agent: ZyBORG
Disallow: /