#####################################
#         robots.txt file           #
#                                   #
#       Jason Bedard - 2009         #
#       http://jbedard.ca           #
#####################################
#
# Layout rules used in this file:
#   - one directive per line; a '#' comments out the rest of its line
#   - records (a User-agent line plus its rules) are separated by blank lines
#   - no blank lines INSIDE a record: some parsers treat a blank line as the
#     end of the record, so bare '#' lines are used as visual separators

# Default rules for every crawler that has no dedicated record below.
User-agent: *
#maximum rate is one page every 4 minutes (240 seconds)
Crawl-Delay: 240
#
#basic/common directories
Disallow: /cache/
Disallow: /cgi-bin/
Disallow: /css/
Disallow: /images/
Disallow: /icons/
Disallow: /include/
Disallow: /includes/
Disallow: /js/
Disallow: /lib/
Disallow: /skins/
Disallow: /templates/
Disallow: /modules/
Disallow: /themes/
Disallow: /install/
Disallow: /upgrade/
Disallow: /uploads/
Disallow: /admin/
#
#stuff (currently disabled)
#Disallow: /googlebaf*
#Disallow: /y_key_*
#Disallow: /LiveSearchSiteAuth.xml
#
#images ('$' anchors the match to the end of the URL)
Disallow: /*.jpg$
Disallow: /*.jpeg$
Disallow: /*.JPG$
Disallow: /*.JPEG$
Disallow: /*.png$
Disallow: /*.PNG$
Disallow: /*.gif$
Disallow: /*.GIF$
#
#files that are not meant for viewing
# NOTE(review): these patterns have no trailing '$', so they also match longer
# paths that merely contain the extension (e.g. "/*.js" matches ".json").
# Confirm that this is intended.
Disallow: /*.inc
Disallow: /*.lib
Disallow: /*.class
Disallow: /*.js
Disallow: /*.css
#
#index pages (directory-listing sort links of the form ?C=...;O=...)
Disallow: /*?C=*;O=

#disallow a bunch of lame/foreign crawlers
# NOTE(review): a crawler that matches one of the records below follows ONLY
# that record and does not inherit the "User-agent: *" rules above.

User-agent: ArribaPacketRat
Disallow: /

User-agent: autoemailspider
Disallow: /

#chinese search engine
User-agent: baiduspider
Disallow: /

User-agent: BecomeBot
Disallow: /

User-agent: Bilbo
Disallow: /

User-agent: CazoodleBot
Disallow: /

#User-agent: Charlotte
#Disallow: /

User-agent: CatchBot
Disallow: /

User-agent: DBLBot
Disallow: /

User-agent: DigExt
Disallow: /

User-agent: dloader(NaverRobot)/1.0
Disallow: /

User-agent: DittoSpyder
Disallow: /

User-agent: DTS Agent
Disallow: /

#User-agent: duggmirror
#Disallow: /

User-agent: fast
Disallow: /

User-agent: Getleft 1.1b2
Disallow: /

User-agent: girafa
Disallow: /

User-agent: Gigabot
Disallow: /

User-agent: Googlebot-Image
Disallow: /

User-agent: grub-client
Disallow: /

#gmx.net
User-agent: Larbin
Disallow: /

User-agent: HTMLAB
Disallow: /

User-agent: httrack
Disallow: /

User-agent: ia_archiver
Disallow: /

User-agent: ImageVampire
Disallow: /

User-agent: k2spider
Disallow: /

User-agent: mail sweeper
Disallow: /

# Throttled rather than blocked: the Disallow is intentionally commented out.
User-agent: MJ12bot
Crawl-Delay: 500
#Disallow: /

User-agent: MSIECrawler
Disallow: /

User-agent: msnbot-media
Disallow: /

User-agent: msnbot-MM
Disallow: /

User-agent: msnbot-news
Disallow: /

User-agent: msnbot-products
Disallow: /

User-agent: NetCaptor
Disallow: /

User-agent: NetSeer
Disallow: /

User-agent: NetcraftSurveyAgent
Disallow: /

User-agent: NITLE Blog Spider/0.01
Disallow: /

User-agent: NPBot
Disallow: /

User-agent: nutch
Disallow: /

User-agent: oBot
Disallow: /

User-agent: Offline Explorer
Disallow: /

User-agent: OmniExplorer_Bot
Disallow: /

User-agent: PSBot
Disallow: /

User-agent: QuepasaCreep v0.9.13
Disallow: /

User-agent: Scooter/3.3
Disallow: /

#User-agent: SimilarPages
#Disallow: /

User-agent: sitecheck.internetseer.com
Disallow: /

#User-agent: Slurp/2.0
#Disallow: /

User-agent: SpiderKU/0.9
Disallow: /

User-agent: Steeler
Disallow: /

User-agent: SurveyBot/2.3
Disallow: /

User-agent: szukacz
Disallow: /

User-agent: Szukacz/1.5
Disallow: /

User-agent: TurnitinBot
Disallow: /

User-agent: Vagabondo/2.1
Disallow: /

User-agent: vischeck_spiderBot/0.1libwww-perl/5.48
Disallow: /

# Throttled rather than blocked: the Disallow is intentionally commented out.
User-agent: voyager
Crawl-delay: 500
#Disallow: /

User-agent: vscooter
Disallow: /

User-agent: WebCopier v3.3
Disallow: /

User-agent: WebCopier v3.2a
Disallow: /

User-agent: WebCopier
Disallow: /

User-agent: webcrawler
Disallow: /

User-agent: Web Downloader/4.9
Disallow: /

User-agent: Web Downloader/5.8
Disallow: /

User-agent: WebGather 3.0
Disallow: /

User-agent: WebStripper/2.56
Disallow: /

User-agent: WebZIP/3.65
Disallow: /

User-agent: WebZIP
Disallow: /

User-agent: Wget
Disallow: /

User-agent: Zao
Disallow: /

#yahoo images
User-agent: Yahoo-MMCrawler
Disallow: /

#yahoo movies
User-agent: Yahoo-MMAudVid
Disallow: /

User-agent: Yandex
Disallow: /

User-agent: Zeus 2.6
Disallow: /