#
# robots.txt for http://www.microsiervos.com
#

# Las Tres Leyes de la Robótica
#
# 1. Un robot no puede causar daño a un ser humano o, por su inacción,
# permitir que un ser humano sufra daño.
#
# 2. Un robot debe obedecer las órdenes que le sean dadas por un ser
# humano, a menos que dichas órdenes entren en conflicto con la Primera Ley.
#
# 3. Un robot debe proteger su propia existencia, siempre que ello no entre
# en conflicto con la Primera o la Segunda Ley.
#
# -- Isaac Asimov
#
# (robots.txt inspirado por yell.com/robots.txt)

# The rules below start with the section of Wikipedia's robots.txt
# (http://www.wikipedia.org/) that applies to "other" robots.
# Thanks, Wikipedians!
#
# Please note: There are a lot of pages on this site, and there are
# some misbehaved spiders out there that go _way_ too fast. If you're
# irresponsible, your access to the site may be blocked.
#

# Full-site ban: every URL path starts with "/", so "Disallow: /" leaves the
# named crawler nothing it is allowed to fetch.
User-agent: Orthogaffe
Disallow: /

# Crawlers that are kind enough to obey, but which we'd rather not have
# unless they're feeding search engines.
# Each record below bans one such crawler from the entire site.
User-agent: UbiCrawler
Disallow: /

User-agent: DOC
Disallow: /

User-agent: Zao
Disallow: /

# Some bots are known to be trouble, particularly those designed to copy
# entire sites. Please obey robots.txt.
# One record per bot; each record bans that bot from the entire site.
# NOTE(review): several names below contain spaces or dots ("Offline Explorer",
# "Download Ninja", "Microsoft.URL.Control", "sitecheck.internetseer.com").
# These fall outside the product-token grammar of RFC 9309, so how a given
# parser matches them may vary -- confirm they still take effect.
User-agent: sitecheck.internetseer.com
Disallow: /

User-agent: Zealbot
Disallow: /

User-agent: MSIECrawler
Disallow: /

User-agent: SiteSnagger
Disallow: /

User-agent: WebStripper
Disallow: /

User-agent: WebCopier
Disallow: /

User-agent: Fetch
Disallow: /

User-agent: Offline Explorer
Disallow: /

User-agent: Teleport
Disallow: /

User-agent: TeleportPro
Disallow: /

User-agent: WebZIP
Disallow: /

User-agent: linko
Disallow: /

User-agent: HTTrack
Disallow: /

User-agent: Microsoft.URL.Control
Disallow: /

User-agent: Xenu
Disallow: /

User-agent: larbin
Disallow: /

User-agent: libwww
Disallow: /

User-agent: ZyBORG
Disallow: /

User-agent: Download Ninja
Disallow: /

# Sorry, wget in its recursive mode is a frequent problem.
# Please read the man page and use it properly; there is a
# --wait option you can use to set the delay between hits,
# for instance.
#
User-agent: wget
Disallow: /

#
# The 'grub' distributed client has been *very* poorly behaved.
#
User-agent: grub-client
Disallow: /

#
# k2spider doesn't follow robots.txt anyway, but it is listed regardless.
#
User-agent: k2spider
Disallow: /

#
# NPBot hits the site many times per second, which is not acceptable.
# Bot info: http://www.nameprotect.com/botinfo.html
#
User-agent: NPBot
Disallow: /

# WebReaper is a capture bot: it downloads gazillions of pages with no
# public benefit.
# Bot info: http://www.webreaper.net/
User-agent: WebReaper
Disallow: /

# Site-specific rules for Microsiervos.com. They apply to every crawler that
# has no dedicated User-agent record elsewhere in this file. Each Disallow
# value is matched as a prefix of the URL path.
User-agent: *
Disallow: /msmt/                    # CMS, search CGI and others (ignore all)
# The next rule is already covered by the /msmt/ prefix above; it is kept as
# an explicit entry.
Disallow: /msmt/mt-search.cgi       # search CGI
Disallow: /microsiervos-al-azar.php  # Random dynamic page, not to be crawled
Disallow: /ad-free-blog.php  # Another random dynamic page, not to be crawled
Disallow: /version1/                        # Old version of the site, ignore
# Individual posts that should stay out of search results.
Disallow: /archivo/mundoreal/pollas-y-pito.html                   # ignore for search
Disallow: /archivo/leyendas-urbanas/sadam-hussein-porno-gay.html  # ignore for search
Disallow: /archivo/leyendas-urbanas/hunting-for-bambi.html        # ignore for search
# Per-year archive directories.
# NOTE(review): 1988 and 1995 are listed, but 1989-1994 and 1996-2000 are not;
# the reason is not stated here -- confirm the list is as intended.
Disallow: /archivo/1988/
Disallow: /archivo/1995/
Disallow: /archivo/2001/
Disallow: /archivo/2002/
Disallow: /archivo/2003/
Disallow: /archivo/2004/
Disallow: /archivo/2005/
Disallow: /archivo/2006/
Disallow: /archivo/2007/
# Presumably sidebar fragments that are not meant to be indexed on their own
# -- confirm.
# NOTE(review): "-sidebar-simpso" is a prefix of "-sidebar-simpson", so the
# last rule of this group already covers the one before it; it looks like a
# truncated duplicate -- confirm before removing either.
Disallow: /archivos/-sidebar-mapas
Disallow: /archivos/-sidebar-series
Disallow: /archivos/-sidebar-simpson
Disallow: /archivos/-sidebar-simpso
# NOTE(review): presumably alternate or paginated copies of the front page
# -- confirm.
Disallow: /index-2.html
Disallow: /index-3.html
Disallow: /index-4.html
# NOTE(review): the purpose of /old/ and /cloneblog/ is not documented here;
# the names suggest legacy or duplicate content -- confirm.
Disallow: /old/
Disallow: /cloneblog/
Disallow: /r/                    # ignore redirects

# Location of the XML sitemap. This directive is not tied to any User-agent record.
Sitemap: http://www.microsiervos.com/sitemap.xml
