# The robots.txt file is a good way to prevent a page from getting indexed.
# However, not every site can use it.
# The only robots.txt file that the spiders will read is the one in the
# top-level HTML directory (document root) of your server.
# This means you can only use it if you run your own domain.
#
# Exclude all search engine spiders from the entire domain:
#
# User-agent: *
# Disallow: /
#
# Exclude all spiders from certain directories:
#
# User-agent: *
# Disallow: /aboutme/
# Disallow: /stats/
#
# Exclude certain files:
#
# User-agent: *
# Disallow: /aboutme/album.html
# Disallow: /stats/refer.htm
#
# Exclude a specific search engine spider from indexing part of your site:
#
# User-agent: Robot_Name
# Disallow: /zine/spam1.htm
#
# NOTE(review): the group below is commented out like the examples above, so
# it is not in effect. Remove the leading "# " from these four lines if the
# rules are meant to be active -- confirm the intent before doing so.
#
# User-agent: *
# Disallow: /baldo.2004/
# Disallow: /spark.2004/
# Disallow: /josef/