# $Id: robots.txt,v 1.9.2.1 2008/12/10 20:12:19 goba Exp $
#
# robots.txt
#
# This file is to prevent the crawling and indexing of certain parts
# of your site by web crawlers and spiders run by sites like Yahoo!
# and Google. By telling these "robots" where not to go on your site,
# you save bandwidth and server resources.
#
# This file will be ignored unless it is at the root of your host:
# Used:    http://example.com/robots.txt
# Ignored: http://example.com/site/robots.txt
#
# For more information about the robots.txt standard, see:
# http://www.robotstxt.org/wc/robots.html
#
# For syntax checking, see:
# http://www.sxw.org.uk/computing/robots/check.html
#
# Formatting: one directive per line. Blank lines appear only between
# groups, never inside one, because parsers that follow the original
# robots.txt specification treat a blank line as the end of a record.

User-agent: *
Crawl-delay: 10
# Default SMF Actions
Disallow: /index.php?PHPSESSID=*
Disallow: /index.php?*rss*
Disallow: /index.php?*;wap
Disallow: /index.php?*;wap2
Disallow: /index.php?*;imode
Disallow: /index.php?action=activate
Disallow: /index.php?action=admin
Disallow: /index.php?action=calendar*
Disallow: /index.php?action=emailuser
Disallow: /index.php?action=findmember
Disallow: /index.php?action=help
Disallow: /index.php?action=helpadmin
Disallow: /index.php?action=login*
Disallow: /index.php?action=logout
Disallow: /index.php?action=mlist
Disallow: /index.php?action=modifykarma
Disallow: /index.php?action=pm
Disallow: /index.php?action=post
Disallow: /index.php?action=printpage*
Disallow: /index.php?action=profile*
Disallow: /index.php?action=recent
Disallow: /index.php?action=register*
Disallow: /index.php?action=reminder
Disallow: /index.php?action=search*
Disallow: /index.php?action=theme
Disallow: /index.php?action=unread
Disallow: /index.php?action=unreadreplies
Disallow: /index.php?action=verificationcode
Disallow: /index.php?action=who
Disallow: /index.php?theme
Disallow: /index.php?action=stats*
# Spammers - no thanks
Disallow: /index.php?action=http
Disallow: /index.php?board=http
Disallow: /index.php?topic=http
Disallow: /index.php?www
Disallow: /index.php?action=links
Disallow: /index.php?f=
# SMF Mod Related
Disallow: /index.php?action=comment
Disallow: /index.php?action=recenttopics
Disallow: /index.php?action=mm
Disallow: /index.php?action=viewkarma
Disallow: /index.php?action=sendtopic
# Directories
Disallow: /Themes
Disallow: /forum?
Disallow: /news/includes/
Disallow: /news/misc
Disallow: /news/modules/
Disallow: /news/profiles/
Disallow: /news/scripts/
Disallow: /news/sites/
Disallow: /news/themes/
# Files
Disallow: /news/CHANGELOG.txt
Disallow: /news/cron.php
Disallow: /news/INSTALL.mysql.txt
Disallow: /news/INSTALL.pgsql.txt
Disallow: /news/install.php
Disallow: /news/INSTALL.txt
Disallow: /news/LICENSE.txt
Disallow: /news/MAINTAINERS.txt
Disallow: /news/update.php
Disallow: /news/UPGRADE.txt
Disallow: /news/xmlrpc.php
# Paths (clean URLs)
Disallow: /news/admin/
Disallow: /news/comment/reply/
Disallow: /news/contact
Disallow: /news/logout
# NOTE(review): rules are prefix matches, so the next line also covers
# every /news/node/<id> page - confirm that is intended.
Disallow: /news/node
Disallow: /news/search/
Disallow: /news/user/register
Disallow: /news/user/password
Disallow: /news/user/login
# Paths (no clean URLs)
Disallow: /news/?q=admin/
Disallow: /news/?q=comment/reply/
Disallow: /news/?q=contact/
Disallow: /news/?q=logout/
Disallow: /news/?q=node/add/
Disallow: /news/?q=search/
Disallow: /news/?q=user/password
Disallow: /news/?q=user/register
Disallow: /news/?q=user/login
Disallow: /news/ro?
Disallow: /news/node?
Disallow: /news/page?
# If you don't want the bulk of your "recent posts" pages indexed, add this:
Disallow: /news/tracker?

# Wayback Machine - disallow all (www.archive.org)
# ia_archiver (+http://www.alexa.com/site/help/webmasters; crawler@alexa.com)
User-agent: ia_archiver
Disallow: /