# robots.txt - crawler access rules.
# Each "User-agent" line opens a group; the Allow/Disallow lines directly
# beneath it apply to that crawler. Keep ONE directive per line: "#" starts a
# comment that runs to the end of the line, so a directive placed after a
# comment on the same line is ignored by parsers.

User-agent: Googlebot
# Don't index mobile versions
Disallow: /index.php?*;wap
Disallow: /index.php?*;wap2
Disallow: /index.php?*;imode
Disallow: /attachments/
Disallow: /Packages/
Disallow: /Smileys/
Disallow: /Sources/
Disallow: /Themes/
Disallow: /index.php?action=activate
Disallow: /index.php?action=admin
Disallow: /index.php?action=calendar
Disallow: /index.php?action=emailuser
Disallow: /index.php?action=findmember
Disallow: /index.php?action=help
Disallow: /index.php?action=helpadmin
Disallow: /index.php?action=login
Disallow: /index.php?action=logout
Disallow: /index.php?action=mlist
Disallow: /index.php?action=modifykarma
Disallow: /index.php?action=otherkarma
Disallow: /index.php?action=pm
Disallow: /index.php?action=post
Disallow: /index.php?action=printpage
Disallow: /index.php?action=profile
Disallow: /index.php?action=recent
Disallow: /index.php?action=register
Disallow: /index.php?action=reminder
Disallow: /index.php?action=search
Disallow: /index.php?action=theme
Disallow: /index.php?action=unread
Disallow: /index.php?action=unreadreplies
Disallow: /index.php?action=verificationcode
Disallow: /index.php?action=who
Disallow: /index.php?theme
Disallow: /index.php?action=stats;expand
Disallow: /index.php?action=stats;collapse
Disallow: /tv-program/
Disallow: /gosetup=
Disallow: /comments.html?

# Yahoo - Too aggressive
# So limit it as much as possible.
User-agent: Slurp
# Disallow Everything
# NOTE(review): this rule only covers paths under /forum/, while the Allow
# rules below target /index.php at the site root - confirm whether
# "Disallow: /" was intended here.
Disallow: /forum/
# Now allow bits and then disallow bits
Allow: /sitemap.xml$
Allow: /robots.txt$
Allow: /index.php$
Allow: /index.php?topic=*.0$
Allow: /index.php?topic=*.*0$
Allow: /index.php?topic=*.*5$
Allow: /index.php?board=*.0$
Allow: /index.php?board=*.*0$
Allow: /index.php?board=*.*5$
# But don't allow these
Disallow: /index.php?*.msg
Disallow: /index.php?topic=*.msg*0$
Disallow: /index.php?topic=*.msg*5$
Disallow: /index.php?*.new
# Anything with a ; disallow
# NOTE(review): uses the /forum/ prefix, unlike the root-level /index.php
# rules in the rest of this group - confirm the intended path.
Disallow: /forum/index.php?*;*

# Bad bot - Often ignores robots.txt - Waste of bandwidth
# Despite claiming on their website to be a search engine in development
# I'm suspicious as to whether they are a harvester pretending to be SE
User-agent: Twiceler
Disallow: /

User-agent: W3C-checklink
Disallow: /

User-agent: TurnitinBot
Disallow: /

# Stop following PHPSESSIDs
User-agent: MJ12bot
Disallow: /index.php?PHPSESSID

# Catch all (remainder)
# Will be followed by any bots other than ones identified above
# Uses BASIC robots.txt directives without wildcards, end-anchors etc
# So Spiders should understand these (including MSNBOT)
User-agent: *
# Default SMF Folders
Disallow: /attachments/
Disallow: /Packages/
Disallow: /Smileys/
Disallow: /Sources/
Disallow: /Themes/
Disallow: /index.php?action=activate
Disallow: /index.php?action=admin
Disallow: /index.php?action=calendar
Disallow: /index.php?action=emailuser
Disallow: /index.php?action=findmember
Disallow: /index.php?action=help
Disallow: /index.php?action=helpadmin
Disallow: /index.php?action=login
Disallow: /index.php?action=logout
Disallow: /index.php?action=mlist
Disallow: /index.php?action=modifykarma
Disallow: /index.php?action=otherkarma
Disallow: /index.php?action=pm
Disallow: /index.php?action=post
Disallow: /index.php?action=printpage
Disallow: /index.php?action=profile
Disallow: /index.php?action=recent
Disallow: /index.php?action=register
Disallow: /index.php?action=reminder
Disallow: /index.php?action=search
Disallow: /index.php?action=theme
Disallow: /index.php?action=unread
Disallow: /index.php?action=unreadreplies
Disallow: /index.php?action=verificationcode
Disallow: /index.php?action=who
Disallow: /index.php?theme
Disallow: /index.php?action=stats;expand
Disallow: /index.php?action=stats;collapse
Disallow: /tv-program/
Disallow: /gosetup=
Disallow: /comments.html?

# Sitemap location; this directive is independent of the User-agent groups.
Sitemap: http://forum.orionet.ru/sitemap.xml