# Define access restrictions for robots/spiders.
# http://www.robotstxt.org/wc/norobots.html
#
# By default we allow robots to access all areas of our site
# already accessible to anonymous users.
#
# Every rule path must begin with "/". Names that should be blocked
# wherever they appear in a URL use the "*" wildcard ("/*name").

User-agent: *
Disallow: /*set_language
Disallow: /*force_web
Disallow: /*login_form
Disallow: /*sendto_form
Disallow: /footer-text
Disallow: /fi/ohjeet
Disallow: /jasenedut
Disallow: /fi/jasenedut
Disallow: /search_form
# Root-anchored duplicates kept for crawlers without wildcard support.
Disallow: /sendto_form
Disallow: /accessibility-info
Disallow: /login_form
Disallow: /mail_password_form?userid=
Disallow: /news_item
Disallow: /enabling_cookie
Disallow: /portal_javascripts
Disallow: /portal_kss
Disallow: /author
Disallow: /talkback
Disallow: /RSS
Disallow: /*folder_contents

# Googlebot supports wildcard patterns ("*" and "$") in rule paths;
# these are not full regular expressions.
# Block all URLs including query strings (? pattern) - contentish objects
# expose query strings only for actions or status reports, which might
# confuse search results.
# This will also block ?set_language.
#
# NOTE(review): a crawler obeys only the most specific group that matches
# it, so the rules in the "*" group above are not applied to Googlebot.
# Confirm that the shorter list below is intentional.

User-agent: Googlebot
Disallow: /*?*
Disallow: /*talkback
Disallow: /*RSS
Disallow: /*login_form
Disallow: /*sendto_form
Disallow: /*folder_contents
Disallow: /jasenedut
Disallow: /fi/jasenedut