# robots.txt
#
# Every directive must sit on its own line: anything following a '#' on the
# same line is a comment, so a collapsed file disables every rule.
#
# Standard robots.txt matching is a *prefix* match on the URL path, and every
# rule value must start with '/'. The '*' (any sequence) and '$' (end of URL)
# wildcards are part of RFC 9309 and are honoured by the major crawlers.

# ---------------------------------------------------------------------------
# Default group: all crawlers without a more specific group below.
# ---------------------------------------------------------------------------
# Exclude general-purpose forms that are reachable under many mount points of
# the site. The leading "/*" makes the rule match at any depth; a bare
# "login_form" (no leading slash) is not a valid path and matches nothing.
# NOTE(review): the original header also mentioned excluding an internal image
# bank, but no rule for it exists here - confirm whether one is needed.
User-agent: *
Disallow: /*login_form
Disallow: /*sendto_form

# ---------------------------------------------------------------------------
# Googlebot group. Googlebot obeys ONLY the most specific matching group, so
# the form rules are repeated here.
# ---------------------------------------------------------------------------
# Googlebot supports the '*' and '$' wildcards (not full regular expressions).
# Block every URL that carries a query string ('?'): content objects expose
# query strings only for actions or status reports, which would pollute search
# results. This also blocks ?set_language.
User-agent: Googlebot
Disallow: /*?*
Disallow: /*login_form$
Disallow: /*sendto_form$
Disallow: /*folder_factories$
# Site sections that must stay out of the index.
Disallow: /link-per-scaricare-materiali/
Disallow: /eventi/
Disallow: /calendario/
Disallow: /file-di-testo/
Disallow: /cast-e-crediti/
Disallow: /schede-produzioni/
Disallow: /foto-di-scena-per-stampa_la-canzone-di-nanda/
Disallow: /foto-di-scena-per-stampa_la-canzone-di-nanda-1/
Disallow: /la-canzone-di-nanda_trailer%20flv/
Disallow: /video-casale_flv-e-mov/

# ---------------------------------------------------------------------------
# Allow the AdSense bot on the entire site (currently disabled).
# ---------------------------------------------------------------------------
# User-agent: Mediapartners-Google*
# Disallow:
# Allow: /*