# robots.txt
#
# Formatting rule for maintainers: keep ONE directive per line. In robots.txt
# everything from "#" to the end of the physical line is a comment, so a
# directive that shares a line with an earlier "#" is silently ignored.

User-agent: *

# ==========================================
# AEM SYSTEM & SECURITY (CRITICAL)
# ==========================================
Disallow: /.rum/
Disallow: /errors/
Disallow: /*_jcr_content
Disallow: /*.lc-*
Disallow: /*.infinity.json
Disallow: /*.tidy.json
Disallow: /*.sysview.xml
Disallow: /*.docview.json
# NOTE(review): this blocks every URL ending in ".json". If pages load JSON at
# render time, crawlers that render JavaScript will not be able to fetch it.
# Confirm this is intended.
Disallow: /*.json$

# ==========================================
# TRACKING PARAMETERS (SEO & CRAWL BUDGET)
# ==========================================
# Each parameter is listed twice: "?name" matches it as the first query
# parameter, "&name" matches it in any later position.
Disallow: /*?utm_*
Disallow: /*&utm_*
Disallow: /*?ref=*
Disallow: /*&ref=*
Disallow: /*?source=*
Disallow: /*&source=*
Disallow: /*?sessionid=*
Disallow: /*&sessionid=*
Disallow: /*?sid=*
Disallow: /*&sid=*
Disallow: /*?wcmmode=*
Disallow: /*&wcmmode=*
Disallow: /*?cq_ck=*
Disallow: /*&cq_ck=*

# ==========================================
# ALLOW RULES (ASSETS)
# ==========================================
# Block all DAM by default.
Disallow: /content/dam/*
# Then allow specific extensions. Crawlers that follow RFC 9309 apply the
# longest matching pattern, so these Allow rules override the shorter
# Disallow above for URLs ending in the listed extensions.
Allow: /content/dam/*.pdf$
Allow: /content/dam/*.docx$
Allow: /content/dam/*.xlsx$
Allow: /content/dam/*.xls$
Allow: /content/dam/*.pptx$
Allow: /content/dam/*.ppt$
Allow: /content/dam/*.mp4$
Allow: /content/dam/*.mp3$
Allow: /content/dam/*.zip$
Allow: /content/dam/*.xhtml$
Allow: /content/dam/*.ico$
Allow: /content/dam/*.png$
Allow: /content/dam/*.svg$
Allow: /content/dam/*.jpg$
Allow: /content/dam/*.jpeg$
# NOTE(review): "$" anchors the end of the URL, so stylesheet/script URLs that
# carry a query string (e.g. "?v=1") are not matched by the two rules below.
Allow: /*.css$
Allow: /*.js$
Allow: /sitemap*.xml

# ==========================================
# SITEMAPS
# ==========================================
Sitemap: https://www.fincantieri.com/sitemap.xml

# ==========================================
# BAD BOTS BLOCKLIST (LEGACY)
# ==========================================
# Each agent below gets its own group that disallows the entire site.

User-agent: HTTrack
Disallow: /

User-agent: wget
Disallow: /

User-agent: WebCopier
Disallow: /

User-agent: WebZIP
Disallow: /

User-agent: Teleport Pro
Disallow: /

User-agent: Offline Explorer
Disallow: /

User-agent: SiteSucker
Disallow: /

User-agent: WebReaper
Disallow: /

User-agent: WebStripper
Disallow: /

User-agent: SuperBot
Disallow: /

User-agent: WebWhacker
Disallow: /

User-agent: 008
Disallow: /

User-agent: ZyBORG
Disallow: /

User-agent: Download Ninja
Disallow: /

User-agent: ApptusBot
Disallow: /