# robots.txt
#
# Format: one directive per line. A group starts with one or more
# "User-agent:" lines and is followed by its Allow/Disallow rules.
# "#" starts a comment that runs to the end of the line, so directives
# must never share a line with a comment that precedes them.

# global live settings :
User-agent: *
Disallow: /cms_addon
Disallow: /cms_docs
Disallow: /redFACT
Disallow: /REST/frontend/itemstatistics

# Sitemap records are not tied to any user-agent group.
Sitemap: http://www.irishexaminer.com/sitemap-index/41-google_news.xml
Sitemap: http://www.irishexaminer.com/sitemap-index/44-google_sitemap.xml
Sitemap: http://www.irishexaminer.com/sitemap-index/227-google_channel_sitemap.xml

# customised settings :
# NOTE(review): this is a second "User-agent: *" group. RFC 9309 parsers
# combine it with the one above; confirm that any legacy crawler you care
# about does the same, or merge the two groups.
User-agent: *
Disallow: /pu_all
Disallow: /pu_examiner/scripts
Disallow: /pu_examiner/scss
Disallow: /pu_examiner/styles
Disallow: /pu_examiner/templates
Disallow: /pu_examiner/tpl
Disallow: /pu_examiner/*.htaccess
Disallow: /pu_examiner/*.md
Disallow: /pu_examiner/*.json
Disallow: /pu_examiner/*.php
Disallow: /pu_examiner/*.webmanifest
Disallow: /pu_examiner/*.js
Disallow: /pu_examiner/*.lock
Disallow: /pu_echo/scripts
Disallow: /pu_echo/scss
Disallow: /pu_echo/styles
Disallow: /pu_echo/templates
Disallow: /pu_echo/tpl
Disallow: /pu_echo/*.htaccess
Disallow: /pu_echo/*.md
Disallow: /pu_echo/*.json
Disallow: /pu_echo/*.php
Disallow: /pu_echo/*.webmanifest
Disallow: /pu_echo/*.js
Disallow: /pu_echo/*.lock

User-agent: ia_archiver
Disallow: /

# NOTE(review): robots.txt patterns are not regular expressions; "." is a
# literal dot and "*" is the only wildcard, so "/ar.*" matches paths that
# begin with "/ar." - confirm that is the intent.
User-agent: Googlebot
Allow: /
Disallow: /ar.*
Disallow: /pa.*
Disallow: /*?topic=*
Disallow: /*?type=amp*
Disallow: /*?utm_*
Disallow: /*?G2I_ActionId=*

User-agent: AdsBot-Google
Allow: /

User-agent: Googlebot-News
Disallow: /sponsored/
Disallow: /sponsored-content/
Disallow: /sponsoredshowcase/
Disallow: /test

# Exclude SEO-Tools & SPAM-Bots
User-agent: backlink-check.de
Disallow: /

User-agent: BacklinkCrawler
Disallow: /

User-agent: Bloodhound
Disallow: /

User-agent: cydralspider
Disallow: /

User-agent: downloadexpress
Disallow: /

User-agent: ExtractorPro
Disallow: /

User-agent: Fasterfox
Disallow: /

User-agent: gammaSpider
Disallow: /

User-agent: LinkextractorPro
Disallow: /

User-agent: LinkWalker
Disallow: /

User-agent: Meltwater
Disallow: /

User-agent: MJ12bot
Disallow: /

User-agent: Node/simplecrawler
Disallow: /

# The full product token must stay on the same line as "User-agent:".
User-agent: Node/simplecrawler 0.7.0 (git+https://github.com/cgiffard/node-simplecrawler.git)
Disallow: /

User-agent: ObjectsSearch
Disallow: /

User-agent: Openbot
Disallow: /

User-agent: Pimptrain
Disallow: /

User-agent: Raven
Disallow: /

User-agent: rogerbot
Disallow: /

User-agent: searchpreview
Disallow: /

User-agent: simplecrawler
Disallow: /

User-agent: SEODAT
Disallow: /

User-agent: SEOENGBot
Disallow: /

User-agent: SEOkicks-Robot
Disallow: /

User-agent: True_Robot
Disallow: /

User-agent: URL Control
Disallow: /

User-agent: URL_Spider_Pro
Disallow: /

User-agent: wapspider
Disallow: /

User-agent: WebZinger
Disallow: /

User-agent: xovi
Disallow: /

User-agent: CCBot
Disallow: /

User-agent: ChatGPT-User
Disallow: /

User-agent: GPTBot
Disallow: /