#
# robots.txt
#
# This file is to prevent the crawling and indexing of certain parts
# of your site by web crawlers and spiders run by sites like Yahoo!
# and Google. By telling these "robots" where not to go on your site,
# you save bandwidth and server resources.
#
# This file will be ignored unless it is at the root of your host:
# Used:    http://example.com/robots.txt
# Ignored: http://example.com/site/robots.txt
#
# For more information about the robots.txt standard, see:
# http://www.robotstxt.org/robotstxt.html
#
# Layout of this file:
#   1. Default policy: every crawler without its own group is blocked.
#   2. Allow-listed crawlers (Google, social preview fetchers, ...).
#   3. Block-listed crawlers (one group per bot, each "Disallow: /").
#
# A crawler obeys only the group that matches its user-agent; it falls
# back to "User-agent: *" only when no specific group matches. Each
# user-agent therefore appears in exactly one group below.

# ---------------------------------------------------------------------
# 1. Default policy
# ---------------------------------------------------------------------

User-agent: *
Disallow: /
Disallow: /content/40000-bail-man-fraudulent-conversion-charge
#Crawl-delay: 10

# ---------------------------------------------------------------------
# 2. Allow-listed crawlers
# ---------------------------------------------------------------------
# Note: Google's robots.txt documentation states that its crawlers do
# not support Crawl-delay; the directive is kept for other parsers.

#Googlebot bot
User-agent: Googlebot
Allow: /
Crawl-delay: 30

User-agent: Googlebot-Image
Allow: /
Crawl-delay: 30

User-agent: Googlebot-Video
Allow: /
Crawl-delay: 30

User-agent: Googlebot-News
Allow: /
Crawl-delay: 30

User-agent: Googlebot-Mobile
Allow: /
Crawl-delay: 30

User-agent: Mediapartners-Google
Allow: /
Crawl-delay: 30

User-agent: Adsbot-Google
Allow: /
Crawl-delay: 30

User-agent: Twitterbot
Disallow:
Crawl-delay: 30

User-agent: facebookexternalhit
Disallow:
Crawl-delay: 30

User-agent: facebookexternalhit/1.1
Disallow:
Crawl-delay: 30

User-agent: trendictionbot0.5.0
Disallow:
Crawl-delay: 30
# NOTE(review): the rules from here down to the next "User-agent" line
# have no User-agent line of their own, so they belong to the
# trendictionbot0.5.0 group above and bind only that crawler. Crawlers
# with their own group (e.g. Googlebot, "Allow: /") are NOT restricted
# by the /content/..., /nl and /fr exclusions below. If those exclusions
# are meant for search engines, repeat them in the relevant groups.
# Confirm intent before changing.
# CSS, JS, Images
Allow: /core/*.css$
Allow: /core/*.css?
Allow: /core/*.js$
Allow: /core/*.js?
Allow: /core/*.gif
Allow: /core/*.jpg
Allow: /core/*.jpeg
Allow: /core/*.png
Allow: /core/*.svg
Allow: /profiles/*.css$
Allow: /profiles/*.css?
Allow: /profiles/*.js$
Allow: /profiles/*.js?
Allow: /profiles/*.gif
Allow: /profiles/*.jpg
Allow: /profiles/*.jpeg
Allow: /profiles/*.png
Allow: /profiles/*.svg
# Directories
Disallow: /core/
Disallow: /profiles/
# Files
Disallow: /README.txt
Disallow: /web.config
# Paths (clean URLs)
Disallow: /admin/
Disallow: /comment/reply/
Disallow: /filter/tips/
Disallow: /node/add/
Disallow: /search/
Disallow: /user/register/
Disallow: /user/password/
Disallow: /user/login/
Disallow: /user/logout/
# Paths (no clean URLs)
Disallow: /index.php/admin/
Disallow: /index.php/comment/reply/
Disallow: /index.php/filter/tips/
Disallow: /index.php/node/add/
Disallow: /index.php/search/
Disallow: /index.php/user/password/
Disallow: /index.php/user/register/
Disallow: /index.php/user/login/
Disallow: /index.php/user/logout/
Disallow: /content/hotelier-freed-fraud-charges
Disallow: /content/spelling-mix-former-hotel-manager-innocent-says-attorney
Disallow: /content/prominent-greek-national-freed-financial-crime-charge-locally
#GSC
Disallow: /nl
Disallow: /fr
Disallow: /index.php/nl
Disallow: /index.php/fr

#mediapartners-googlebot
User-agent: Mediapartners-Googlebot
Allow: /
Crawl-delay: 30

#KauaiBot bot
User-agent: KauaiBot
Allow: /
Crawl-delay: 30

# ---------------------------------------------------------------------
# 3. Block-listed crawlers
# ---------------------------------------------------------------------

# carma.com Bot
User-agent: ScooperBot
Disallow: /

#Archive bot
User-agent: special_archiver
Disallow: /

#SemrushBot bot
User-agent: SemrushBot
Disallow: /

#MJ12bot bot
User-agent: MJ12bot
Disallow: /

#BLEXBot bot
User-agent: BLEXBot
Disallow: /

#DotBot bot
User-agent: DotBot
Disallow: /

#Eyeotabot bot
User-agent: Eyeotabot
Disallow: /

#bingbot bot
User-agent: bingbot
Disallow: /
#Crawl-delay: 30

#YandexBot bot
User-agent: YandexBot
Disallow: /
Crawl-delay: 30

#Mediatoolkitbot bot
User-agent: Mediatoolkitbot
Disallow: /

#CriteoBot bot
User-agent: CriteoBot
Disallow: /

#BLP_bbot bot
User-agent: BLP_bbot
Disallow: /

#PetalBot bot
User-agent: PetalBot
Disallow: /

#archive.org_bot bot
User-agent: archive.org_bot
Disallow: /

#Nimbostratus-Bot bot
User-agent: Nimbostratus-Bot
Disallow: /

#TweetmemeBot bot
User-agent: TweetmemeBot
Disallow: /

#Barkrowler bot
User-agent: Barkrowler
Disallow: /

#SemrushBot-BM bot
User-agent: SemrushBot-BM
Disallow: /

#MauiBot bot
User-agent: MauiBot
Disallow: /

#CrsspxlBot bot
User-agent: CrsspxlBot
Disallow: /

#AASA-Bot bot
User-agent: AASA-Bot
Disallow: /

#DemandbasePublisherAnalyzer bot
User-agent: DemandbasePublisherAnalyzer
Disallow: /

#MojeekBot bot
User-agent: MojeekBot
Disallow: /

#BomboraBot bot
User-agent: BomboraBot
Disallow: /

#SeznamBot bot
User-agent: SeznamBot
Disallow: /

#BLP_bbot/0.1 bot
User-agent: BLP_bbot/0.1
Disallow: /

#AhrefsBot
User-agent: AhrefsBot
Disallow: /

#moatbot
User-agent: moatbot
Disallow: /

User-agent: AAABot
Disallow: /

User-agent: AndersPinkBot
Disallow: /

User-agent: Seekport
Disallow: /

User-agent: VoluumDSP-content-bot
Disallow: /

User-agent: MegaIndex.ru
Disallow: /

User-agent: ias-va
Disallow: /

User-agent: Applebot
Disallow: /

User-agent: admantx-ussy04
Disallow: /

User-agent: python-requests
Disallow: /

User-agent: Semanticbot
Disallow: /

User-agent: Feedio.co Feed Crawler
Disallow: /

User-agent: GumGum
Disallow: /

User-agent: ias-ir
Disallow: /

User-agent: ias-or
Disallow: /

User-agent: ias-sg
Disallow: /