robots.txt details

saved: size: 6617 kb md5 checksum: 6d5ddd68e831d74587c55a0122bfdebc

websites using this robots.txt

content


# START YOAST BLOCK
# ---------------------------
User-agent: *
Disallow: /?s=
Disallow: /page/*/?s=
Disallow: /search/
Disallow: /wp-json/
Disallow: /?rest_route=

Sitemap: https://water4hussain.org/sitemap_index.xml
# ---------------------------
# END YOAST BLOCK

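# Blocking excluded pages from sitemap
# NOTE(review): the `Disallow: /` rule in this group blocks the entire site for
# every crawler that has no dedicated User-agent group, and the Sitemap URL here
# is on a different host than the one in the Yoast block - confirm both are intended.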
User-agent: *
Disallow: /
Sitemap: https://shiaspouse.org/sitemap.xml

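# Block Common Crawl (CCBot), whose corpus is commonly used for AI training.
# Note: OpenAI's own crawlers identify as GPTBot / ChatGPT-User, not CCBot.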
User-agent: CCBot
Disallow: /

# Block archive.org bots
User-agent: ia_archiver
Disallow: /
User-agent: archive.org_bot
Disallow: /
User-agent: ia_archiver-web.archive.org
Disallow: /

# Block Xenu Crawler
User-agent: Xenu
Disallow: /
User-agent: Xenu's Link Sleuth 1.1c
Disallow: /

# Allow Google Bot
User-agent: Googlebot
Allow: /

# Allow Google Images Bot
User-agent: Googlebot-Image
Allow: /wp-content/uploads/

# Allow Google AdsBot
User-agent: AdsBot-Google
Allow: /

# Allow Google AdsBot Mobile
User-agent: AdsBot-Google-Mobile
Allow: /

# Allow Bing Bot
User-agent: Bingbot
Allow: /

# Allow MSN Bot
User-agent: Msnbot
Allow: /

# Allow MSNBot Media
User-agent: msnbot-media
Allow: /wp-content/uploads/

# Allow Apple Bot
User-agent: Applebot
Allow: /

# Allow Yandex Bot
User-agent: Yandex
Allow: /

# Allow Yandex Images Bot
User-agent: YandexImages
Allow: /wp-content/uploads/

# Allow Yahoo Search (Slurp bot)
User-agent: Slurp
Allow: /

# Allow DuckDuckGo Bot
User-agent: DuckDuckBot
Allow: /

# Block Qwant Bot
User-agent: Qwantify
Disallow: /

# Block Baidu/Sogou/Soso/Youdao Bots
User-agent: Baiduspider
Disallow: /
User-agent: Baiduspider/2.0
Disallow: /
User-agent: Baiduspider-video
Disallow: /
User-agent: Baiduspider-image
Disallow: /
User-agent: Sogou spider
Disallow: /
User-agent: Sogou web spider
Disallow: /
User-agent: Sosospider
Disallow: /
User-agent: Sosospider+
Disallow: /
User-agent: Sosospider/2.0
Disallow: /
User-agent: yodao
Disallow: /
User-agent: youdao
Disallow: /
User-agent: YoudaoBot
Disallow: /
User-agent: YoudaoBot/1.0
Disallow: /

# Block Naver Bot
User-agent: Naverbot
Disallow: /

# Block Seznam Bot
User-agent: seznambot
Disallow: /

# Allow Webp Images
User-agent: *
Allow: /*.webp$

# Block Jpg Images
User-agent: *
Disallow: /*.jpg$

# Block Png Images
User-agent: *
Disallow: /*.png$

# Allow Gif Images
User-agent: *
Allow: /*.gif$

# Block Scraper Bots
User-agent: DotBot
Disallow: /
User-agent: GiftGhostBot
Disallow: /
User-agent: Seznam
Disallow: /
User-agent: PaperLiBot
Disallow: /
User-agent: Genieo
Disallow: /
User-agent: Dataprovider/6.101
Disallow: /
User-agent: DataproviderSiteExplorer
Disallow: /
User-agent: Dazoobot/1.0
Disallow: /
User-agent: Diffbot
Disallow: /
User-agent: DomainStatsBot/1.0
Disallow: /
User-agent: DotBot/1.1
Disallow: /
User-agent: dubaiindex
Disallow: /
User-agent: eCommerceBot
Disallow: /
User-agent: ExpertSearchSpider
Disallow: /
User-agent: Feedbin
Disallow: /
User-agent: Fetch/2.0a
Disallow: /
User-agent: FFbot/1.0
Disallow: /
User-agent: focusbot/1.1
Disallow: /
User-agent: HuaweiSymantecSpider
Disallow: /
User-agent: HuaweiSymantecSpider/1.0
Disallow: /
User-agent: JobdiggerSpider
Disallow: /
User-agent: LemurWebCrawler
Disallow: /
User-agent: LipperheyLinkExplorer
Disallow: /
User-agent: LSSRocketCrawler/1.0
Disallow: /
User-agent: LYT.SRv1.5
Disallow: /
User-agent: MiaDev/0.0.1
Disallow: /
User-agent: Najdi.si/3.1
Disallow: /
User-agent: BountiiBot
Disallow: /
User-agent: Experibot_v1
Disallow: /
User-agent: bixocrawler
Disallow: /
User-agent: bixocrawler TestCrawler
Disallow: /
User-agent: Crawler4j
Disallow: /
User-agent: Crowsnest/0.5
Disallow: /
User-agent: CukBot
Disallow: /
User-agent: Dataprovider/6.92
Disallow: /
User-agent: DBLBot/1.0
Disallow: /
User-agent: Diffbot/0.1
Disallow: /
User-agent: Digg Deeper/v1
Disallow: /
User-agent: discobot/1.0
Disallow: /
User-agent: discobot/1.1
Disallow: /
User-agent: discobot/2.0
Disallow: /
User-agent: discoverybot/2.0
Disallow: /
User-agent: Dlvr.it/1.0
Disallow: /
User-agent: DomainStatsBot/1.0
Disallow: /
User-agent: drupact/0.7
Disallow: /
User-agent: Ezooms/1.0
Disallow: /
User-agent: fastbot crawler beta 2.0
Disallow: /
User-agent: fastbot crawler beta 4.0
Disallow: /
User-agent: feedly social
Disallow: /
User-agent: Feedly/1.0
Disallow: /
User-agent: FeedlyBot/1.0
Disallow: /
User-agent: Feedspot
Disallow: /
User-agent: Feedspotbot/1.0
Disallow: /
User-agent: Clickagy Intelligence Bot v2
Disallow: /
User-agent: classbot
Disallow: /
User-agent: CISPA Vulnerability Notification
Disallow: /
User-agent: CirrusExplorer/1.1
Disallow: /
User-agent: Checksem/Nutch-1.10
Disallow: /
User-agent: CatchBot/5.0
Disallow: /
User-agent: CatchBot/3.0
Disallow: /
User-agent: CatchBot/2.0
Disallow: /
User-agent: CatchBot/1.0
Disallow: /
User-agent: CamontSpider/1.0
Disallow: /
User-agent: Buzzbot/1.0
Disallow: /
User-agent: Buzzbot
Disallow: /
User-agent: BusinessSeek.biz_Spider
Disallow: /
User-agent: BUbiNG
Disallow: /
User-agent: 008/0.85
Disallow: /
User-agent: 008/0.83
Disallow: /
User-agent: 008/0.71
Disallow: /
User-agent: ^Nail
Disallow: /
User-agent: FyberSpider/1.3
Disallow: /
User-agent: findlinks/1.1.6-beta5
Disallow: /
User-agent: g2reader-bot/1.0
Disallow: /
User-agent: findlinks/1.1.6-beta6
Disallow: /
User-agent: findlinks/2.0
Disallow: /
User-agent: findlinks/2.0.1
Disallow: /
User-agent: findlinks/2.0.2
Disallow: /
User-agent: findlinks/2.0.4
Disallow: /
User-agent: findlinks/2.0.5
Disallow: /
User-agent: findlinks/2.0.9
Disallow: /
User-agent: findlinks/2.1
Disallow: /
User-agent: findlinks/2.1.5
Disallow: /
User-agent: findlinks/2.1.3
Disallow: /
User-agent: findlinks/2.2
Disallow: /
User-agent: findlinks/2.5
Disallow: /
User-agent: findlinks/2.6
Disallow: /
User-agent: FFbot/1.0
Disallow: /
User-agent: findlinks/1.0
Disallow: /
User-agent: findlinks/1.1.3-beta8
Disallow: /
User-agent: findlinks/1.1.3-beta9
Disallow: /
User-agent: findlinks/1.1.4-beta7
Disallow: /
User-agent: findlinks/1.1.6-beta1
Disallow: /
User-agent: findlinks/1.1.6-beta1 Yacy
Disallow: /
User-agent: findlinks/1.1.6-beta2
Disallow: /
User-agent: findlinks/1.1.6-beta3
Disallow: /
User-agent: findlinks/1.1.6-beta4
Disallow: /
User-agent: bixo
Disallow: /
User-agent: bixolabs/1.0
Disallow: /
User-agent: Crawlera/1.10.2
Disallow: /
User-agent: Dataprovider Site Explorer
Disallow: /