# As a condition of accessing this website, you agree to abide by the following
# content signals:
# (a) If a Content-Signal = yes, you may collect content for the corresponding
# use.
# (b) If a Content-Signal = no, you may not collect content for the
# corresponding use.
# (c) If the website operator does not include a Content-Signal for a
# corresponding use, the website operator neither grants nor restricts
# permission via Content-Signal with respect to the corresponding use.
# The content signals and their meanings are:
# search: building a search index and providing search results (e.g., returning
# hyperlinks and short excerpts from your website's contents). Search does not
# include providing AI-generated search summaries.
# ai-input: inputting content into one or more AI models (e.g., retrieval
# augmented generation, grounding, or other real-time taking of content for
# generative AI search answers).
# ai-train: training or fine-tuning AI models.
# ANY RESTRICTIONS EXPRESSED VIA CONTENT SIGNALS ARE EXPRESS RESERVATIONS OF
# RIGHTS UNDER ARTICLE 4 OF THE EUROPEAN UNION DIRECTIVE 2019/790 ON COPYRIGHT
# AND RELATED RIGHTS IN THE DIGITAL SINGLE MARKET.
# BEGIN Cloudflare Managed content
# Group for crawlers that match no more specific group in this file.
# Content-Signal: collecting for search is permitted, collecting for AI
# training is not; no ai-input signal is given, so that use is neither
# granted nor restricted here. "Allow: /" leaves every path crawlable.
User-agent: *
Content-Signal: search=yes,ai-train=no
Allow: /
# Each crawler named below is denied the entire site ("Disallow: /").
User-agent: Amazonbot
Disallow: /
User-agent: Applebot-Extended
Disallow: /
User-agent: Bytespider
Disallow: /
User-agent: CCBot
Disallow: /
User-agent: ClaudeBot
Disallow: /
User-agent: CloudflareBrowserRenderingCrawler
Disallow: /
User-agent: Google-Extended
Disallow: /
User-agent: GPTBot
Disallow: /
User-agent: meta-externalagent
Disallow: /
# END Cloudflare Managed Content
# If the Joomla site is installed within a folder such as at
# e.g. www.example.com/joomla/ the robots.txt file MUST be
# moved to the site root at e.g. www.example.com/robots.txt
# AND the joomla folder name MUST be prefixed to the disallowed
# path, e.g. the Disallow rule for the /administrator/ folder
# MUST be changed to read Disallow: /joomla/administrator/
#
# For more information about the robots.txt standard, see:
# http://www.robotstxt.org/orig.html
#
# For syntax checking, see:
# http://tool.motoricerca.info/robots-checker.phtml
# Semrush settings
# SiteAuditBot and SemrushBot-SI: an empty Disallow value blocks nothing, so
# these two crawlers may fetch every path on the site.
User-agent: SiteAuditBot
Disallow:
User-agent: SemrushBot-SI
Disallow:
# SemrushBot: request a 5-second pause between fetches. Crawl-delay is not
# part of RFC 9309 and is honored only by crawlers that choose to support it.
# SemrushBot is also named in the Disallow group further down this file.
User-agent: SemrushBot
Crawl-delay: 5
# To limit CPU load on the server, ask these crawlers to wait 10 seconds
# between requests.
# NOTE(review): Google documents that Googlebot ignores Crawl-delay, and
# Amazonbot is separately denied the whole site (Disallow: /) earlier in this
# file, so this group may have no practical effect - confirm.
User-agent: Amazonbot
User-agent: Googlebot
Crawl-delay: 10
# Search-engine crawlers and SemrushBot: keep them out of the directories
# listed below (presumably Joomla system folders plus site-private folders
# such as /devsite/, /cathy/ and /databasebackups/ - verify).
# NOTE(review): a crawler that matches a named group does not also apply the
# "User-agent: *" group, so the static-asset Allow rules listed under
# "User-agent: *" later in this file do not apply to these crawlers - confirm
# that is intended.
User-agent: googlebot
User-agent: google
User-agent: bingbot
User-agent: bing
User-agent: SemrushBot
Disallow: /bin/
Disallow: /cache/
Disallow: /cli/
Disallow: /includes/
Disallow: /installation/
Disallow: /language/
Disallow: /layouts/
Disallow: /libraries/
Disallow: /logs/
Disallow: /tmp/
Disallow: /devsite/
Disallow: /cathy/
Disallow: /databasebackups/
# Rules for every crawler that is not matched by a more specific group.
User-agent: *
# Let crawlers fetch static assets (scripts, stylesheets, images) so pages can
# be rendered. The trailing "*" is redundant because rules are prefix matches.
# NOTE(review): crawlers that use longest-match precedence (RFC 9309) let a
# longer Disallow such as /libraries/ override these short patterns, so assets
# under the longer-named directories below stay blocked - confirm intended.
Allow: /*.js*
Allow: /*.css*
Allow: /*.png*
Allow: /*.jpg*
Allow: /*.gif*
Allow: /*.ico*
# Removed: five "Allow: https://www.<host>/b*" rules for the external hosts
# pntra.com, pjtra.com, pjatr.com, gopjn.com and pntrs.com. A rule value must
# be a path on THIS host beginning with "/"; a robots.txt file cannot grant or
# deny access to other hosts, which are governed by their own robots.txt.
# Standards-compliant parsers never matched those rules, and a lenient parser
# could misread them as "Allow: /b*" and expose /bin/.
# Directories that crawlers must not fetch.
Disallow: /bin/
Disallow: /cache/
Disallow: /cli/
Disallow: /includes/
Disallow: /installation/
Disallow: /language/
Disallow: /layouts/
Disallow: /libraries/
Disallow: /logs/
Disallow: /tmp/
Disallow: /devsite/
Disallow: /cathy/
Disallow: /databasebackups/
# JSitemap entries
# Sitemap URLs served by the site's com_jmap component, one per format.
# Sitemap lines are independent of the user-agent groups in this file.
# NOTE(review): the last three entries (/component/jmap/sitemap/...) look like
# SEF-URL forms of the xml, images and videos sitemaps already listed by query
# string - confirm whether both forms are needed.
Sitemap: https://equineinfoexchange.com/index.php?option=com_jmap&view=sitemap&format=xml
Sitemap: https://equineinfoexchange.com/index.php?option=com_jmap&view=sitemap&format=images
Sitemap: https://equineinfoexchange.com/index.php?option=com_jmap&view=sitemap&format=hreflang
Sitemap: https://equineinfoexchange.com/index.php?option=com_jmap&view=sitemap&format=gnews
Sitemap: https://equineinfoexchange.com/index.php?option=com_jmap&view=sitemap&format=mobile
Sitemap: https://equineinfoexchange.com/index.php?option=com_jmap&view=sitemap&format=videos
Sitemap: https://equineinfoexchange.com/component/jmap/sitemap/xml
Sitemap: https://equineinfoexchange.com/component/jmap/sitemap/images
Sitemap: https://equineinfoexchange.com/component/jmap/sitemap/videos