# As a condition of accessing this website, you agree to abide by the following
# content signals:

# (a)  If a Content-Signal = yes, you may collect content for the corresponding
#      use.
# (b)  If a Content-Signal = no, you may not collect content for the
#      corresponding use.
# (c)  If the website operator does not include a Content-Signal for a
#      corresponding use, the website operator neither grants nor restricts
#      permission via Content-Signal with respect to the corresponding use.

# The content signals and their meanings are:

# search:   building a search index and providing search results (e.g., returning
#           hyperlinks and short excerpts from your website's contents). Search does not
#           include providing AI-generated search summaries.
# ai-input: inputting content into one or more AI models (e.g., retrieval
#           augmented generation, grounding, or other real-time taking of content for
#           generative AI search answers).
# ai-train: training or fine-tuning AI models.

# ANY RESTRICTIONS EXPRESSED VIA CONTENT SIGNALS ARE EXPRESS RESERVATIONS OF
# RIGHTS UNDER ARTICLE 4 OF THE EUROPEAN UNION DIRECTIVE 2019/790 ON COPYRIGHT
# AND RELATED RIGHTS IN THE DIGITAL SINGLE MARKET.

# BEGIN Cloudflare Managed content
# NOTE(review): the BEGIN/END markers suggest this section is generated by
# Cloudflare's managed robots.txt feature - confirm before hand-editing, since
# manual changes here may be overwritten.

# All crawlers: the whole site may be fetched. The content signal permits use
# for search indexing and declines use for AI training; no ai-input signal is
# given in this group.
User-agent: *
Content-Signal: search=yes,ai-train=no
Allow: /

# Each group below carries a single rule, Disallow: /, for the named crawler.
User-agent: Amazonbot
Disallow: /

User-agent: Applebot-Extended
Disallow: /

User-agent: Bytespider
Disallow: /

User-agent: CCBot
Disallow: /

User-agent: ClaudeBot
Disallow: /

User-agent: CloudflareBrowserRenderingCrawler
Disallow: /

User-agent: Google-Extended
Disallow: /

User-agent: GPTBot
Disallow: /

User-agent: meta-externalagent
Disallow: /

# END Cloudflare Managed Content

# As a condition of accessing this website, you agree to abide by the following
# content signals:

# (a)  If a Content-Signal = yes, you may collect content for the corresponding
#      use.
# (b)  If a Content-Signal = no, you may not collect content for the
#      corresponding use.
# (c)  If the website operator does not include a Content-Signal for a
#      corresponding use, the website operator neither grants nor restricts
#      permission via Content-Signal with respect to the corresponding use.

# The content signals and their meanings are:

# search:   building a search index and providing search results (e.g., returning
#           hyperlinks and short excerpts from your website's contents). Search does not
#           include providing AI-generated search summaries.
# ai-input: inputting content into one or more AI models (e.g., retrieval
#           augmented generation, grounding, or other real-time taking of content for
#           generative AI search answers).
# ai-train: training or fine-tuning AI models.

# ANY RESTRICTIONS EXPRESSED VIA CONTENT SIGNALS ARE EXPRESS RESERVATIONS OF
# RIGHTS UNDER ARTICLE 4 OF THE EUROPEAN UNION DIRECTIVE 2019/790 ON COPYRIGHT
# AND RELATED RIGHTS IN THE DIGITAL SINGLE MARKET.

# --- Default: Allow all crawlers ---
# Fallback group: applies only to crawlers that do not match a more specific
# User-agent group elsewhere in this file (RFC 9309 group selection), so the
# Content-Signal below is not inherited by crawlers that have their own group.
# Signal: search indexing and AI input (grounding/RAG) permitted, AI training
# declined.
User-agent: *
Content-Signal: search=yes,ai-input=yes,ai-train=no
Allow: /

# --- Google: Search, Ads & Business Profile ---
# One shared group: every Google search/ads crawler listed here may fetch the
# entire site.
User-agent: Googlebot
User-agent: Googlebot-Image
User-agent: AdsBot-Google
User-agent: AdsBot-Google-Mobile
User-agent: Mediapartners-Google
Allow: /

# --- Google AI (Google-Extended): crawling allowed, training declined via Content-Signal ---
# A crawler that matches a named group does not read the "User-agent: *" group,
# so the content signal is repeated here; a bare Allow: / would carry no
# ai-train=no reservation at all.
# NOTE(review): Google documents Google-Extended as the control token for
# Gemini training AND grounding. Content-Signal is advisory; if training must
# be refused with certainty, the only robots.txt mechanism is Disallow: /,
# which also gives up grounding - confirm which trade-off is intended.
User-agent: Google-Extended
Content-Signal: search=yes,ai-input=yes,ai-train=no
Allow: /

# --- Bing / Microsoft Ads ---
# Microsoft's search and ads crawlers share one group with full-site access.
User-agent: Bingbot
User-agent: msnbot
User-agent: adidxbot
Allow: /

# --- Facebook / Instagram / Meta Ads ---
# Both Meta crawlers named here may fetch the entire site.
User-agent: facebookexternalhit
User-agent: FacebookBot
Allow: /

# --- AI Assistants & Answer Engines: Allowed for real-time answers/citations ---
# A crawler that matches one of the named groups below does not read the
# "User-agent: *" group (RFC 9309 selects the most specific group), so each
# group repeats the Content-Signal. Without it these agents would receive a
# bare Allow: / with no ai-train=no reservation.
# NOTE(review): GPTBot, ClaudeBot, anthropic-ai, Applebot-Extended and
# cohere-training-data-crawler are described by their vendors (or by their own
# name) as model-training crawlers rather than real-time fetchers. Content-Signal
# is advisory; confirm these tokens belong in the allow list.

# ChatGPT / OpenAI
User-agent: GPTBot
User-agent: ChatGPT-User
User-agent: OAI-SearchBot
Content-Signal: search=yes,ai-input=yes,ai-train=no
Allow: /

# Claude / Anthropic
User-agent: ClaudeBot
User-agent: Claude-Web
User-agent: anthropic-ai
Content-Signal: search=yes,ai-input=yes,ai-train=no
Allow: /

# Perplexity
User-agent: PerplexityBot
User-agent: Perplexity-User
Content-Signal: search=yes,ai-input=yes,ai-train=no
Allow: /

# Apple Intelligence / Siri
User-agent: Applebot
User-agent: Applebot-Extended
Content-Signal: search=yes,ai-input=yes,ai-train=no
Allow: /

# You.com
User-agent: YouBot
Content-Signal: search=yes,ai-input=yes,ai-train=no
Allow: /

# Mistral
User-agent: MistralAI-User
Content-Signal: search=yes,ai-input=yes,ai-train=no
Allow: /

# Cohere
User-agent: cohere-ai
User-agent: cohere-training-data-crawler
Content-Signal: search=yes,ai-input=yes,ai-train=no
Allow: /

# DuckDuckGo AI Assist
User-agent: DuckAssistBot
Content-Signal: search=yes,ai-input=yes,ai-train=no
Allow: /

# Brave Search AI
User-agent: Bravebot
Content-Signal: search=yes,ai-input=yes,ai-train=no
Allow: /

# Microsoft Copilot (uses Bingbot already allowed above, plus:)
User-agent: Microsoft-Copilot
Content-Signal: search=yes,ai-input=yes,ai-train=no
Allow: /

# --- Pure Training Scrapers: Blocked (we allow real-time answer engines, not bulk training) ---
# Single shared group: every agent listed is denied the whole site.
# NOTE(review): Meta describes Meta-ExternalFetcher as a user-initiated fetcher
# rather than a training crawler - verify it is meant to be on this list.
User-agent: Amazonbot
User-agent: Bytespider
User-agent: CCBot
User-agent: meta-externalagent
User-agent: Meta-ExternalFetcher
User-agent: Omgili
User-agent: Diffbot
User-agent: ImagesiftBot
Disallow: /

# --- Other Search Engines ---
# All of the following search crawlers share one group with full-site access.
User-agent: Yandex
User-agent: DuckDuckBot
# Yahoo Search
User-agent: Slurp
# Mojeek (privacy-first)
User-agent: MojeekBot
# Kagi (paid privacy search)
User-agent: KagiBot
Allow: /

# --- Grok / xAI ---
# Both xAI agent tokens may fetch the entire site.
User-agent: xAI-Spider
User-agent: Grok
Allow: /

# --- Social media crawlers (link previews / OpenGraph fetching) ---
# Link-preview fetchers are combined into one group with full-site access.
User-agent: Twitterbot
User-agent: LinkedInBot
User-agent: Slackbot
User-agent: Slackbot-LinkExpanding
User-agent: Discordbot
User-agent: WhatsApp
User-agent: TelegramBot
User-agent: Pinterest
Allow: /

# --- Misc reputable crawlers ---
# Archive and SEO-tool crawlers, grouped together with full-site access.
User-agent: ia_archiver
User-agent: AhrefsBot
User-agent: SemrushBot
Allow: /

# Location of the XML sitemap. Sitemap lines are independent of any User-agent
# group.
Sitemap: https://www.computerrecyclingllc.com/sitemap.xml

# LLM discovery
# https://www.computerrecyclingllc.com/llms.txt
# https://www.computerrecyclingllc.com/.well-known/llms.txt
# (The two URLs above are comments only; robots.txt parsers do not act on them.)

# NOTE(review): "IndexNow-key" is not a directive defined by RFC 9309, so
# parsers are expected to skip this line. The IndexNow protocol documents key
# verification through a key file hosted on the site - confirm that file exists
# and whether this line is still needed.
IndexNow-key: 058dd37c2faf4f25a8e76343e676757c