# 长风低空 robots.txt
# Site: https://cfdkjj.com/
# Last updated: 2026-05-27
#
# How to read this file:
#   * One directive per line. A "#" starts a comment that runs to end of line,
#     so directives must never share a line with a leading "#".
#   * A crawler obeys ONLY the single most specific User-agent group that
#     matches it. Rules in the "*" group are NOT inherited by named groups,
#     so every group below repeats the full list of private paths.
#   * Within a group the longest matching path wins, so "Disallow: /admin/"
#     overrides the broader "Allow: /".
#   * User-agent lines of one group are kept contiguous (no blank lines
#     between them) because a blank line may be read as a group separator.
#
# NOTE(review): /scripts/ is blocked for every crawler, matching the original
# fallback group. Confirm it holds no front-end files needed for rendering.

# ========== Traditional search engines (whole site allowed, except admin/API/private paths) ==========
# Googlebot         - Google
# Baiduspider       - Baidu (main engine for the Chinese market)
# Bingbot           - Bing (also an index source for ChatGPT/Copilot)
# Sogou web spider  - Sogou
# 360Spider         - 360
# YisouSpider       - Shenma (Chinese mobile search)
User-agent: Googlebot
User-agent: Baiduspider
User-agent: Bingbot
User-agent: Sogou web spider
User-agent: 360Spider
User-agent: YisouSpider
Allow: /
Disallow: /admin/
Disallow: /api/
Disallow: /backup/
Disallow: /infra/
Disallow: /scripts/
Disallow: /seed/
Disallow: /.git/
Disallow: /node_modules/

# Image crawlers for Google and Baidu: /assets/ is allowed explicitly.
User-agent: Googlebot-Image
User-agent: Baiduspider-image
Allow: /assets/
Allow: /
Disallow: /admin/
Disallow: /api/
Disallow: /backup/
Disallow: /infra/
Disallow: /scripts/
Disallow: /seed/
Disallow: /.git/
Disallow: /node_modules/

# ========== LLM / AI engine crawlers (explicitly allowed so AI can cite our content) ==========
# GPTBot, OAI-SearchBot, ChatGPT-User      - OpenAI / ChatGPT retrieval
# ClaudeBot, Claude-Web, anthropic-ai      - Anthropic Claude
# Google-Extended                          - Google AI training (separate from Googlebot)
# PerplexityBot, Perplexity-User           - Perplexity
# Bytespider                               - ByteDance Doubao / Douyin search
# Applebot, Applebot-Extended              - Apple Intelligence
# Meta-ExternalAgent, FacebookBot          - Meta / Llama
# CCBot                                    - Common Crawl (open dataset used by multiple LLMs)
# MistralAI-User                           - Mistral
User-agent: GPTBot
User-agent: OAI-SearchBot
User-agent: ChatGPT-User
User-agent: ClaudeBot
User-agent: Claude-Web
User-agent: anthropic-ai
User-agent: Google-Extended
User-agent: PerplexityBot
User-agent: Perplexity-User
User-agent: Bytespider
User-agent: Applebot
User-agent: Applebot-Extended
User-agent: Meta-ExternalAgent
User-agent: FacebookBot
User-agent: CCBot
User-agent: MistralAI-User
Allow: /
Disallow: /admin/
Disallow: /api/
Disallow: /backup/
Disallow: /infra/
Disallow: /scripts/
Disallow: /seed/
Disallow: /.git/
Disallow: /node_modules/

# ========== Fallback rules (any crawler not named above) ==========
User-agent: *
Allow: /
Disallow: /admin/
Disallow: /api/
Disallow: /backup/
Disallow: /infra/
Disallow: /scripts/
Disallow: /seed/
Disallow: /.git/
Disallow: /node_modules/
# Crawl-delay is a non-standard extension; crawlers that do not support it ignore it.
Crawl-delay: 1

# ========== Sitemap & resources ==========
Sitemap: https://cfdkjj.com/sitemap.xml
# NOTE(review): "Host" is a non-standard directive; value kept unchanged from
# the original. Confirm whether any targeted crawler still reads it.
Host: https://cfdkjj.com