# robots.txt for folioepress.com
#
# Each directive must sit on its own line: the format is line-oriented, and
# anything following a "#" on the same line is treated as a comment.
# Every crawler gets its own record, separated from the next by a blank line.

# =====================================
# ALLOW MAJOR AI AND LLM BOTS
# =====================================

# OpenAI (ChatGPT)
User-agent: GPTBot
Allow: /

User-agent: ChatGPT-User
Allow: /

# Anthropic (Claude)
User-agent: anthropic-ai
Allow: /

User-agent: Claude-Web
Allow: /

# Perplexity
User-agent: PerplexityBot
Allow: /

# Common Crawl (data source for LLMs)
User-agent: CCBot
Allow: /

# You.com
User-agent: YouBot
Allow: /

# ByteDance (for AI models)
User-agent: Bytespider
Allow: /

# Diffbot (structured data extraction)
User-agent: Diffbot
Allow: /

# Facebook (for Meta AI)
User-agent: FacebookBot
Allow: /

# Google Extended (Bard/Gemini)
User-agent: Google-Extended
Allow: /

# Omgili (content aggregator for AI)
User-agent: omgili
Allow: /

User-agent: omgilibot
Allow: /

# Bingbot (needed for Microsoft Copilot)
User-agent: bingbot
Allow: /

# =====================================
# ALLOW MAJOR SEARCH BOTS
# =====================================

User-agent: Googlebot
Allow: /

User-agent: Googlebot-image
Allow: /

# =====================================
# BLOCK PROBLEMATIC AND ABUSIVE BOTS
# =====================================
# NOTE(review): several names below contain spaces, "+", "/" or "." and are
# not valid product tokens under RFC 9309, so strict parsers may never match
# them. They are kept verbatim to preserve the existing policy - confirm
# whether they can be reduced to the bare product token.

User-agent: grapeshot
Disallow: /

User-agent: proximic
Disallow: /

User-agent: AhrefsBot
Disallow: /

User-agent: YandexBot
Disallow: /

User-agent: BLEXBot
Disallow: /

User-agent: MJ12bot
Disallow: /

User-agent: dotbot
Disallow: /

User-agent: 360Spider
Disallow: /

User-agent: HaoSouSpider
Disallow: /

User-agent: 360Spider-Image
Disallow: /

User-agent: 360Spider-Video
Disallow: /

User-agent: adbeat_bot
Disallow: /

User-agent: Yandex
Disallow: /

User-agent: Baiduspider
Disallow: /

User-agent: baiduspider
Disallow: /

User-agent: Baiduspider+
Disallow: /

User-agent: sogou spider
Disallow: /

User-agent: Sogou web spider
Disallow: /

User-agent: Nutch
Disallow: /

User-agent: Dow Jones Searchbot
Disallow: /

User-agent: linkdex
Disallow: /

User-agent: linkdex.com
Disallow: /

User-agent: linkdex.com/v2.0
Disallow: /

User-agent: Flamingo_SearchEngine+(+http://www.flamingosearch.com/bot)
Disallow: /

User-agent: Flamingo_SearchEngine
Disallow: /

User-agent: Spinn3r
Disallow: /

User-agent: Owlin Bot v. 3.0
Disallow: /

User-agent: Owlin bot v3
Disallow: /

User-agent: Owlin Bot
Disallow: /

User-agent: Owlin
Disallow: /

User-agent: MegaIndex.ru
Disallow: /

User-agent: MegaIndex.ru/2.0
Disallow: /

User-agent: SemrushBot
Disallow: /

User-agent: panscient.com
Disallow: /

User-agent: DomainAppender
Disallow: /

User-agent: wotbox
Disallow: /

User-agent: OrangeBot
Disallow: /

User-agent: spbot
Disallow: /

User-agent: magpie-crawler
Disallow: /

User-agent: Cliqzbot
Disallow: /

User-agent: IstellaBot
Disallow: /

User-agent: BUbiNG
Disallow: /

User-agent: ZumBot
Disallow: /

User-agent: Aboundexbot
Disallow: /

User-agent: yoozBot
Disallow: /

User-agent: Go-http-client
Disallow: /

User-agent: ltx71
Disallow: /

User-agent: SiteExplorer
Disallow: /

User-agent: DomainCrawler
Disallow: /

User-agent: SEOkicks-Robot
Disallow: /