#
# robots.txt
#
# This file is to prevent the crawling and indexing of certain parts
# of your site by web crawlers and spiders run by sites like Yahoo!
# and Google. By telling these "robots" where not to go on your site,
# you save bandwidth and server resources.
#
# This file will be ignored unless it is at the root of your host:
# Used:    http://example.com/robots.txt
# Ignored: http://example.com/site/robots.txt
#
# For more information about the robots.txt standard, see:
# http://www.robotstxt.org/robotstxt.html
#
# Format note: every directive must sit on its own line. A "#" comments
# out the remainder of the line it appears on, so directives must never
# be appended to a comment line.

# Default group: applies to every crawler that is not matched by a more
# specific User-agent group further down in this file.
User-agent: *
Crawl-delay: 10
# CSS, JS, Images
# These Allow rules are longer (more specific) than the directory-level
# Disallow rules below, so static assets stay crawlable.
Allow: /misc/*.css$
Allow: /misc/*.css?
Allow: /misc/*.js$
Allow: /misc/*.js?
Allow: /misc/*.gif
Allow: /misc/*.jpg
Allow: /misc/*.jpeg
Allow: /misc/*.png
Allow: /modules/*.css$
Allow: /modules/*.css?
Allow: /modules/*.js$
Allow: /modules/*.js?
Allow: /modules/*.gif
Allow: /modules/*.jpg
Allow: /modules/*.jpeg
Allow: /modules/*.png
Allow: /profiles/*.css$
Allow: /profiles/*.css?
Allow: /profiles/*.js$
Allow: /profiles/*.js?
Allow: /profiles/*.gif
Allow: /profiles/*.jpg
Allow: /profiles/*.jpeg
Allow: /profiles/*.png
Allow: /themes/*.css$
Allow: /themes/*.css?
Allow: /themes/*.js$
Allow: /themes/*.js?
Allow: /themes/*.gif
Allow: /themes/*.jpg
Allow: /themes/*.jpeg
Allow: /themes/*.png
# Directories
Disallow: /includes/
Disallow: /misc/
Disallow: /modules/
Disallow: /profiles/
Disallow: /scripts/
Disallow: /themes/
# Files
Disallow: /CHANGELOG.txt
Disallow: /cron.php
Disallow: /INSTALL.mysql.txt
Disallow: /INSTALL.pgsql.txt
Disallow: /INSTALL.sqlite.txt
Disallow: /install.php
Disallow: /INSTALL.txt
Disallow: /LICENSE.txt
Disallow: /MAINTAINERS.txt
Disallow: /update.php
Disallow: /UPGRADE.txt
Disallow: /xmlrpc.php
# Paths (clean URLs)
Disallow: /admin/
Disallow: /comment/reply/
Disallow: /filter/tips/
Disallow: /node/add/
Disallow: /search/
Disallow: /user/register/
Disallow: /user/password/
Disallow: /user/login/
Disallow: /user/logout/
# Paths (no clean URLs)
Disallow: /?q=admin/
Disallow: /?q=comment/reply/
Disallow: /?q=filter/tips/
Disallow: /?q=node/add/
Disallow: /?q=search/
Disallow: /?q=user/password/
Disallow: /?q=user/register/
Disallow: /?q=user/login/
Disallow: /?q=user/logout/
# Site-specific paths.
# NOTE(review): rules are prefix matches, so "/committees" already covers
# "/committees/information_centre"; the second rule is redundant but is
# kept to preserve the original rule set.
Disallow: /committees
Disallow: /committees/information_centre
# Prevent search engines from accidentally flagging content.
Disallow: /flag/
# Prevent indexing of non-existent languages.
Disallow: /es/
Disallow: /pt-br/
Disallow: /it/
Disallow: /zh-hans/
Disallow: /fr/
Disallow: /el/
Disallow: /nl/
Disallow: /de/

# Ultimate AI Block List v1.3 20250310
# https://perishablepress.com/ultimate-ai-block-list/
#
# All User-agent lines below form a single group that shares the one
# "Disallow: /" rule at the end. Do not insert blank lines or other
# rules between them, or the group will be split.
User-agent: .ai
User-agent: Agentic
User-agent: AI Article Writer
User-agent: AI Content Detector
User-agent: AI Dungeon
User-agent: AI Search Engine
User-agent: AI SEO Crawler
User-agent: AI Writer
User-agent: AI21 Labs
User-agent: AI2Bot
User-agent: AIBot
User-agent: AIMatrix
User-agent: AISearchBot
User-agent: AI Training
User-agent: AITraining
User-agent: Alexa
User-agent: Alpha AI
User-agent: AlphaAI
User-agent: Amazon Bedrock
User-agent: Amazon-Kendra
User-agent: Amazon Lex
User-agent: Amazon Comprehend
User-agent: Amazon Sagemaker
User-agent: Amazon Silk
User-agent: Amazon Textract
User-agent: AmazonBot
User-agent: Amelia
User-agent: AndersPinkBot
User-agent: Anthropic
User-agent: AnyPicker
User-agent: Anyword
User-agent: Applebot
User-agent: Aria Browse
User-agent: Articoolo
User-agent: Automated Writer
User-agent: AwarioRssBot
User-agent: AwarioSmartBot
User-agent: BardBot
User-agent: BingAI
User-agent: Bingbot-chat
User-agent: BLEXBot
User-agent: Brave Leo
User-agent: ByteDance
User-agent: Bytespider
User-agent: CatBoost
User-agent: CC-Crawler
User-agent: CCBot
User-agent: ChatGLM
User-agent: Chinchilla
User-agent: Claude
User-agent: claudebot
User-agent: ClearScope
User-agent: Cohere
User-agent: Common Crawl
User-agent: CommonCrawl
User-agent: Content Harmony
User-agent: Content King
User-agent: Content Optimizer
User-agent: Content Samurai
User-agent: ContentAtScale
User-agent: ContentBot
User-agent: Contentedge
User-agent: Conversion AI
User-agent: Copilot
User-agent: CopyAI
User-agent: Copymatic
User-agent: Copyscape
User-agent: Cotoyogi
User-agent: CrawlQ AI
User-agent: Crawlspace
User-agent: Crew AI
User-agent: CrewAI
User-agent: DALL-E
User-agent: DataForSeoBot
User-agent: DataProvider
User-agent: DeepAI
User-agent: DeepL
User-agent: DeepMind
User-agent: DeepSeek
User-agent: Diffbot
User-agent: Doubao AI
User-agent: DuckAssistBot
User-agent: FacebookBot
User-agent: FacebookExternalHit
User-agent: Firecrawl
User-agent: Flyriver
User-agent: Frase AI
User-agent: FriendlyCrawler
User-agent: Gemini
User-agent: Gemma
User-agent: GenAI
User-agent: Google Bard AI
User-agent: Google-CloudVertexBot
User-agent: Google-Extended
User-agent: GoogleOther
User-agent: Goose
User-agent: GPT
User-agent: Grammarly
User-agent: Grendizer
User-agent: Grok
User-agent: GT Bot
User-agent: GTBot
User-agent: Hemingway Editor
User-agent: Hugging Face
User-agent: Hypotenuse AI
User-agent: iaskspider
User-agent: ICC-Crawler
User-agent: ImagesiftBot
User-agent: img2dataset
User-agent: INK Editor
User-agent: INKforall
User-agent: IntelliSeek
User-agent: Inferkit
User-agent: ISSCyberRiskCrawler
User-agent: JasperAI
User-agent: Kafkai
User-agent: Kangaroo
User-agent: Keyword Density AI
User-agent: KomoBot
User-agent: LLaMA
User-agent: magpie-crawler
User-agent: MarketMuse
User-agent: Meltwater
User-agent: Meta AI
User-agent: Meta-AI
User-agent: Meta-External
User-agent: MetaAI
User-agent: MetaTagBot
User-agent: Mistral
User-agent: Narrative
User-agent: NeevaBot
User-agent: Neural Text
User-agent: NeuralSEO
User-agent: OAI-SearchBot
User-agent: Omgili
User-agent: Open AI
User-agent: OpenAI
User-agent: OpenBot
User-agent: OpenText AI
User-agent: Outwrite
User-agent: Page Analyzer AI
User-agent: PanguBot
User-agent: Paperlibot
User-agent: Paraphraser.io
User-agent: PerplexityBot
User-agent: PetalBot
User-agent: Phindbot
User-agent: PiplBot
User-agent: ProWritingAid
User-agent: QuillBot
User-agent: RobotSpider
User-agent: Rytr
User-agent: SaplingAI
User-agent: Scalenut
User-agent: Scraper
User-agent: Scrapy
User-agent: ScriptBook
User-agent: SEO Content Machine
User-agent: SEO Robot
User-agent: Sentibot
User-agent: Sidetrade
User-agent: Simplified AI
User-agent: Skydancer
User-agent: SlickWrite
User-agent: Spin Rewriter
User-agent: Spinbot
User-agent: Stability
User-agent: StableDiffusionBot
User-agent: Sudowrite
User-agent: Surfer AI
User-agent: Text Blaze
User-agent: TextCortex
User-agent: The Knowledge AI
User-agent: Timpibot
User-agent: Vidnami AI
User-agent: Webzio
User-agent: Whisper
User-agent: WordAI
User-agent: Wordtune
User-agent: WormsGTP
User-agent: WPBot
User-agent: Writecream
User-agent: WriterZen
User-agent: Writescope
User-agent: Writesonic
User-agent: xAI
User-agent: xBot
User-agent: YouBot
User-agent: Zero GTP
User-agent: Zerochat
User-agent: Zimm
Disallow: /