# As a condition of accessing this website, you agree to abide by the following
# content signals:

# (a)  If a Content-Signal = yes, you may collect content for the corresponding
#      use.
# (b)  If a Content-Signal = no, you may not collect content for the
#      corresponding use.
# (c)  If the website operator does not include a Content-Signal for a
#      corresponding use, the website operator neither grants nor restricts
#      permission via Content-Signal with respect to the corresponding use.

# The content signals and their meanings are:

# search:   building a search index and providing search results (e.g., returning
#           hyperlinks and short excerpts from your website's contents). Search does not
#           include providing AI-generated search summaries.
# ai-input: inputting content into one or more AI models (e.g., retrieval
#           augmented generation, grounding, or other real-time taking of content for
#           generative AI search answers).
# ai-train: training or fine-tuning AI models.

# ANY RESTRICTIONS EXPRESSED VIA CONTENT SIGNALS ARE EXPRESS RESERVATIONS OF
# RIGHTS UNDER ARTICLE 4 OF THE EUROPEAN UNION DIRECTIVE 2019/790 ON COPYRIGHT
# AND RELATED RIGHTS IN THE DIGITAL SINGLE MARKET.

# BEGIN Cloudflare Managed content

User-agent: *
Content-Signal: search=yes,ai-train=no
Allow: /

User-agent: Amazonbot
Disallow: /

User-agent: Applebot-Extended
Disallow: /

User-agent: Bytespider
Disallow: /

User-agent: CCBot
Disallow: /

User-agent: ClaudeBot
Disallow: /

User-agent: CloudflareBrowserRenderingCrawler
Disallow: /

User-agent: Google-Extended
Disallow: /

User-agent: GPTBot
Disallow: /

User-agent: meta-externalagent
Disallow: /

# END Cloudflare Managed Content

#
# robots.txt
#
# This file is to prevent the crawling and indexing of certain parts
# of your site by web crawlers and spiders run by sites like Yahoo!
# and Google. By telling these "robots" where not to go on your site,
# you save bandwidth and server resources.
#
# This file will be ignored unless it is at the root of your host:
# Used:    http://example.com/robots.txt
# Ignored: http://example.com/site/robots.txt
#
# For more information about the robots.txt standard, see:
# http://www.robotstxt.org/robotstxt.html
#
# Formatting notes for maintainers:
# - Every record must be on its own line; a "#" comments out the rest of
#   the physical line, so joined records are silently ignored.
# - Do not insert blank lines inside the "User-agent: *" group below; some
#   parsers treat a blank line as the end of a group.

# Sitemaps (these records apply to all crawlers and are not part of any
# user-agent group, so they are kept outside the group below).
sitemap: https://www.crash.net/sitemap.xml
sitemap: https://www.crash.net/image-sitemap.xml
sitemap: https://www.crash.net/video-sitemap.xml
sitemap: https://www.crash.net/googlenews.xml

User-agent: *
# CSS, JS, Images
Allow: /core/*.css$
Allow: /core/*.css?
Allow: /core/*.js$
Allow: /core/*.js?
Allow: /core/*.gif
Allow: /core/*.jpg
Allow: /core/*.jpeg
Allow: /core/*.png
Allow: /core/*.svg
Allow: /misc/*.css$
Allow: /misc/*.css?
Allow: /misc/*.js$
Allow: /misc/*.js?
Allow: /misc/*.gif
Allow: /misc/*.jpg
Allow: /misc/*.jpeg
Allow: /misc/*.png
Allow: /modules/*.css$
Allow: /modules/*.css?
Allow: /modules/*.js$
Allow: /modules/*.js?
Allow: /modules/*.gif
Allow: /modules/*.jpg
Allow: /modules/*.jpeg
Allow: /modules/*.png
Allow: /profiles/*.css$
Allow: /profiles/*.css?
Allow: /profiles/*.js$
Allow: /profiles/*.js?
Allow: /profiles/*.gif
Allow: /profiles/*.jpg
Allow: /profiles/*.jpeg
Allow: /profiles/*.png
Allow: /profiles/*.svg
Allow: /themes/*.css$
Allow: /themes/*.css?
Allow: /themes/*.js$
Allow: /themes/*.js?
Allow: /themes/*.gif
Allow: /themes/*.jpg
Allow: /themes/*.jpeg
Allow: /themes/*.png
Allow: /themes/*.svg
# Directories
Disallow: /core/
Disallow: /includes/
Disallow: /misc/
Disallow: /modules/
Disallow: /profiles/
Disallow: /scripts/
Disallow: /themes/
# Files
Disallow: /CHANGELOG.txt
Disallow: /cron.php
Disallow: /INSTALL.mysql.txt
Disallow: /INSTALL.pgsql.txt
Disallow: /INSTALL.sqlite.txt
Disallow: /install.php
Disallow: /INSTALL.txt
Disallow: /LICENSE.txt
Disallow: /MAINTAINERS.txt
Disallow: /update.php
Disallow: /UPGRADE.txt
Disallow: /README.txt
Disallow: /web.config
# Paths (clean URLs)
Disallow: /admin/
Disallow: /comment/*
Disallow: /filter/tips/
Disallow: /node/add/
Disallow: /search/
Disallow: /user/*
Disallow: /media/oembed
Disallow: /*/media/oembed
# Paths (no clean URLs)
Disallow: /index.php/admin/
Disallow: /index.php/comment/*
Disallow: /index.php/filter/tips
Disallow: /index.php/node/add/
Disallow: /index.php/search/
Disallow: /index.php/user/*
Disallow: /index.php/media/oembed
Disallow: /index.php/*/media/oembed
# General Patterns
Disallow: /node/*
Disallow: /node?*
Disallow: /files/*
Disallow: /search/*
Disallow: /content/*
# Site Specific Patterns
# Custom
Disallow: /news/articlePrint.aspx
Disallow: /*/print.html
Disallow: /*/print
Disallow: /*/email.html
Disallow: /contact.html
Disallow: /login.html
Disallow: /register.html
Disallow: /*/tags/
Disallow: /*/newcomment/
Disallow: /*/newComment/
Disallow: /*/have_your_say/
Disallow: /*/have_your_say_author/
Disallow: /*/have_your_say_comments/
Disallow: /*/reportComment/
Disallow: /*/picturearchive/
Disallow: /*/grid_girls/
Disallow: /*/top_grid_girls/
Disallow: /*/kw/
Disallow: /*/igallery/
Disallow: /*/services/
Disallow: /*/radio_archive/
Disallow: /radio.asp
Disallow: /radio.htm
Disallow: /radioplayer/
Disallow: /*/video_archive/
Disallow: /*/audio_archive/
Disallow: /video.asp
Disallow: /video.htm
Disallow: /*/vote/
Disallow: /*/poll/
Disallow: /*/poll_results/
Disallow: /*/shop/
Disallow: /*/picture_search/
Disallow: /*/free_podcasts/
Disallow: /pictures/igallery.aspx
Disallow: /videos/eplayer.aspx
Disallow: /PublicServices/
Disallow: /ScriptResource.axd
Disallow: /WebResource.axd
Disallow: /1037673/*
Disallow: /21100889/*
Disallow: /s3/files/styles/*
Disallow: /countries/*
# Custom ID General Patterns
Disallow: /id/comment/*
Disallow: /id/user/*
Disallow: /id/node/*
Disallow: /id/node?*
Disallow: /id/files/*
Disallow: /id/search/*
Disallow: /id/content/*
Disallow: /id/countries/*
# Championship Patterns
Disallow: /*/large_picture/*
Disallow: /*/youtube/*

# Block ChatGPT
# NOTE(review): this repeats the GPTBot group in the Cloudflare managed
# section above; kept so the block remains if the managed section changes.
User-agent: GPTBot
Disallow: /