From 480647f2e212f0405d4e830401f2a42fef16745c Mon Sep 17 00:00:00 2001 From: TheErrorExe <161362055+TheErrorExe@users.noreply.github.com> Date: Thu, 26 Jun 2025 18:21:29 +0000 Subject: [PATCH] add robots.txt --- robots.txt | 87 ++++++++++++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 87 insertions(+) create mode 100644 robots.txt diff --git a/robots.txt b/robots.txt new file mode 100644 index 0000000..e494f21 --- /dev/null +++ b/robots.txt @@ -0,0 +1,87 @@ +# Stop search engine scrapers from downloading videos +User-agent: * +Disallow: /watch +Disallow: /channel +Disallow: /sigma/videos/* + +# Stop AI scrapers +User-agent: AI2Bot +User-agent: Ai2Bot-Dolma +User-agent: aiHitBot +User-agent: Amazonbot +User-agent: Andibot +User-agent: anthropic-ai +User-agent: Applebot +User-agent: Applebot-Extended +User-agent: bedrockbot +User-agent: Brightbot 1.0 +User-agent: Bytespider +User-agent: CCBot +User-agent: ChatGPT-User +User-agent: Claude-SearchBot +User-agent: Claude-User +User-agent: Claude-Web +User-agent: ClaudeBot +User-agent: cohere-ai +User-agent: cohere-training-data-crawler +User-agent: Cotoyogi +User-agent: Crawlspace +User-agent: Diffbot +User-agent: DuckAssistBot +User-agent: EchoboxBot +User-agent: FacebookBot +User-agent: Factset_spyderbot +User-agent: FirecrawlAgent +User-agent: FriendlyCrawler +User-agent: Google-CloudVertexBot +User-agent: Google-Extended +User-agent: GoogleOther +User-agent: GoogleOther-Image +User-agent: GoogleOther-Video +User-agent: GPTBot +User-agent: iaskspider/2.0 +User-agent: ICC-Crawler +User-agent: ImagesiftBot +User-agent: img2dataset +User-agent: ISSCyberRiskCrawler +User-agent: Kangaroo Bot +User-agent: meta-externalagent +User-agent: Meta-ExternalAgent +User-agent: meta-externalfetcher +User-agent: Meta-ExternalFetcher +User-agent: MistralAI-User/1.0 +User-agent: MyCentralAIScraperBot +User-agent: NovaAct +User-agent: OAI-SearchBot +User-agent: omgili +User-agent: omgilibot +User-agent: Operator +User-agent: PanguBot +User-agent: Panscient +User-agent: panscient.com +User-agent: Perplexity-User +User-agent: PerplexityBot +User-agent: PetalBot +User-agent: PhindBot +User-agent: Poseidon Research Crawler +User-agent: QualifiedBot +User-agent: QuillBot +User-agent: quillbot.com +User-agent: SBIntuitionsBot +User-agent: Scrapy +User-agent: SemrushBot +User-agent: SemrushBot-BA +User-agent: SemrushBot-CT +User-agent: SemrushBot-OCOB +User-agent: SemrushBot-SI +User-agent: SemrushBot-SWA +User-agent: Sidetrade indexer bot +User-agent: TikTokSpider +User-agent: Timpibot +User-agent: VelenPublicWebCrawler +User-agent: Webzio-Extended +User-agent: wpbot +User-agent: YandexAdditional +User-agent: YandexAdditionalBot +User-agent: YouBot +Disallow: /