about summary refs log tree commit diff
path: root/data
diff options
context:
space:
mode:
Diffstat (limited to 'data')
-rw-r--r-- data/botPolicies.json 2
-rw-r--r-- data/botPolicies.yaml 2
-rw-r--r-- data/bots/ai-robots-txt.yaml 2
3 files changed, 3 insertions, 3 deletions
diff --git a/data/botPolicies.json b/data/botPolicies.json
index dad04e8..160bbf0 100644
--- a/data/botPolicies.json
+++ b/data/botPolicies.json
@@ -41,7 +41,7 @@
},
{
"name": "generic-browser",
- "user_agent_regex": "Mozilla|Opera\n",
+ "user_agent_regex": "Mozilla|Opera",
"action": "CHALLENGE"
}
],
diff --git a/data/botPolicies.yaml b/data/botPolicies.yaml
index 585be15..51af499 100644
--- a/data/botPolicies.yaml
+++ b/data/botPolicies.yaml
@@ -43,7 +43,7 @@ bots:
# Generic catchall rule
- name: generic-browser
- user_agent_regex: >
+ user_agent_regex: >-
Mozilla|Opera
action: CHALLENGE
diff --git a/data/bots/ai-robots-txt.yaml b/data/bots/ai-robots-txt.yaml
index 19cbe93..ef2790c 100644
--- a/data/bots/ai-robots-txt.yaml
+++ b/data/bots/ai-robots-txt.yaml
@@ -1,4 +1,4 @@
- name: "ai-robots-txt"
- user_agent_regex: >
+ user_agent_regex: >-
AI2Bot|Ai2Bot-Dolma|Amazonbot|anthropic-ai|Applebot|Applebot-Extended|Brightbot 1.0|Bytespider|CCBot|ChatGPT-User|Claude-Web|ClaudeBot|cohere-ai|cohere-training-data-crawler|Crawlspace|Diffbot|DuckAssistBot|FacebookBot|FriendlyCrawler|Google-Extended|GoogleOther|GoogleOther-Image|GoogleOther-Video|GPTBot|iaskspider/2.0|ICC-Crawler|ImagesiftBot|img2dataset|ISSCyberRiskCrawler|Kangaroo Bot|Meta-ExternalAgent|Meta-ExternalFetcher|OAI-SearchBot|omgili|omgilibot|PanguBot|Perplexity-User|PerplexityBot|PetalBot|Scrapy|SemrushBot-OCOB|SemrushBot-SWA|Sidetrade indexer bot|Timpibot|VelenPublicWebCrawler|Webzio-Extended|YouBot
action: DENY
\ No newline at end of file