| 12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788 |
- - # Pathological bots to deny
- # This correlates to data/bots/_deny-pathological.yaml in the source tree
- # https://github.com/TecharoHQ/anubis/blob/main/data/bots/_deny-pathological.yaml
- import: (data)/bots/_deny-pathological.yaml
- - import: (data)/bots/aggressive-brazilian-scrapers.yaml
- # Aggressively block AI/LLM related bots/agents by default
- - import: (data)/meta/ai-block-aggressive.yaml
- # Consider replacing the aggressive AI policy with more selective policies:
- # - import: (data)/meta/ai-block-moderate.yaml
- # - import: (data)/meta/ai-block-permissive.yaml
- # Search engine crawlers to allow, defaults to:
- # - Google (so they don't try to bypass Anubis)
- # - Apple
- # - Bing
- # - DuckDuckGo
- # - Qwant
- # - The Internet Archive
- # - Kagi
- # - Marginalia
- # - Mojeek
- - import: (data)/crawlers/_allow-good.yaml
- # Challenge Firefox AI previews
- - import: (data)/clients/x-firefox-ai.yaml
- # Allow common "keeping the internet working" routes (well-known, favicon, robots.txt)
- - import: (data)/common/keep-internet-working.yaml
- # # Punish any bot with "bot" in the user-agent string
- # # This is known to have a high false-positive rate, use at your own risk
- # - name: generic-bot-catchall
- # user_agent_regex: (?i:bot|crawler)
- # action: CHALLENGE
- # challenge:
- # difficulty: 16 # impossible
- # algorithm: slow # intentionally waste CPU cycles and time
- # Requires a subscription to Thoth to use, see
- # https://anubis.techaro.lol/docs/admin/thoth#geoip-based-filtering
- - name: countries-with-aggressive-scrapers
- action: WEIGH
- geoip:
- countries:
- - BR
- - CN
- weight:
- adjust: 10
- # Requires a subscription to Thoth to use, see
- # https://anubis.techaro.lol/docs/admin/thoth#asn-based-filtering
- - name: aggressive-asns-without-functional-abuse-contact
- action: WEIGH
- asns:
- match:
- - 13335 # Cloudflare
- - 136907 # Huawei Cloud
- - 45102 # Alibaba Cloud
- weight:
- adjust: 10
- # ## System load based checks.
- # # If the system is under high load, add weight.
- # - name: high-load-average
- # action: WEIGH
- # expression: load_1m >= 10.0 # make sure to end the load comparison in a .0
- # weight:
- # adjust: 20
- ## If your backend service is running on the same operating system as Anubis,
- ## you can uncomment this rule to make the challenge easier when the system is
- ## under low load.
- ##
- ## If it is not, remove weight.
- # - name: low-load-average
- # action: WEIGH
- # expression: load_15m <= 4.0 # make sure to end the load comparison in a .0
- # weight:
- # adjust: -10
- # Generic catchall rule
- - name: generic-browser
- user_agent_regex: >-
- Mozilla|Opera
- action: WEIGH
- weight:
- adjust: 10
|