Files
privacore-open-source-searc…/urlblacklist.txt.example
2017-10-17 15:43:20 +02:00

116 lines
3.0 KiB
Plaintext

# this file accepts multiple criteria types
# blocks url from being inserted into spiderdb
# one line criteria per line
#
# types:
# - domain
# - file
# - host
# - hostsuffix
# - path
# - regex (pcre)
# - tld
#
# domain example
# ==============
# block all subdomain of example.com domain
# blocks: www.example.com
# blocks: sub.example.com
# blocks: example.com
domain example.com
# block all of example.com except empty subdomain & www
# blocks: sub.example.com
# allows: example.com
# allows: www.example.com
domain example.com allow=,www
# block all of example.com except empty subdomain & www root pages
# blocks: example.com/dir/file.html
# allows: example.com/file.html
# allows: www.example.com/index.html
domain example.com allow=,www allowrootpages
# block all of example.com except empty subdomain & www index page
# blocks: example.com/file.html
# blocks: example.com/index.html
# allows: example.com/?param=value
# allows: www.example.com/
domain example.com allow=,www allowindexpage
# file example
# ============
# block file (exact match)
# blocks: www.example.com/wp-login.php
# blocks: www.example.com/blog/wp-login.php
# allows: www.example.com/blog/wp-login.php5
# allows: www.example.com/blog/nwp-login.php
file wp-login.php
# host example
# ============
# block specific host
# blocks: www.example.com
# allows: sub.example.com
host www.example.com
# block specific host with specific port
# blocks: www.example.com:3001
# allows: www.example.com
# allows: www.example.com:3002
host www.example.com:3001
# block specific host with path (prefix)
# blocks: www.example.com/path/abc
# blocks: www.example.com/path/def
# allows: www.example.com/
# allows: www.example.com/some/
host www.example.com /path/
# block host with suffix
# blocks: sub2.sub1.example.com
# blocks: sub1.example.com
# allows: www.example.com
# allows: notsub1.example.com
hostsuffix sub1.example.com
# param example
# =============
# block specific param (case insensitive)
# blocks: www.example.com/file.html?good=abc&bad=123
# blocks: www.example.com/?bad=123
# allows: www.example.com/?good=abc
param bad
# block specific param (case insensitive) with specific value (case sensitive)
# blocks: www.example.com/file.html?good=abc&bad=xyz
# blocks: www.example.com/file.html?good=abc&BAD=xyz
# allows: www.example.com/file.html?good=abc&bad=abc
# blocks: www.example.com/file.html?good=abc&bad=XYZ
# allows: www.example.com/file.html?good=abc&bad=xyz1
param bad xyz
# path example
# ============
# blocks specific path (prefix)
# blocks: www.example.com/wp-admin
# blocks: www.example.com/wp-admin/login
# allows: www.example.com/en/wp-admin
path /wp-admin
# regex example
# =============
# blocks url by regex
regex * https?://example\.com/(a|b)\.html
# blocks url by regex (specific domain)
regex example.com https?://example\.com/(a|b)\.html
# tld example
# ===========
# block entire country specific domain
# blocks: www.example.my
# blocks: www.example.com.my
# blocks: www.example.sg
tld my,sg