forked from skroll/privoxy-adblock
-
Notifications
You must be signed in to change notification settings - Fork 0
/
privoxy-adblock.sh
executable file
·208 lines (182 loc) · 7.7 KB
/
privoxy-adblock.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
#!/bin/sh
# sed program used for all list conversions; set the SEDCMD environment
# variable to substitute another implementation.
sedcmd=${SEDCMD:-sed}
# Privoxy configuration directory used when -p is not given (see main).
defaultprivoxydir="/usr/local/etc/privoxy"
# Adblock Plus list that main always places first in the list of URLs.
defaulturl="https://easylist-downloads.adblockplus.org/easylist.txt"
#=== FUNCTION ================================================================
# NAME: cleanup
# DESCRIPTION: trap handler; disarms the INT/TERM/EXIT traps, deletes the pid
#              file named by the global ${pidfile} when it is a regular file,
#              then terminates the shell
# PARAMETERS: none (reads the global variable pidfile)
# RETURNS: never returns; ends the shell with a bare `exit`
#===============================================================================
cleanup() {
  # Disarm the handlers first so the exit below cannot re-enter this function.
  trap - INT TERM EXIT
  test -f "${pidfile}" && rm "${pidfile}"
  exit
}
#=== FUNCTION ================================================================
# NAME: isrunning
# DESCRIPTION: tells whether the pid recorded in a pid file belongs to a live
#              process whose command line mentions this script's name
# PARAMETERS: pid file path
# RETURNS: 0 if such a process exists; 1 if the pid file is missing, empty,
#          not a plain number, or the process is gone / is another program
# NOTE: stores its argument in the global ${pidfile}, as it always did
#===============================================================================
isrunning() {
  pidfile="${1}"
  [ -f "${pidfile}" ] || return 1 # pid file is nonexistent
  procpid=$(cat "${pidfile}")
  case "${procpid}" in
    '' | *[!0-9]*) return 1 ;; # no pid, or garbage that ps would reject
  esac
  # Ask ps for the full command line (-o args=). The default column holds
  # only the command name, which procps truncates to 15 characters and which
  # is the interpreter's name when the script is started as "sh script".
  # grep -F keeps the dots in the script name from acting as wildcards.
  if ps -p "${procpid}" -o args= 2>/dev/null \
    | grep -F -q -- "$(basename "${0}")"; then
    return 0
  fi
  return 1
}
#=== FUNCTION ================================================================
# NAME: createpidfile
# DESCRIPTION: atomic creation of the pid file used as a lock. When the file
#              already belongs to a dead process it is removed and the script
#              is started again.
# PARAMETERS: the pid to put in the file, the filename to use as a lock;
#             any further parameters are handed to the relaunched script
# RETURNS: 0 when this process owns the lock. Otherwise the shell exits:
#          1 if the file cannot be created or another instance owns it,
#          or with the relaunched script's status after a stale lock.
#===============================================================================
createpidfile() {
  mypid=${1}
  pidfile=${2}
  # Drop the two fixed parameters so that "$@" holds only what should be
  # forwarded if the script has to be relaunched.
  if [ "$#" -ge 2 ]; then shift 2; else set --; fi

  # With noclobber the redirection fails instead of overwriting an existing
  # file, which makes creation the atomic "take the lock" step. The expected
  # failure message is discarded.
  (set -o noclobber; echo "${mypid}" > "${pidfile}") 2>/dev/null
  if [ ! -f "${pidfile}" ]; then
    echo "$(basename "${0}"): cannot create pid file ${pidfile}" >&2
    exit 1
  fi

  procpid=$(cat "${pidfile}")
  # Compare as strings: a numeric test on an empty or corrupt pid file is an
  # error, and an erroring test must not be mistaken for "the lock is mine".
  [ "${mypid}" = "${procpid}" ] && return 0

  # Somebody else's pid is in the lock file. Is that process still running?
  if isrunning "${pidfile}"; then
    echo "$(basename "${0}") is already running"
    exit 1
  fi

  # No. Remove the stale pid file, relaunch, and pass on the child's status.
  rm -f -- "${pidfile}"
  "$0" "$@"
  exit
}
#=== FUNCTION ================================================================
# NAME: pidfilename
# DESCRIPTION: derives the pid file path from the script's name (without a
#              trailing .sh): under /var/run for root, under /tmp otherwise
# PARAMETERS: none
# RETURNS: prints the path on stdout
#===============================================================================
pidfilename() {
  scriptname=$(basename "$0" .sh)
  case "$(whoami)" in
    root)
      echo "/var/run/${scriptname}.pid"
      ;;
    *)
      echo "/tmp/${scriptname}.pid"
      ;;
  esac
}
#=== FUNCTION ================================================================
# NAME: doconvert
# DESCRIPTION: for every url: download the Adblock Plus list, convert it into
#              a privoxy action file and a filter file, and copy both into
#              the privoxy configuration directory
# PARAMETERS: privoxy conf dir, whitespace separated list of urls
# GLOBALS: tempdir (working directory for downloads and generated files),
#          sedcmd (sed program to run)
# RETURNS: none; exits 255 when neither curl nor wget is available. A url
#          whose download fails or that is not an Adblock Plus list is
#          reported and skipped.
#===============================================================================
doconvert() {
  privoxydir=$1
  urls=$2
  # ${urls} is intentionally unquoted: it is split into one word per url.
  for url in ${urls}
  do
    file="${tempdir}/$(basename "${url}")"
    actionfile="${file%\.*}.script.action"
    filterfile="${file%\.*}.script.filter"
    list="$(basename "${file%\.*}")"

    # clean up files left over from an earlier run
    rm -f -- "${file}" "${actionfile}" "${filterfile}"

    echo "downloading ${url} ..."
    # NOTE(review): -k / --no-check-certificate switch off TLS certificate
    # verification, so the downloaded rules are not authenticated. Kept for
    # compatibility with hosts lacking a CA bundle; consider removing.
    if command -v curl >/dev/null; then
      # -f turns HTTP errors into a non-zero exit status instead of saving
      # the server's error page as if it were the list.
      curl -f -k "${url}" > "${file}"
      dlstatus=$?
    elif command -v wget >/dev/null; then
      wget -t 3 --no-check-certificate -O "${file}" "${url}"
      dlstatus=$?
    else
      echo "No curl or wget" 1>&2
      exit 255
    fi

    # A failed or interrupted transfer can still leave a partial file that
    # passes the header check below; never install it.
    if [ "${dlstatus}" -ne 0 ]; then
      echo "Download of ${url} failed (exit status ${dlstatus}). Skipped" 1>&2
      continue
    fi

    if ! grep -q -E '^.*\[Adblock.*\].*$' "${file}"; then
      echo "The list recieved from ${url} isn't an AdblockPlus list. Skipped"
      continue
    fi

    echo "Creating actionfile for ${list} ..."
    printf '{ +block{%s} }\n' "${list}" > "${actionfile}"
    # Blocking rules: drop comments, the header line, exceptions (@@), rules
    # with options ($) and element rules (#); escape the rest for privoxy.
    $sedcmd '/^!.*/d;1,1 d;/^@@.*/d;/\$.*/d;/#/d;s/\./\\./g;s/\?/\\?/g;s/\*/.*/g;s/(/\\(/g;s/)/\\)/g;s/\[/\\[/g;s/\]/\\]/g;s/\^/[\/\&:\?=_]/g;s/^||/\./g;s/^|/^/g;s/|$/\$/g;/|/d' "${file}" >> "${actionfile}"

    echo "... creating filterfile for ${list} ..."
    echo "FILTER: ${list} Tag filter of ${list}" > "${filterfile}"
    # Element rules: keep only lines starting with # and rewrite them into
    # s@...@@g substitutions for the filter file.
    $sedcmd '/^#/!d;s/^##//g;s/^#\(.*\)\[.*\]\[.*\]*/s@<([a-zA-Z0-9]+)\\s+.*id=.?\1.*>.*<\/\\1>@@g/g;s/^#\(.*\)/s@<([a-zA-Z0-9]+)\\s+.*id=.?\1.*>.*<\/\\1>@@g/g;s/^\.\(.*\)/s@<([a-zA-Z0-9]+)\\s+.*class=.?\1.*>.*<\/\\1>@@g/g;s/^a\[\(.*\)\]/s@<a.*\1.*>.*<\/a>@@g/g;s/^\([a-zA-Z0-9]*\)\.\(.*\)\[.*\]\[.*\]*/s@<\1.*class=.?\2.*>.*<\/\1>@@g/g;s/^\([a-zA-Z0-9]*\)#\(.*\):.*[:[^:]]*[^:]*/s@<\1.*id=.?\2.*>.*<\/\1>@@g/g;s/^\([a-zA-Z0-9]*\)#\(.*\)/s@<\1.*id=.?\2.*>.*<\/\1>@@g/g;s/^\[\([a-zA-Z]*\).=\(.*\)\]/s@\1^=\2>@@g/g;s/\^/[\/\&:\?=_]/g;s/\.\([a-zA-Z0-9]\)/\\.\1/g' "${file}" >> "${filterfile}"

    echo "... filterfile created - adding filterfile to actionfile ..."
    echo "{ +filter{${list}} }" >> "${actionfile}"
    echo "*" >> "${actionfile}"
    echo "... filterfile added ..."

    echo "... creating and adding whitlist for urls ..."
    echo "{ -block }" >> "${actionfile}"
    # Exception rules (@@) without options become unblock patterns.
    $sedcmd '/^@@.*/!d;s/^@@//g;/\$.*/d;/#/d;s/\./\\./g;s/\?/\\?/g;s/\*/.*/g;s/(/\\(/g;s/)/\\)/g;s/\[/\\[/g;s/\]/\\]/g;s/\^/[\/\&:\?=_]/g;s/^||/\./g;s/^|/^/g;s/|$/\$/g;/|/d' "${file}" >> "${actionfile}"

    echo "... created and added whitelist - creating and adding image handler ..."
    echo "{ -block +handle-as-image }" >> "${actionfile}"
    # Exception rules carrying an image option are unblocked and marked as
    # images.
    $sedcmd '/^@@.*/!d;s/^@@//g;/\$.*image.*/!d;s/\$.*image.*//g;/#/d;s/\./\\./g;s/\?/\\?/g;s/\*/.*/g;s/(/\\(/g;s/)/\\)/g;s/\[/\\[/g;s/\]/\\]/g;s/\^/[\/\&:\?=_]/g;s/^||/\./g;s/^|/^/g;s/|$/\$/g;/|/d' "${file}" >> "${actionfile}"
    echo "... created and added image handler ..."
    echo "... created actionfile for ${list}."

    actionfiledest="${privoxydir}/$(basename "${actionfile}")"
    echo "... copying ${actionfile} to ${actionfiledest}"
    cp "${actionfile}" "${actionfiledest}" \
      || echo "Failed to copy ${actionfile} to ${actionfiledest}" 1>&2

    filterfiledest="${privoxydir}/$(basename "${filterfile}")"
    echo "... copying ${filterfile} to ${filterfiledest}"
    cp "${filterfile}" "${filterfiledest}" \
      || echo "Failed to copy ${filterfile} to ${filterfiledest}" 1>&2
  done
}
#=== FUNCTION ================================================================
# NAME: usage
# DESCRIPTION: prints the command synopsis on stdout and ends the script
# PARAMETERS: none
# RETURNS: never returns; exits with status 1
#===============================================================================
usage() {
  # The -d (debug) switch is currently disabled, so it is not advertised:
  # Usage: ${0} [-d] [-p <privoxy config dir>] [-u <url1>] [-u <url2>]...
  printf '%s\n' "Usage: ${0} [-p <privoxy config dir>] [-u <url1>] [-u <url2>]..."
  exit 1
}
#=== FUNCTION ================================================================
# NAME: main
# DESCRIPTION: main script entry point: takes the pid-file lock, creates a
#              private working directory, parses the options and runs the
#              conversion
# PARAMETERS: the script's command line arguments
#             -p <dir>  privoxy configuration directory
#             -u <url>  additional list url (may be repeated)
# RETURNS: status of doconvert; exits 1 when another instance is running, on
#          usage errors, or when no working directory can be created
#===============================================================================
main() {
  pidfile="$(pidfilename)"
  isrunning "${pidfile}" && {
    echo "$(basename "${0}") is already running"
    exit 1
  }
  # The script's own arguments are handed over as well, so they are available
  # to createpidfile should it have to relaunch the script.
  createpidfile $$ "${pidfile}" "$@"

  # Install the handler before creating the directory so that every exit path
  # from here on removes both the working directory and the pid file.
  tempdir=""
  trap '[ -n "${tempdir}" ] && rm -rf -- "${tempdir}"; cleanup' INT TERM EXIT

  # Work in a private directory rather than directly in the shared temp dir,
  # where the predictable download names could be pre-created by other users.
  tempdir="$(mktemp -d -t privoxy-adblock.XXXXXX)" || {
    echo "Unable to create a temporary directory" >&2
    exit 1
  }

  # debug="false"
  # trap 'logger -t $0 -i -- $USER : $BASH_COMMAND' ERR #log errors regardless
  privoxydir=$defaultprivoxydir
  urls="${defaulturl}"
  # The leading ':' selects silent error reporting, which is what makes the
  # ':' (missing argument) case below reachable. Add 'd' to the option string
  # again when the debug switch is re-enabled.
  while getopts ":p:u:" opt; do
    case "${opt}" in
      p)
        privoxydir=${OPTARG}
        ;;
      u)
        urls=$(printf '%s\n%s' "${urls}" "${OPTARG}")
        ;;
      # d)
      # debug="true"
      # ;;
      :)
        echo "Option -${OPTARG} requires an argument." >&2
        usage
        ;;
      \?)
        echo "Unknown option -${OPTARG}." >&2
        usage
        ;;
      *)
        usage
        ;;
    esac
  done
  # [ "${debug}" = "true" ] && trap 'logger -t $0 -i -- $USER : $BASH_COMMAND' DEBUG #syslog everything if we're debugging
  [ ! -d "${privoxydir}" ] && usage
  [ "${urls}" = "" ] && usage
  # perform the operation
  doconvert "$privoxydir" "$urls"
}
# Script entry point: pass every command line argument on to main.
main "$@"
# Reached only when main returns; the script then always reports success,
# whatever status main returned.
exit 0