proxy.pac.test/build.sh

274 lines
8.1 KiB
Bash
Raw Normal View History

2024-10-07 01:30:54 +00:00
#!/usr/bin/env bash
# Version gate: abort early unless the running interpreter is Bash >= 4.3.
# The major/minor numbers are split out of BASH_VERSION ("0.0.0" when unset).
IFS='.' read -r __major __minor _ <<< "${BASH_VERSION:-0.0.0}"
if test "$__major" -lt 4 || { test "$__major" -eq 4 && test "$__minor" -lt 3; }; then
  {
    printf '%s\n' "Error: this script requires Bash version 4.3 or higher. Your current version is ${BASH_VERSION:-unknown}."
    printf '\n'
    # Show the command being run, then its actual output.
    printf '%s\n' "$BASH --version"
    "$BASH" --version
  } >&2
  exit 1
fi
2024-10-08 02:08:09 +00:00
# Strict mode: stop on errors, on unset variables and on failures anywhere in
# a pipeline. nullglob makes unmatched globs expand to nothing, so the
# "for file in *-rules-*.txt" loops further down simply do not run when no
# such file exists.
set -o errexit -o nounset -o pipefail
shopt -s nullglob

# Work from the directory that contains this script; all rule files and the
# generated proxy.pac are addressed relative to it.
cd -- "$(dirname -- "$0")"

# Local file name -> download URL for the rule lists fetched on demand.
declare -A files=(
  [auto-proxy.txt]='https://raw.githubusercontent.com/gfwlist/gfwlist/master/gfwlist.txt'
  [ipv4-rules-direct.txt]='https://gaoyifan.github.io/china-operator-ip/china.txt'
  [ipv6-rules-direct.txt]='https://gaoyifan.github.io/china-operator-ip/china6.txt'
)

# Paths the cleanup trap removes if the script exits while they are listed.
declare -a files_to_be_deleted=()
2024-10-07 01:30:54 +00:00
#######################################
# Trap handler: delete every path currently listed in files_to_be_deleted,
# then exit with the status that was current when the handler was entered.
# Globals:   files_to_be_deleted (read)
# Arguments: none
# Outputs:   progress and warnings on stderr (the whole body is redirected)
# Returns:   never returns; exits with the saved status
#######################################
function cleanup() {
  local retval="$?"
  local file
  # The ${arr[@]+...} form keeps an empty list from raising "unbound
  # variable" under `set -u` on Bash 4.3, which the version gate still allows.
  for file in ${files_to_be_deleted[@]+"${files_to_be_deleted[@]}"}; do
    # -L also catches dangling symlinks, for which -e is false.
    if [[ -e "${file}" || -L "${file}" ]]; then
      echo "Remove $file"
      # A failed removal must neither stop the remaining removals nor
      # replace the exit status being propagated.
      rm -v -- "${file}" || echo "Warning: failed to remove $file"
    fi
  done
  exit "$retval"
} >&2
# Run cleanup on normal exit, on a failing command and on Ctrl-C.
trap cleanup EXIT ERR SIGINT

# Download every rule file from `files` that is not present yet. While a
# download is in flight, both the target and its ".tmp" staging file are
# registered for removal so an aborted run leaves nothing half-written.
for f in "${!files[@]}"; do
  url="${files[$f]}"
  if [[ -e "$f" ]]; then
    continue
  fi
  files_to_be_deleted=("$f" "${f}.tmp")
  if command -v wget &>/dev/null; then
    wget -O "${f}.tmp" "$url"
  elif command -v curl &>/dev/null; then
    # --fail: exit non-zero on HTTP errors instead of saving the error page
    # as a rule file; --location: follow redirects, as wget does by default.
    curl --fail --location --output "${f}.tmp" "$url"
  else
    echo "Error: please install wget or curl." >&2
    exit 1
  fi
  if [[ "$f" = auto-proxy.txt ]]; then
    # This list is stored decoded: the download is run through base64 -d.
    base64 -d <"${f}.tmp" >"$f"
    # The staging file is not consumed by the decode, so drop it explicitly.
    rm -f -- "${f}.tmp"
  else
    mv -- "${f}.tmp" "$f"
  fi
done
# All downloads succeeded: keep the files.
files_to_be_deleted=()
2024-10-07 01:30:54 +00:00
#######################################
# Print a domain followed by each of its parent suffixes, one per line,
# e.g. "a.b.c" -> "a.b.c", "b.c", "c". Prints nothing for an empty argument.
# Arguments: $1 - domain name
# Outputs:   the suffix chain on stdout
#######################################
domain_segments() {
  local remaining="$1"
  until [[ -z "$remaining" ]]; do
    echo "$remaining"
    case "$remaining" in
      *.*)
        # Drop the leftmost label and go round again.
        remaining="${remaining#*.}"
        ;;
      *)
        # No dot left: that was the last suffix.
        return 0
        ;;
    esac
  done
}
# Self-test for domain_segments: the function prints one suffix per line, so
# the expected value is newline-separated, and the script must abort when the
# actual output DIFFERS from it.
actual="$(domain_segments foo.bar.example.com)"
expected=$'foo.bar.example.com\nbar.example.com\nexample.com\ncom'
if [[ "$actual" != "$expected" ]]; then
  echo "Fail: test for function domain_segments"
  echo " expected: $expected"
  echo " actual: $actual"
  exit 1
fi >&2
#######################################
# Expand an IPv6 address to its full form: eight colon-separated groups of
# four lowercase hex digits. A "::" is replaced by as many zero groups as are
# needed to reach eight; addresses without "::" are zero-padded group by
# group as well, so callers can rely on fixed-width output either way.
# Arguments: $1 - IPv6 address without prefix length (e.g. "2001:db8::")
# Outputs:   the expanded address on stdout (empty line for empty input)
#######################################
expand_ipv6() {
  local ipv6="$1"
  local full_ipv6="" segment
  local -a left_segments=() right_segments=()
  local -i num_missing=0 i

  if [[ "$ipv6" == *"::"* ]]; then
    # Split the parts on either side of "::" into groups; `read -a` splits
    # on ":" without exposing the text to pathname expansion.
    IFS=: read -r -a left_segments <<< "${ipv6%%::*}"
    IFS=: read -r -a right_segments <<< "${ipv6##*::}"
    num_missing=$(( 8 - ${#left_segments[@]} - ${#right_segments[@]} ))
  else
    IFS=: read -r -a left_segments <<< "$ipv6"
  fi

  # ${arr[@]+...} keeps empty arrays safe under `set -u` on Bash 4.3.
  for segment in ${left_segments[@]+"${left_segments[@]}"}; do
    printf -v segment '%04x' "0x${segment}"
    full_ipv6+="${segment}:"
  done
  for ((i = 0; i < num_missing; i++)); do
    full_ipv6+="0000:"
  done
  for segment in ${right_segments[@]+"${right_segments[@]}"}; do
    printf -v segment '%04x' "0x${segment}"
    full_ipv6+="${segment}:"
  done

  # Drop the trailing separator added by the loops above.
  echo "${full_ipv6%:}"
}
#######################################
# Render the PAC file: copy the template and fill its marked sections with
# rules collected from the rule files in the current directory.
#
# Inputs read from the current directory:
#   domain-rules-<rule>.txt  one domain per line; "#" starts a comment
#   auto-proxy*.txt          AutoProxy-style list ("||dom", "@@||dom", ...)
#   ipv4-rules-<rule>.txt    IPv4 networks "a.b.c.d/len", "#" comments
#   ipv6-rules-<rule>.txt    IPv6 networks "addr/len", "#" comments
#   domain-regexp*.txt       "[rule]" section headers followed by regexps
# The template is cut at lines ending in " begin of ..." / " end of ..."
# markers for the sections: ipv4 networks, ipv6 networks, proxy rules,
# regexp rules. The rule names blocked/direct/proxy are emitted bare; any
# other rule name is emitted as a quoted string.
#
# Arguments: $1 - path to the JavaScript template
# Outputs:   generated PAC on stdout; progress/diagnostics on stderr
#######################################
generate_pac() {
  local jsfile="$1"
  local -A domain_rules=()
  local -a segments=()
  local file rule domain line item parent_rule
  local ip prefix n1 n2 n3 n4
  local ipv6 expanded_ipv6 full_hex

  # --- 1. Explicit per-domain rules; the rule name comes from the file name.
  for file in domain-rules-*.txt; do
    rule="${file#domain-rules-}"
    rule="${rule%.txt}"
    # "|| [[ -n ... ]]" also processes a final line lacking a newline.
    while IFS= read -r domain || [[ -n "$domain" ]]; do
      domain="${domain%%#*}"
      domain="${domain// }"
      [[ -n "$domain" ]] || continue
      domain_rules["$domain"]="$rule"
    done < "$file"
  done

  # --- 2. AutoProxy lists. Explicit rules from step 1 always win; a domain
  # is only added when no parent domain already carries the same rule.
  for file in auto-proxy*.txt; do
    while read -r line || [[ -n "$line" ]]; do
      echo "$line" >&2
      rule=
      case "$line" in
        (/*)
          echo "Skip regex rule: $line"
          ;;
        (\!* | \[*)
          : comment
          ;;
        (@@\|\|*)
          # "@@||dom" -> "@||dom", then share the "@@|" handling below.
          line="${line#@}"
          ;&
        (@@\|*)
          line="${line#@?|}"
          line="${line#*://}"
          line="${line%%\%2F*}"
          domain="${line%%/*}"
          rule=direct
          echo "==> direct access: $domain"
          ;;
        (\|\|*)
          line="${line#|}"
          ;&
        (\|*)
          line="${line#|}"
          line="${line#*://}"
          ;&
        ([.a-z0-9]*)
          line="${line#.}"
          line="${line%%\%2F*}"
          domain="${line%%/*}"
          # Drop everything up to and including a wildcard label.
          domain="${domain#*\**.}"
          rule=proxy
          echo "==> proxy access: $domain"
          ;;
        (*)
          [[ "$line" =~ ^[[:space:]]*$ ]] ||
            echo "Skip: $line"
          ;;
      esac >&2
      [[ -n "${rule}" ]] || continue
      # An empty key is an invalid associative-array subscript.
      [[ -n "$domain" ]] || continue
      [[ -z "${domain_rules[$domain]-}" ]] || continue
      parent_rule=
      # mapfile keeps the segments out of word splitting and globbing.
      mapfile -t segments < <(domain_segments "$domain")
      for item in "${segments[@]}"; do
        if [[ -n "${domain_rules[$item]-}" ]]; then
          parent_rule="${domain_rules[$item]}"
          break
        fi
      done
      # rule is non-empty here, so this also covers "no parent rule at all".
      if [[ "$parent_rule" != "$rule" ]]; then
        domain_rules["$domain"]="$rule"
      fi
    done < <(sed '/URL Keywords/,/^!/d' "$file")
  done

  # --- 3. Drop entries whose nearest parent with a rule has the same rule.
  for domain in "${!domain_rules[@]}"; do
    rule="${domain_rules[$domain]}"
    mapfile -t segments < <(domain_segments "$domain" 2>/dev/null)
    parent_rule=
    # Skip element 0: it is the domain itself.
    for item in "${segments[@]:1}"; do
      parent_rule="${domain_rules[$item]-}"
      [[ -z "${parent_rule-}" ]] || break
    done
    if [[ "${parent_rule-}" = "${rule}" ]]; then
      unset "domain_rules[$domain]"
    fi
  done

  # --- 4. Template head + IPv4 networks.
  sed -n '1,/ begin of ipv4 networks$/p' "$jsfile"
  for file in ipv4-rules-*.txt; do
    rule="${file#ipv?-rules-}"
    rule="${rule%%.*}"
    [[ "$rule" = @(blocked|direct|proxy) ]] || rule="\"$rule\""
    while IFS= read -r line || [[ -n "$line" ]]; do
      line="${line%%#*}"
      line="${line// }"
      # Blank and comment-only lines must not produce an entry.
      [[ -n "$line" ]] || continue
      echo "$rule: $line" >&2
      IFS=/ read -r ip prefix <<< "$line"
      # A bare address is treated as a single host.
      prefix="${prefix:-32}"
      IFS=. read -r n1 n2 n3 n4 <<< "$ip"
      printf " [0x%02x%02x%02x%02x, %s, %s], // %s\n" "${n1:-0}" "${n2:-0}" "${n3:-0}" "${n4:-0}" "$prefix" "$rule" "$line"
    done < "$file"
  done | sort -n

  # --- 5. IPv6 networks, emitted as two 64-bit BigInt halves.
  sed -n '/ end of ipv4 networks$/,/ begin of ipv6 networks$/p' "$jsfile"
  for file in ipv6-rules-*.txt; do
    rule="${file#ipv?-rules-}"
    rule="${rule%%.*}"
    [[ "$rule" = @(blocked|direct|proxy) ]] || rule="\"$rule\""
    while IFS= read -r line || [[ -n "$line" ]]; do
      line="${line%%#*}"
      line="${line// }"
      [[ -n "$line" ]] || continue
      echo "$rule: $line" >&2
      if [[ "$line" == */* ]]; then
        ipv6="${line%%/*}"
        prefix="${line##*/}"
      else
        # A bare address is treated as a single host.
        ipv6="$line"
        prefix=128
      fi
      # Assigned separately from the declaration so a failure is not masked.
      expanded_ipv6="$(expand_ipv6 "$ipv6")"
      full_hex="${expanded_ipv6//:/}"
      echo " [0x${full_hex:0:16}n, 0x${full_hex:16:16}n, ${prefix}, ${rule}], // ${line}"
    done < "$file"
  done | sort

  # --- 6. Per-domain rules.
  sed -n '/ end of ipv6 networks$/,/ begin of proxy rules$/p' "$jsfile"
  for domain in "${!domain_rules[@]}"; do
    rule="${domain_rules[$domain]}"
    [[ "$rule" = @(blocked|direct|proxy) ]] || rule="\"$rule\""
    printf " \"%s\": %s,\n" "$domain" "$rule"
  done | sort -n

  # --- 7. Regexp rules: a "[rule]" line selects the rule for what follows.
  sed -n '/ end of proxy rules$/,/ begin of regexp rules$/p' "$jsfile"
  for file in domain-regexp*.txt; do
    rule=""
    while IFS= read -r line || [[ -n "$line" ]]; do
      line="${line%%#*}"
      line="${line// }"
      [[ -n "$line" ]] || continue
      if [[ "$line" = \[*\] ]]; then
        rule="${line#\[}"
        rule="${rule%\]}"
        [[ "$rule" = @(blocked|direct|proxy) ]] || rule="\"$rule\""
      elif [[ -n "$rule" ]]; then
        printf " [/%s/, %s],\n" "$line" "$rule"
      fi
    done < "$file"
  done

  # --- 8. Template tail.
  sed -n '/ end of regexp rules$/,$p' "$jsfile"
}
# Rebuild proxy.pac when this script, any *.js or any *.txt file is newer
# than it (or when it does not exist yet), then smoke-test it with node when
# node is available. While this runs, proxy.pac is registered for removal so
# a failed generation or a failed test does not leave it behind.
is_up_to_date=true
files_to_be_deleted=(proxy.pac)
# The script has already changed into its own directory, so "$0" as typed by
# the caller may no longer resolve; refer to the script by its base name.
for file in "./$(basename -- "$0")" *.js *.txt; do
  if [[ "$file" -nt proxy.pac ]]; then
    is_up_to_date=false
    break
  fi
done
if [[ "$is_up_to_date" != true ]]; then
  generate_pac "./proxy.js" > proxy.pac
fi
if command -v node &>/dev/null; then
  node proxy.pac test
fi
# Everything succeeded: keep proxy.pac.
files_to_be_deleted=()