about | summary | refs | log | tree | commit | diff
path: root/utils/gambling_sites_download.sh
diff options
context:
space:
mode:
author lns <matzeton@googlemail.com> 2023-05-20 15:04:06 +0200
committer lns <matzeton@googlemail.com> 2023-05-20 15:04:06 +0200
commit ebd0f9eebc28d7ea83a73114e6b91ad2eedf2d83 (patch)
tree f604b98e632a4286e75fa4d452ff903f37051b6a /utils/gambling_sites_download.sh
parent 5ca6f0ac62d6b2c346bc99d2a1b1200fe9df7917 (diff)
Added scripts to auto generate hostname/SNI *.inc files.
(branch: add/hostname-inc-generator-and-gambling-sites)

* add illegal gambling sites (Belgium)

Signed-off-by: lns <matzeton@googlemail.com>
Diffstat (limited to 'utils/gambling_sites_download.sh')
-rwxr-xr-x utils/gambling_sites_download.sh 17
1 files changed, 17 insertions, 0 deletions
diff --git a/utils/gambling_sites_download.sh b/utils/gambling_sites_download.sh
new file mode 100755
index 000000000..614e7c694
--- /dev/null
+++ b/utils/gambling_sites_download.sh
@@ -0,0 +1,17 @@
+#!/usr/bin/env sh
+
+set -e
+
+cd "$(dirname "${0}")" || exit 1
+
+DEST=../src/lib/inc_generated/ndpi_gambling_match.c.inc
+LIST=/tmp/gambling.list
+
+printf '(1) %s\n' "Scraping Illegal Gambling Sites (Belgium)"
+DOMAINS="$(curl -s 'https://www.gamingcommission.be/en/gaming-commission/illegal-games-of-chance/list-of-illegal-gambling-sites' | sed -n 's/^<td[^>]\+>\(.\+\.[a-zA-Z0-9]\+\)\(\|\/.*[^<]*\)<\/td>/\1/gp' || exit 1)"
+
+echo "${DOMAINS}" >${LIST}
+./hostname2list.py "${LIST}" "Gambling" NDPI_PROTOCOL_GAMBLING NDPI_PROTOCOL_CATEGORY_WEB NDPI_PROTOCOL_UNSAFE >${DEST}
+rm -f "${LIST}"
+
+exit 0