diff options
Diffstat (limited to 'utils/gambling_sites_download.sh')
-rwxr-xr-x | utils/gambling_sites_download.sh | 17 |
1 files changed, 17 insertions, 0 deletions
#!/usr/bin/env sh
#
# utils/gambling_sites_download.sh
#
# Scrapes the Belgian Gaming Commission's list of illegal gambling sites and
# passes the extracted domains to ./hostname2list.py, whose output replaces
# ../src/lib/inc_generated/ndpi_gambling_match.c.inc (relative to this script).
#
# Requires: curl, mktemp, and a sed that accepts the GNU BRE extensions
# \+ and \| used in the extraction expression below.
#
# Exit status: 0 on success, non-zero if the download, the extraction or the
# generator step fails. The destination file is only touched on success.

set -e

# Every relative path below is resolved from the directory holding this script.
cd "$(dirname "${0}")" || exit 1

DEST=../src/lib/inc_generated/ndpi_gambling_match.c.inc
URL='https://www.gamingcommission.be/en/gaming-commission/illegal-games-of-chance/list-of-illegal-gambling-sites'

# Private scratch directory rather than a fixed, predictable name in /tmp;
# it is removed on every exit path, including failures caught by `set -e`.
WORKDIR="$(mktemp -d)" || exit 1
trap 'rm -rf -- "${WORKDIR}"' EXIT
# Some shells do not run the EXIT trap on a fatal signal; route signals
# through a normal exit so the cleanup above still happens.
trap 'exit 1' HUP INT TERM

PAGE="${WORKDIR}/page.html"
LIST="${WORKDIR}/gambling.list"
OUT="${WORKDIR}/ndpi_gambling_match.c.inc"

printf '(1) %s\n' "Scraping Illegal Gambling Sites (Belgium)"

# Download as its own step: in a `curl | sed` pipeline the exit status is
# sed's, so a failed transfer would go unnoticed. -f turns HTTP errors into a
# non-zero exit instead of handing an error page to sed; -S keeps curl's
# error message visible despite -s.
if ! curl -sSf "${URL}" >"${PAGE}"; then
    printf 'ERROR: failed to download %s\n' "${URL}" >&2
    exit 1
fi

# Keep only table cells that look like a host name, dropping any trailing
# path component.
sed -n 's/^<td[^>]\+>\(.\+\.[a-zA-Z0-9]\+\)\(\|\/.*[^<]*\)<\/td>/\1/gp' "${PAGE}" >"${LIST}"

# An empty list means the page layout changed or the scrape failed; refuse to
# regenerate the include file from nothing.
if [ ! -s "${LIST}" ]; then
    printf 'ERROR: no domains extracted from %s\n' "${URL}" >&2
    exit 1
fi

# Generate into the scratch directory first so a generator failure (which
# aborts the script via `set -e`) cannot leave ${DEST} truncated.
./hostname2list.py "${LIST}" "Gambling" NDPI_PROTOCOL_GAMBLING NDPI_PROTOCOL_CATEGORY_WEB NDPI_PROTOCOL_UNSAFE >"${OUT}"

# Copy rather than move: the scratch file carries mktemp's restrictive
# permissions, whereas writing through the redirect keeps ${DEST}'s own mode.
cat "${OUT}" >"${DEST}"

exit 0