#!/bin/env python3 # Copyright 2019 Pekka Helenius # Permission is hereby granted, free of charge, to any person obtaining a copy of this software # and associated documentation files (the "Software"), to deal in the Software without restriction, # including without limitation the rights to use, copy, modify, merge, publish, distribute, # sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is # furnished to do so, subject to the following conditions: # The above copyright notice and this permission notice shall be included in all copies or # substantial portions of the Software. # THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, # INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR # PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE # FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, # ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. ######################################## # Simple DNS sinkhole file generation for DNSCrypt & pdnsd servers # Block DNS query resolutions for specific network domains ######################################## import os import re import readline import signal import sys import time import numpy as np import urllib.request as URL from datetime import datetime from socket import timeout ######################################## url_useragent = 'Mozilla/5.0 (Windows NT 6.1; Win64; x64; rv:62.0) Gecko/20100101 Firefox/62.0' url_timeout = 60 filepath = '/tmp/' #timestamp_short = datetime.now().strftime('%Y-%m-%d') timestamp_long = datetime.now().strftime('%Y-%m-%d %H:%M:%S') #################### pdnsd_datafile = 'pdnsd.sinkhole' pdnsd_tempfile = pdnsd_datafile + '.tmp' pdnsd_fileheader = "// Auto-generated list, build date " + timestamp_long + "\n// No addresses of these domains must be resolved" + "\n\n" pdnsd_outmessage = ("Move it to /etc/ folder and add the following configuration setting in /etc/pdnsd.conf:\n\n" + \ "//Blacklisted domains\ninclude { file = \"/etc/" + pdnsd_datafile + "\"; }\n\n--------------------\nRestart pdnsd by issuing command 'systemctl restart pdnsd'\n\nYou may need to delete your pdnsd.cache file before the list rules apply.\n") #################### dnscrypt_datafile = 'dnscrypt.cloaking.txt' dnscrypt_tempfile = dnscrypt_datafile + ".tmp" dnscrypt_fileheader = "# Auto-generated list, build date " + datetime.now().strftime('%Y-%m-%d %H:%M:%S') + "\n# No addresses of these domains must be resolved" + "\n\n" dnscrypt_outmessage = ("Move it to /etc/dnscrypt-proxy/ and add the following configuration setting in\n/etc/dnscrypt-proxy/dnscrypt-proxy.toml:\n\n" + \ "cloaking_rules = '/etc/dnscrypt-proxy/" + dnscrypt_datafile + "'\n\n--------------------\nRestart dnscrypt-proxy by issuing command 'systemctl restart dnscrypt-proxy'\n") ######################################## domains_blacklists = [ # { # 'name': 'Cameleon blocklist', # 'url': 'https://sysctl.org/cameleon/hosts' # }, # { # 'name': 'Xiaomi spyware blocklist (kevle2)', # 'url': 'https://raw.githubusercontent.com/kevle2/XiaomiSpywareBlockList/master/xiaomiblock.txt' # }, { 'name': 'My custom blocklist', 'url': 'file:///home/' + os.environ['USER'] + '/dns-sinkhole.txt' }, { 'name': 'Simple tracking', 'url': 'https://s3.amazonaws.com/lists.disconnect.me/simple_tracking.txt' }, { 'name': 'Simple ads', 'url': 'https://s3.amazonaws.com/lists.disconnect.me/simple_ad.txt' }, { 'name': 'Zeustracker blocklist', 'url': 'https://zeustracker.abuse.ch/blocklist.php?download=domainblocklist' }, { 'name': 'Zeustracker baddomains', 'url': 'https://zeustracker.abuse.ch/blocklist.php?download=baddomains' }, { 'name': 'StevenBlack blocklist', 'url': 'https://raw.githubusercontent.com/StevenBlack/hosts/master/hosts' }, { 'name': 'Malwaredomains blocklist', 'url': 'https://mirror1.malwaredomains.com/files/justdomains' }, { 'name': 'Ad servers', 'url': 'https://hosts-file.net/ad_servers.txt' }, { 'name': 'YouTube ads (kboghdady)', 'url': 'https://raw.githubusercontent.com/kboghdady/youTube_ads_4_pi-hole/master/black.list' }, { 'name': 'YouTube ads (Akamaru)', 'url': 'https://raw.githubusercontent.com/Akamaru/Pi-Hole-Lists/master/youtube.txt' }, { 'name': 'HbbTV ads (Akamaru)', 'url': 'https://raw.githubusercontent.com/Akamaru/Pi-Hole-Lists/master/hbbtv.txt' }, { 'name': 'Windows ads (Akamaru)', 'url': 'https://raw.githubusercontent.com/Akamaru/Pi-Hole-Lists/master/nomsdata.txt' }, { 'name': 'Android & iOS ads (Akamaru)', 'url': 'https://raw.githubusercontent.com/Akamaru/Pi-Hole-Lists/master/appads.txt' }, { 'name': 'Fake jailbreak websites (Akamaru)', 'url': 'https://raw.githubusercontent.com/Akamaru/Pi-Hole-Lists/master/jbfake.txt' }, { 'name': 'Adobe updates (Akamaru)', 'url': 'https://raw.githubusercontent.com/Akamaru/Pi-Hole-Lists/master/adobeblock.txt' }, { 'name': 'Fake emulators (Akamaru)', 'url': 'https://raw.githubusercontent.com/Akamaru/Pi-Hole-Lists/master/gamefake.txt' }, { 'name': 'ADsecu blocklist', 'url': 'https://raw.githubusercontent.com/ADsecu/black-domains/master/domain_hosts.txt' }, { 'name': 'SweetSophia blocklist', 'url': 'https://raw.githubusercontent.com/SweetSophia/mifitxiaomipiholelist/master/mifitblocklist.txt' }, { 'name': 'Android ads (SweetSophia)', 'url': 'https://raw.githubusercontent.com/SweetSophia/androidappspihole/master/testrareandroappblock.txt' }, { 'name': 'Blocklist (zebpalmer)', 'url': 'https://raw.githubusercontent.com/zebpalmer/dns_blocklists/master/blocklist.txt' }, { 'name': 'Ads and tracking extended (lightswitch05)', 'url': 'https://raw.githubusercontent.com/lightswitch05/hosts/master/ads-and-tracking-extended.txt' }, { 'name': 'Amp hosts extended (lightswitch05)', 'url': 'https://raw.githubusercontent.com/lightswitch05/hosts/master/amp-hosts-extended.txt' }, { 'name': 'Tracking aggressive (lightswitch05)', 'url': 'https://raw.githubusercontent.com/lightswitch05/hosts/master/tracking-aggressive-extended.txt' }, { 'name': 'dnscrypt.info blacklist', 'url': 'https://download.dnscrypt.info/blacklists/domains/mybase.txt' }, { 'name': 'dnscrypt-proxy blacklist', 'url': 'https://raw.githubusercontent.com/CNMan/dnscrypt-proxy-config/master/dnscrypt-blacklist-domains.txt' }, { 'name': 'dnscrypt - activation blocklist', 'url': 'https://raw.githubusercontent.com/zeffy/dnscrypt-blocking-additions/master/hosts/blacklist/activation.txt' }, { 'name': 'dnscrypt - ads blocklist', 'url': 'https://raw.githubusercontent.com/zeffy/dnscrypt-blocking-additions/master/hosts/blacklist/ads.txt' }, { 'name': 'dnscrypt - anticheat blocklist', 'url': 'https://raw.githubusercontent.com/zeffy/dnscrypt-blocking-additions/master/hosts/blacklist/anticheat.txt' }, { 'name': 'dnscrypt - fakenews blocklist', 'url': 'https://raw.githubusercontent.com/zeffy/dnscrypt-blocking-additions/master/hosts/blacklist/fakenews.txt' }, { 'name': 'dnscrypt - tracking blocklist', 'url': 'https://raw.githubusercontent.com/zeffy/dnscrypt-blocking-additions/master/hosts/blacklist/tracking.txt' }, { 'name': 'dnscrypt - misc blocklist', 'url': 'https://raw.githubusercontent.com/zeffy/dnscrypt-blocking-additions/master/hosts/blacklist/misc.txt' }, { 'name': 'WindowsSpyBlocker - spy (crazy-max)', 'url': 'https://raw.githubusercontent.com/crazy-max/WindowsSpyBlocker/master/data/dnscrypt/spy.txt' }, { 'name': 'WindowsSpyBlocker - update (crazy-max)', 'url': 'https://raw.githubusercontent.com/crazy-max/WindowsSpyBlocker/master/data/dnscrypt/update.txt' }, { 'name': 'WindowsSpyBlocker - extra (crazy-max)', 'url': 'https://raw.githubusercontent.com/crazy-max/WindowsSpyBlocker/master/data/dnscrypt/extra.txt' } ] ######################################## # Exclude these pre-blacklisted domains from the final DNS sinkhole blacklist domains_whitelists = [ # { # 'name': 'My custom whitelist', # 'url': 'file:///home/' + os.environ['USER'] + '/dns-whitelist.txt' # } ] ######################################## failedlists = [] ########## def filewrite(filepath, datafile, string, operationmode, closefile): with open(os.path.join(filepath, datafile),operationmode) as f: f.write(string) if closefile is True: f.close() ########## def getlist(domainlist,timeout): if not domainlist is None: try: print("Processing list:\t\t" + domainlist['name']) request = URL.Request(domainlist['url'],headers={'User-Agent': url_useragent}) return np.array(URL.urlopen(request, timeout=timeout).read().decode('utf-8').split('\n')) except KeyboardInterrupt: exit(0) except: print("Data retrieval failed:\t\t" + domainlist['url'] + "\n") failedlists.append(domainlist['name']) pass ########## def fetchdomaindata(dataset): fetched_data = set() if not dataset is None: for line in dataset: if not re.search('.*:.*', line) \ and not re.search('[\[|\]]', line) \ and not re.search('^.*#', line) \ and not re.search('.*localhost.*', line) \ and not re.search('\slocal$', line) \ and not re.search('^$', line) \ and re.search('[a-z]+', line): line = re.sub(r'^[0-9]+\.[0-9]+\.[0-9]+\.[0-9]+[ \t]+','',line) # Windows EOL last character substitution, corrects misformatted line variable line = re.sub('[\n]?\r$','',line) if not re.match('^$',line): fetched_data.add(line) if len(set(fetched_data)) == 0: print("\t\t\t\tNo domain entries found\n") return fetched_data ######################################## # DNS sinkhole file headers filewrite(filepath, pdnsd_datafile, pdnsd_fileheader, 'w', True) filewrite(filepath, dnscrypt_datafile, dnscrypt_fileheader, 'w', True) #################### # Download and parse white/blocklists ########## if domains_whitelists: for whitelist in domains_whitelists: whitelist_dataset = getlist(whitelist, url_timeout) whitelist_fetched_data = fetchdomaindata(whitelist_dataset) else: whitelist_fetched_data = set() ########## for blacklist in domains_blacklists: blacklist_dataset = getlist(blacklist, url_timeout) if not blacklist_dataset is None: for line in (fetchdomaindata(blacklist_dataset)): if not line in whitelist_fetched_data: if re.search('^\.', line): pdnsd_line = "neg { name=*" + line + "; types = domain; }" elif re.search('\*', line): pdnsd_line = "neg { name=" + line + "; types = domain; }" else: pdnsd_line = "rr { name=" + line + "; a=0.0.0.0; }" dnscrypt_line = line + " " + "0.0.0.0" filewrite(filepath, pdnsd_tempfile, pdnsd_line + '\n', 'a', False) if not dnscrypt_line is None: filewrite(filepath, dnscrypt_tempfile, dnscrypt_line + '\n', 'a', False) #################### # Parse generated list, get only unique lines and write to final file def parseuniqlines(filepath, tempfile, outfile, outmessage): uniqdata = set() with open(os.path.join(filepath, outfile),'a') as f: for line in open(os.path.join(filepath, tempfile),'r'): if not line in uniqdata: f.write(line) uniqdata.add(line) f.close() os.remove(os.path.join(filepath, tempfile)) print("----------------------------------------") print("Added " + str(len(set(uniqdata))) + " unique domains to the sinkhole file " + filepath + outfile) print("DNS sinkhole file " + filepath + outfile + " generated successfully.") print(outmessage) parseuniqlines(filepath, pdnsd_tempfile, pdnsd_datafile, pdnsd_outmessage) parseuniqlines(filepath, dnscrypt_tempfile, dnscrypt_datafile, dnscrypt_outmessage) #################### # Inform user about failed DNS blocklist downloads if len(failedlists) > 0: print("Warning: could not get data for the following blocklists:\n") for i in range(len(failedlists)): print("\t" + failedlists[i]) print("")