pybl/py-squid-blacklists-cdb.py
2016-02-20 14:46:12 +01:00

81 lines
2.1 KiB
Python
Executable File

#!/usr/bin/env python2.7
import sys
import os
import re
from urlparse import urlparse
try:
import config
except ImportError:
print("Please create config.py using config.py.sample")
exit()
try:
import cdb
except ImportError:
print("Please install python-cdb from pypi or via package manager")
exit()
def make_list(files):
blacklists = []
for l in files:
splitlist = l.split("/")
list_type = splitlist[len(splitlist) - 2]
blacklists.append([list_type, l])
return blacklists
def make_db(blacklist_files, config):
lib = []
for bl in blacklist_files:
bl_cdb_file = ("%s/%s.cdb" % (config.blacklists_dir, bl[0]))
bl_cdb_file_tmp = ("%s/%s.tmp" % (config.blacklists_dir, bl[0]))
if (bl[0] in config.blacklists):
if not os.path.isfile(bl_cdb_file):
cdb_file = cdb.cdbmake(bl_cdb_file, bl_cdb_file_tmp)
cache = dict()
f = open(bl[1], "r")
for line in f:
cdb_file.add(line.strip("\n"), "True")
cdb_file.finish()
lib.append(bl_cdb_file)
return lib
def compare(outline, blacklist_cache):
result = False
for blacklist in blacklist_cache:
cdb_file = cdb.init(blacklist)
tmpline = outline
while not result and tmpline != "":
try:
result = cdb_file[tmpline]
pass
except KeyError:
pass
tmpline = tmpline.partition('.')[2]
return result
def squid_response(response):
sys.stdout.write("%s\n" % response)
sys.stdout.flush()
domain_files = [os.path.join(dp, f) for dp, dn, fn in os.walk(os.path.expanduser(config.blacklists_dir)) for f in fn if re.match(r"domains*", f)]
blacklist_files = make_list(domain_files)
blacklist_cache = make_db(blacklist_files, config)
while True:
try:
line = sys.stdin.readline().strip()
outline = urlparse(line).netloc
if line:
if compare(outline, blacklist_cache):
squid_response("OK")
else:
squid_response("ERR")
except KeyboardInterrupt:
break