Pickle implemented (but not activated by default). Closes #1

This commit is contained in:
Stephane Bortzmeyer 2021-07-07 15:50:47 +02:00
parent ae00a81f79
commit 04fb72e408
2 changed files with 52 additions and 21 deletions

View File

@ -14,42 +14,63 @@ import os
import sys import sys
import time import time
import fcntl import fcntl
import pickle
IANABASE = "https://data.iana.org/rdap/dns.json" IANABASE = "https://data.iana.org/rdap/dns.json"
CACHE = os.environ["HOME"] + "/.ianardapcache.json" CACHE = os.environ["HOME"] + "/.ianardapcache"
MAXAGE = 24 # Hours MAXAGE = 24 # Hours
IANATIMEOUT = 10 # Seconds IANATIMEOUT = 10 # Seconds
MAXTESTS = 3 # Maximum attempts to get the database MAXTESTS = 3 # Maximum attempts to get the database
class IanaRDAPDatabase(): class IanaRDAPDatabase():
def __init__(self, maxage=MAXAGE, cachefile=CACHE): def __init__(self, maxage=MAXAGE, cachefile=CACHE, pickleformat=False):
""" Retrieves the IANA databse, if not already cached. maxage is in hours. """ """Retrieves the IANA database, if not already cached. maxage is in
hours. The cache file argument should not have an extension (it will
be added automatically). pickleformat is not the default because it is
not really faster *and* it introduces security risks if someone can
write in the file (see the documentation of the module)."""
cache_valid = False cache_valid = False
self.cachefile = cachefile if pickleformat:
self.cachefile = cachefile + ".pickle"
else:
self.cachefile = cachefile + ".json"
self.lockname = self.cachefile + ".lock" self.lockname = self.cachefile + ".lock"
loaded = False loaded = False
tests = 0 tests = 0
errmsg = "No error" errmsg = "No error"
while not loaded and tests < MAXTESTS: while not loaded and tests < MAXTESTS:
self.lock() self.lock()
if os.path.exists(cachefile) and \ if os.path.exists(self.cachefile) and \
datetime.datetime.fromtimestamp(os.path.getmtime(cachefile)) > \ datetime.datetime.fromtimestamp(os.path.getmtime(self.cachefile)) > \
(datetime.datetime.now() - datetime.timedelta(hours = maxage)): (datetime.datetime.now() - datetime.timedelta(hours = maxage)):
cache = open(cachefile, "rb") cache = open(self.cachefile, "rb")
content = cache.read() content = cache.read()
cache.close() cache.close()
self.unlock() self.unlock()
if pickleformat:
try:
database = pickle.loads(content)
loaded = True
self.retrieved = datetime.datetime.fromtimestamp(os.path.getmtime(self.cachefile))
cache_valid = True
except (pickle.UnpicklingError, EOFError):
tests += 1
errmsg = "Invalid pickle content in %s" % self.cachefile
# Delete it without mercy
os.remove(self.cachefile)
continue
else:
try: try:
database = json.loads(content) database = json.loads(content)
loaded = True loaded = True
self.retrieved = datetime.datetime.fromtimestamp(os.path.getmtime(cachefile)) self.retrieved = datetime.datetime.fromtimestamp(os.path.getmtime(self.cachefile))
cache_valid = True cache_valid = True
except json.decoder.JSONDecodeError: except json.decoder.JSONDecodeError:
tests += 1 tests += 1
errmsg = "Invalid JSON content in %s" % cachefile errmsg = "Invalid JSON content in %s" % self.cachefile
# Delete it without mercy # Delete it without mercy
os.remove(cachefile) os.remove(self.cachefile)
continue continue
else: else:
self.unlock() self.unlock()
@ -81,7 +102,10 @@ class IanaRDAPDatabase():
self.services[tld] = server self.services[tld] = server
if not cache_valid: if not cache_valid:
self.lock() self.lock()
cache = open(cachefile, "wb") cache = open(self.cachefile, "wb")
if pickleformat:
cache.write(pickle.dumps(database))
else:
cache.write(content) cache.write(content)
cache.close() cache.close()
self.unlock() self.unlock()

View File

@ -23,7 +23,7 @@ def test_alternative_cache():
datetime.datetime.fromtimestamp(os.path.getmtime(tmpfile.name)) > \ datetime.datetime.fromtimestamp(os.path.getmtime(tmpfile.name)) > \
(datetime.datetime.now() - datetime.timedelta(minutes=1)) (datetime.datetime.now() - datetime.timedelta(minutes=1))
os.remove(tmpfile.name) os.remove(tmpfile.name)
os.remove(tmpfile.name + ".lock") os.remove(tmpfile.name + ".json.lock")
def test_refresh(): def test_refresh():
# Force a resfresh # Force a resfresh
@ -41,3 +41,10 @@ def test_find_not_exists():
database = ianardap.IanaRDAPDatabase() database = ianardap.IanaRDAPDatabase()
server = database.find("www.foobar.example") server = database.find("www.foobar.example")
assert server is None assert server is None
def test_pickle():
database = ianardap.IanaRDAPDatabase(pickleformat=True)
assert database.description.startswith("RDAP bootstrap file") and database.version == "1.0" and \
len(database.services) > 1000