wttr.in/lib/cache.py

157 lines
4.1 KiB
Python
Raw Normal View History

"""
LRU-Cache implementation for formatted (`format=`) answers
"""
import datetime
import re
import time
2020-04-05 09:50:58 +00:00
import os
import hashlib
2020-04-30 09:20:32 +00:00
import random
2020-04-05 09:50:58 +00:00
import pytz
2020-04-05 09:50:58 +00:00
import pylru
from globals import LRU_CACHE
# Maximum number of entries held by the in-memory LRU cache
CACHE_SIZE = 10000
# In-memory LRU cache mapping a request signature to its value record
CACHE = pylru.lrucache(CACHE_SIZE)
2020-04-05 09:50:58 +00:00
# values whose length is at least this threshold are written to the
# file cache; only a reference to the file is kept in RAM
MIN_SIZE_FOR_FILECACHE = 80
def _update_answer(answer):
    """Expand `%{{NOW(<timezone>)}}` placeholders in a cached answer.

    Every placeholder is replaced with the current time in the named
    timezone, formatted as `%H:%M:%S%z`. Values that are not `str`,
    and strings without a placeholder, are returned unchanged.
    """
    if not isinstance(answer, str) or "%{{NOW(" not in answer:
        return answer

    def _render_now(match):
        # group(1) is the timezone name written between the parentheses
        zone = pytz.timezone(match.group(1))
        return datetime.datetime.now(zone).strftime("%H:%M:%S%z")

    return re.sub(r"%{{NOW\(([^}]*)\)}}", _render_now, answer)
def get_signature(user_agent, query_string, client_ip_address, lang):
    """
    Build the cache signature for a request.

    The signature is `user_agent`, `query_string`, `client_ip_address`
    and `lang` joined with ":".

    Return `None` if the query should not be cached. That is the case
    when the location part of `query_string` (everything before the
    first "?", with a leading "http://" or "https://" removed)
    contains a ":".
    """
    # Only the part in front of the query parameters names the location.
    location = query_string.split("?", 1)[0]
    for scheme in ("http://", "https://"):
        if location.startswith(scheme):
            location = location[len(scheme):]
            break

    if ":" in location:
        return None

    # The signature embeds the client address and user agent, so it is
    # deliberately not echoed to stdout (a debug print used to do that).
    return "%s:%s:%s:%s" % (user_agent, query_string, client_ip_address, lang)
def get(signature):
    """
    Return the cached answer for `signature`, or `None` on a miss.

    `None` is returned when `signature` is empty, when nothing is
    cached for it, when the record has expired, or when the record
    points to a cache file that cannot be read. Otherwise the stored
    value (loaded from the cache file if necessary) is passed through
    `_update_answer` before being returned.
    """
    if not signature:
        return None

    value_record = CACHE.get(signature)
    if not value_record:
        return None

    value = value_record["val"]
    expiry = value_record["expiry"]
    if not value or time.time() >= expiry:
        return None

    # File references are always str. Short bytes answers are kept in
    # RAM as-is, and calling bytes.startswith() with a str prefix raises
    # TypeError, so the type is checked first.
    # NOTE(review): a short str answer that itself starts with "file:"
    # is indistinguishable from a file reference here -- confirm that
    # answers can never begin with that prefix.
    if isinstance(value, str) and value.startswith(("file:", "bfile:")):
        value = _read_from_file(signature, sighash=value)
        if not value:
            return None

    return _update_answer(value)
2020-04-30 09:20:32 +00:00
def _randint(minimum, maximum):
    """Return a random integer N such that `minimum <= N < maximum`.

    Raises `ValueError` if the range is empty.
    """
    # Passing both bounds keeps the `minimum` offset; the previous
    # `randrange(maximum - minimum)` produced values starting at 0.
    return random.randrange(minimum, maximum)
def store(signature, value):
    """
    Cache `value` under `signature` and return the answer to serve.

    With an empty `signature` nothing is cached. Otherwise a record is
    put into `CACHE`: values whose length reaches
    `MIN_SIZE_FOR_FILECACHE` are written to a cache file and only the
    reference returned by `_store_in_file` is kept, shorter values are
    kept as they are. The record expires at the current time plus
    `_randint(1000, 2000)` seconds.

    In both cases the result is `value` passed through `_update_answer`.
    """
    if signature:
        if len(value) < MIN_SIZE_FOR_FILECACHE:
            cached = value
        else:
            cached = _store_in_file(signature, value)

        now = time.time()
        CACHE[signature] = {
            "val": cached,
            "expiry": now + _randint(1000, 2000),
        }

    return _update_answer(value)
2020-04-05 09:50:58 +00:00
def _hash(signature):
    """Return the hexadecimal MD5 digest of the UTF-8 encoded `signature`."""
    digest = hashlib.md5()
    digest.update(signature.encode("utf-8"))
    return digest.hexdigest()
def _store_in_file(signature, value):
    """Store `value` for `signature` in a cache file.

    The file is named after the hash of `signature` and is placed in
    the `LRU_CACHE` directory, which is created if it is missing.

    `value` can be a string as well as bytes.

    Return the file name (signature hash) prefixed with "file:"
    (for text files) or "bfile:" (for binary files).
    """
    signature_hash = _hash(signature)
    filename = os.path.join(LRU_CACHE, signature_hash)

    # exist_ok avoids the check-then-create race: if the directory
    # appears between an existence check and makedirs(), makedirs()
    # would otherwise raise FileExistsError.
    os.makedirs(LRU_CACHE, exist_ok=True)

    if isinstance(value, bytes):
        mode, prefix = "wb", "bfile:"
    else:
        mode, prefix = "w", "file:"

    with open(filename, mode) as f_cache:
        f_cache.write(value)

    return prefix + signature_hash
def _read_from_file(signature, sighash=None):
    """Read the value for `signature` from its cache file,
    or return None if the file is not found.

    If `sighash` is specified, do not calculate the file name
    from `signature`, but use `sighash` instead.

    `sighash` can be prefixed with "file:" (for text files)
    or "bfile:" (for binary files); binary files are returned as
    bytes, everything else as str.
    """
    mode = "r"
    if sighash:
        if sighash.startswith("file:"):
            sighash = sighash[5:]
        elif sighash.startswith("bfile:"):
            sighash = sighash[6:]
            mode = "rb"
    else:
        sighash = _hash(signature)

    filename = os.path.join(LRU_CACHE, sighash)

    # Open directly instead of checking for existence first: the file
    # may disappear between the check and the open. A missing file (or
    # a missing/invalid cache directory) is a cache miss, not an error.
    try:
        with open(filename, mode) as f_cache:
            return f_cache.read()
    except (FileNotFoundError, NotADirectoryError):
        return None