"""Functions that help us generate and use info.json files.
"""
import json
from collections.abc import Mapping
from functools import lru_cache
from typing import OrderedDict
from pathlib import Path
from copy import deepcopy

import hjson
import jsonschema

from milc import cli


def _dict_raise_on_duplicates(ordered_pairs):
    """Reject duplicate keys."""
    d = {}
    for k, v in ordered_pairs:
        if k in d:
            raise ValueError("duplicate key: %r" % (k,))
        else:
            d[k] = v
    return d
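# _dict_raise_on_duplicates is handed to hjson.load() below as its object_pairs_hook;
# the parser calls it with each object's (key, value) pairs, so strict loads reject
# files that define the same key twice instead of silently keeping the last value.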


@lru_cache(maxsize=20)
def _json_load_impl(json_file, strict=True):
    """Load a json file from disk.

    Note: file must be a Path object, or an already-open stream (e.g. stdin).
    """
    try:
        # Get the IO Stream for Path objects
        # Not necessary if the data is provided via stdin
        if isinstance(json_file, Path):
            json_file = json_file.open(encoding='utf-8')
        return hjson.load(json_file, object_pairs_hook=_dict_raise_on_duplicates if strict else None)

    except (json.decoder.JSONDecodeError, hjson.HjsonDecodeError) as e:
        cli.log.error('Invalid JSON encountered attempting to load {fg_cyan}%s{fg_reset}:\n\t{fg_red}%s', json_file, e)
        exit(1)
    except Exception as e:
        cli.log.error('Unknown error attempting to load {fg_cyan}%s{fg_reset}:\n\t{fg_red}%s', json_file, e)
        exit(1)


def json_load(json_file, strict=True):
    """Load a json file from disk, returning a deep copy so callers can mutate the result without touching the cached parse."""
    return deepcopy(_json_load_impl(json_file=json_file, strict=strict))
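# Example usage (the path is illustrative, not a file guaranteed to exist):
#     info = json_load(Path('keyboards/example/info.json'))
#     info['keyboard_name'] = 'renamed'  # safe: only the deep copy is modified,
#                                        # the lru_cache'd parse stays untouched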


@lru_cache(maxsize=20)
def load_jsonschema(schema_name):
    """Read a jsonschema file from disk.

    `schema_name` may be a path to an existing file, or a bare schema name which is
    resolved to data/schemas/<schema_name>.jsonschema. Unknown names fall back to
    data/schemas/false.jsonschema.
    """
    if Path(schema_name).exists():
        return json_load(schema_name)

    schema_path = Path(f'data/schemas/{schema_name}.jsonschema')

    if not schema_path.exists():
        schema_path = Path('data/schemas/false.jsonschema')

    return json_load(schema_path)
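# Illustrative resolution (schema names are hypothetical):
#     load_jsonschema('keyboard')        -> loads data/schemas/keyboard.jsonschema
#     load_jsonschema('does_not_exist')  -> falls back to data/schemas/false.jsonschema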


@lru_cache(maxsize=1)
def compile_schema_store():
    """Compile all our schemas into a schema store.
    """
    schema_store = {}

    for schema_file in Path('data/schemas').glob('*.jsonschema'):
        schema_data = load_jsonschema(schema_file)
        if not isinstance(schema_data, dict):
            cli.log.debug('Skipping schema file %s', schema_file)
            continue
        schema_store[schema_data['$id']] = schema_data

    return schema_store
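# The store maps each schema's '$id' to its parsed contents, e.g. (ids are illustrative):
#     {'qmk.keyboard.v1': {...}, 'qmk.api.keyboard.v1': {...}}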


@lru_cache(maxsize=20)
def create_validator(schema):
    """Creates a validator for the given schema id.
    """
    schema_store = compile_schema_store()
    resolver = jsonschema.RefResolver.from_schema(schema_store[schema], store=schema_store)

    return jsonschema.Draft202012Validator(schema_store[schema], resolver=resolver).validate
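# The RefResolver allows a '$ref' in one schema to point at any other schema in the
# store by its '$id' (e.g. a hypothetical '$ref': 'qmk.definitions.v1#/boolean').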


def validate(data, schema):
    """Validates data against a schema.
    """
    validator = create_validator(schema)

    return validator(data)
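# Example usage (the schema id is illustrative):
#     validate(keyboard_data, 'qmk.keyboard.v1')
# jsonschema raises a ValidationError when the data does not conform, so callers
# typically wrap this call in try/except.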


def deep_update(origdict, newdict):
    """Update a dictionary in place, recursively merging nested mappings depth-first.
    """
    for key, value in newdict.items():
        if isinstance(value, Mapping):
            origdict[key] = deep_update(origdict.get(key, {}), value)

        else:
            origdict[key] = value

    return origdict
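# Illustrative behaviour:
#     deep_update({'a': {'x': 1}}, {'a': {'y': 2}, 'b': 3})
#     -> {'a': {'x': 1, 'y': 2}, 'b': 3}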


def merge_ordered_dicts(dicts):
    """Merges nested OrderedDict objects resulting from reading a hjson file.

    Later input dicts override earlier dicts for plain values.

    If any value is "!delete!", the existing value will be removed from its parent.

    Arrays will be appended. If the first entry of an array is "!reset!", the contents of the array will be cleared and replaced with the RHS.

    Dictionaries will be recursively merged. If any entry is "!reset!", the contents of the dictionary will be cleared and replaced with the RHS.
    """
    result = OrderedDict()

    def add_entry(target, k, v):
        if k in target and isinstance(v, (OrderedDict, dict)):
            if "!reset!" in v:
                target[k] = v
            else:
                target[k] = merge_ordered_dicts([target[k], v])
            if "!reset!" in target[k]:
                del target[k]["!reset!"]
        elif k in target and isinstance(v, list):
            if v[0] == '!reset!':
                target[k] = v[1:]
            else:
                target[k] = target[k] + v
        elif v == "!delete!" and isinstance(target, (OrderedDict, dict)):
            del target[k]
        else:
            target[k] = v

    for d in dicts:
        for (k, v) in d.items():
            add_entry(result, k, v)

    return result
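# Illustrative behaviour of the merge directives (keys and values are hypothetical):
#     merge_ordered_dicts([
#         OrderedDict({'features': {'rgblight': True, 'oled': True}, 'layouts': ['a']}),
#         OrderedDict({'features': {'oled': '!delete!'}, 'layouts': ['!reset!', 'b']}),
#     ])
#     -> features == {'rgblight': True}, layouts == ['b']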