|
1
|
|
|
from copy import deepcopy |
|
2
|
|
|
from typing import Any, Dict |
|
3
|
|
|
import json |
|
4
|
|
|
|
|
5
|
|
|
from omi.base import get_metadata_specification |
|
6
|
|
|
from omi.validation import validate_metadata # parse_metadata |
|
7
|
|
|
from sqlalchemy.engine import Engine |
|
8
|
|
|
|
|
9
|
|
|
from egon.data.metadata import settings |
|
10
|
|
|
|
|
11
|
|
|
|
|
12
|
|
|
class OEMetadataPackage:
    """Incrementally build one OEMetadata package document.

    The package keeps a single root document (``name``, ``title``,
    ``description``, ``@id``, ``metaMetadata``) plus a list of ``resources``.
    All mutating methods return ``self`` so calls can be chained, and every
    mutation marks the document as "not validated" so that :meth:`as_dict`
    re-runs validation before handing the document out.
    """

    def __init__(self, version: str = settings.OEMETADATA_VERSION) -> None:
        """Create an empty package document for the given metadata version.

        Parameters
        ----------
        version:
            Metadata version string. It is passed to
            ``get_metadata_specification`` and stored under
            ``metaMetadata.metadataVersion``.
        """
        self.spec = get_metadata_specification(version)
        self._doc: Dict[str, Any] = {
            "@context": "https://raw.githubusercontent.com/OpenEnergyPlatform/oemetadata/production/oemetadata/latest/context.json",  # noqa: E501
            "name": "",
            "title": "",
            "description": "",
            "@id": "",
            "resources": [],
            "metaMetadata": {
                "metadataVersion": version,
                "metadataLicense": {"name": "CC0-1.0"},
            },
        }
        # True only after a successful finalize(); reset by every mutation.
        self._validated = False

    def set_root(
        self,
        *,
        name: str,
        title: str = "",
        description: str = "",
        id_: str = "",
    ) -> "OEMetadataPackage":
        """Set the root-level fields of the package.

        All four fields are overwritten; arguments that are omitted reset the
        corresponding field to an empty string. ``id_`` is stored under the
        ``"@id"`` key.

        Returns
        -------
        OEMetadataPackage
            ``self``, to allow chaining.
        """
        self._doc["name"] = name
        self._doc["title"] = title
        self._doc["description"] = description
        self._doc["@id"] = id_
        self._validated = False
        return self

    def add_resource(
        self,
        resource: dict,
        *,
        dedupe_by: str = "name",
        overwrite: bool = True,
    ) -> "OEMetadataPackage":
        """Append a deep copy of ``resource`` to the package.

        Parameters
        ----------
        resource:
            Resource dictionary. It is deep-copied, so later changes to the
            caller's object do not leak into the package.
        dedupe_by:
            Key used to detect an already present resource. An empty string
            disables de-duplication.
        overwrite:
            If true, existing resources whose ``dedupe_by`` value equals the
            new one are dropped before appending. If false, nothing is
            dropped and the new resource is appended next to any existing
            entry.

        Returns
        -------
        OEMetadataPackage
            ``self``, to allow chaining.
        """
        if dedupe_by and overwrite:
            key = resource.get(dedupe_by)
            # A missing key must not count as a match: otherwise adding one
            # resource without the key would silently delete every other
            # resource that also lacks it.
            if key is not None:
                self._doc["resources"] = [
                    existing
                    for existing in self._doc["resources"]
                    if existing.get(dedupe_by) != key
                ]
        self._doc["resources"].append(deepcopy(resource))
        self._validated = False
        return self

    def add_from_full_document(
        self, full_doc: dict, *, take_root_if_empty: bool = False
    ) -> "OEMetadataPackage":
        """Merge the resources of a complete metadata document.

        Parameters
        ----------
        full_doc:
            Metadata document; its ``"resources"`` entries are added through
            :meth:`add_resource` (default de-duplication by ``"name"``).
        take_root_if_empty:
            If true and this package has no ``name`` yet, copy ``name``,
            ``title``, ``description`` and ``@id`` from ``full_doc`` where
            present.

        Returns
        -------
        OEMetadataPackage
            ``self``, to allow chaining.
        """
        # Optionally fill root if still empty
        if take_root_if_empty and not self._doc["name"]:
            for k in ("name", "title", "description", "@id"):
                if k in full_doc:
                    self._doc[k] = full_doc[k]
            # The root may have changed even when no resource is added below,
            # so a previous validation result is no longer trustworthy.
            self._validated = False
        # ``or []`` also covers an explicit ``"resources": null``.
        for r in full_doc.get("resources") or []:
            self.add_resource(r)
        return self

    def add_from_table_comment(
        self, engine: Engine, schema: str, table: str
    ) -> "OEMetadataPackage":
        """Merge metadata stored as JSON in a database table comment.

        The comment of ``schema.table`` is read with ``obj_description`` and
        parsed as JSON. This is best effort: a missing comment, a comment
        that is not valid JSON, or JSON that is not an object leaves the
        package unchanged. A document that fails validation is still merged,
        but the failure is logged. Errors raised while querying the database
        are not caught here.

        Parameters
        ----------
        engine:
            SQLAlchemy engine used to run the query.
        schema, table:
            Identify the table; they are passed as bound parameters.

        Returns
        -------
        OEMetadataPackage
            ``self``, to allow chaining.
        """
        import logging  # local import keeps this block self-contained

        log = logging.getLogger(__name__)

        # NOTE(review): ``%s`` placeholders assume a driver with the
        # "format" paramstyle (e.g. psycopg2) - confirm.
        sql = """
        SELECT obj_description((quote_ident(%s)||'.'||quote_ident(%s))::regclass, 'pg_class') AS comment
        """  # noqa: E501
        with engine.begin() as conn:
            comment = conn.exec_driver_sql(sql, (schema, table)).scalar()
        if not comment:
            return self
        try:
            full_doc = json.loads(comment)
        except (TypeError, ValueError):
            # json.JSONDecodeError is a ValueError subclass.
            log.warning(
                "Comment on %s.%s is not valid JSON; skipping.", schema, table
            )
            return self
        if not isinstance(full_doc, dict):
            # Valid JSON but not an object (list, string, number, ...):
            # there is nothing that could be merged as a metadata document.
            log.warning(
                "Comment on %s.%s is not a JSON object; skipping.",
                schema,
                table,
            )
            return self
        # Validate the doc before merging. The merge is deliberately best
        # effort, so a failure is reported but does not abort; the package as
        # a whole is validated again in finalize().
        try:
            validate_metadata(full_doc, check_license=False)
        except Exception as exc:  # exception types raised by omi not visible here
            log.warning(
                "Metadata in comment on %s.%s failed validation: %s",
                schema,
                table,
                exc,
            )
        return self.add_from_full_document(full_doc)

    def finalize(self, *, license_check: bool = True) -> "OEMetadataPackage":
        """Validate the assembled document and mark it as validated.

        Parameters
        ----------
        license_check:
            Forwarded to ``validate_metadata`` as ``check_license``.

        Returns
        -------
        OEMetadataPackage
            ``self``, to allow chaining. Anything raised by
            ``validate_metadata`` propagates and the package stays
            unvalidated.
        """
        validate_metadata(self._doc, check_license=license_check)
        self._validated = True
        return self

    def as_dict(self) -> dict:
        """Return a deep copy of the document, validating it first if needed.

        If the package changed since the last successful :meth:`finalize`,
        :meth:`finalize` is called with its defaults before copying.
        """
        if not self._validated:
            self.finalize()
        return deepcopy(self._doc)

    def as_json(self) -> str:
        """Return the document from :meth:`as_dict` serialised as JSON.

        Non-ASCII characters are written as-is (``ensure_ascii=False``).
        """
        return json.dumps(self.as_dict(), ensure_ascii=False)
|
106
|
|
|
|