|
1
|
|
|
""" |
|
2
|
|
|
This module adds DataManagers for Atramhasis. These are service layer objects |
|
3
|
|
|
that abstract all interactions with the database away from the views. |
|
4
|
|
|
|
|
5
|
|
|
:versionadded: 0.4.1 |
|
6
|
|
|
""" |
|
7
|
|
|
import uuid |
|
8
|
|
|
from datetime import date |
|
9
|
|
|
from datetime import datetime |
|
10
|
|
|
from typing import List |
|
11
|
|
|
|
|
12
|
|
|
import dateutil.relativedelta |
|
13
|
|
|
import sqlalchemy as sa |
|
14
|
|
|
from skosprovider_sqlalchemy.models import Collection |
|
15
|
|
|
from skosprovider_sqlalchemy.models import Concept |
|
16
|
|
|
from skosprovider_sqlalchemy.models import ConceptScheme |
|
17
|
|
|
from skosprovider_sqlalchemy.models import Label |
|
18
|
|
|
from skosprovider_sqlalchemy.models import LabelType |
|
19
|
|
|
from skosprovider_sqlalchemy.models import Language |
|
20
|
|
|
from skosprovider_sqlalchemy.models import Match |
|
21
|
|
|
from skosprovider_sqlalchemy.models import MatchType |
|
22
|
|
|
from skosprovider_sqlalchemy.models import Thing |
|
23
|
|
|
from sqlalchemy import desc |
|
24
|
|
|
from sqlalchemy import func |
|
25
|
|
|
from sqlalchemy import select |
|
26
|
|
|
from sqlalchemy.orm import Session |
|
27
|
|
|
from sqlalchemy.orm import joinedload |
|
28
|
|
|
|
|
29
|
|
|
from atramhasis.data import popular_concepts |
|
30
|
|
|
from atramhasis.data.models import ConceptVisitLog |
|
31
|
|
|
from atramhasis.data.models import ConceptschemeCounts |
|
32
|
|
|
from atramhasis.data.models import IDGenerationStrategy |
|
33
|
|
|
from atramhasis.data.models import Provider |
|
34
|
|
|
from atramhasis.scripts import delete_scheme |
|
35
|
|
|
|
|
36
|
|
|
|
|
37
|
|
|
class DataManager:
    """
    Base class for the service layer objects defined in this module.

    A DataManager wraps the database access for a certain model so that the
    views do not have to talk to the database session themselves.
    """

    def __init__(self, session: Session) -> None:
        """
        :param session: the database session, stored on the manager as
            ``self.session``
        """
        self.session: Session = session
|
44
|
|
|
|
|
45
|
|
|
|
|
46
|
|
|
class ConceptSchemeManager(DataManager):
    """
    A :class:`DataManager` for
    :class:`ConceptSchemes <skosprovider_sqlalchemy.models.ConceptScheme>.`
    """

    def __init__(self, session):
        super().__init__(session)

    def get(self, conceptscheme_id):
        """
        Fetch a single conceptscheme by its id.

        The query result is read with ``scalar_one()``, so exactly one
        matching row is expected.

        :param conceptscheme_id: a conceptscheme id
        :return: the conceptscheme for the given id
        """
        return self.session.execute(
            select(ConceptScheme)
            .filter(ConceptScheme.id == conceptscheme_id)
        ).scalar_one()

    def find(self, conceptscheme_id, query):
        """
        Find concepts and collections in this concept scheme.

        Two optional keys of ``query`` are used:

        * ``type``: only applied when its value is ``'concept'`` or
          ``'collection'``; any other value is ignored.
        * ``label``: matched with ``ilike`` as a substring against the labels
          of each thing.

        :param conceptscheme_id: a conceptscheme id
        :param query: A python dictionary containing query parameters.
        :returns: A :class:`list` of
            :class:`skosprovider_sqlalchemy.models.Thing` instances.
        """
        db_query = (
            select(Thing)
            .options(joinedload(Thing.labels))
            .filter(Thing.conceptscheme_id == conceptscheme_id)
        )
        if 'type' in query and query['type'] in ['concept', 'collection']:
            db_query = db_query.filter(Thing.type == query['type'])
        if 'label' in query:
            db_query = db_query.filter(
                Thing.labels.any(
                    Label.label.ilike('%' + query['label'].lower() + '%')
                )
            )
        # The labels are joined-eager-loaded, so the raw result has one row
        # per (thing, label) pair; unique() collapses them per thing.
        return self.session.execute(db_query).unique().scalars().all()

    def get_concepts_for_scheme_tree(self, conceptscheme_id):
        """
        Get the concepts of a conceptscheme that have no broader concepts and
        match the ``member_of`` criterion below.

        :param conceptscheme_id: a conceptscheme id
        :return: all concepts for the scheme_tree
        """
        return self.session.execute(
            select(Concept)
            .filter(
                Concept.conceptscheme_id == conceptscheme_id,
                ~Concept.broader_concepts.any(),
                # NOTE(review): this criterion is written against Collection
                # although the query selects Concept; presumably it is meant
                # to exclude concepts that are a member of a collection --
                # confirm against the skosprovider_sqlalchemy models.
                ~Collection.member_of.any()
            )
        ).scalars().all()

    def get_collections_for_scheme_tree(self, conceptscheme_id):
        """
        Get the collections of a conceptscheme that have no broader concepts
        and are not a member of another collection.

        :param conceptscheme_id: a conceptscheme id
        :return: all collections for the scheme_tree
        """
        return self.session.execute(
            select(Collection)
            .filter(
                Collection.conceptscheme_id == conceptscheme_id,
                ~Collection.broader_concepts.any(),
                ~Collection.member_of.any(),
            )
        ).scalars().all()

    def get_all(self, conceptscheme_id):
        """
        Get all concepts and collections in this concept scheme.

        :param conceptscheme_id: a conceptscheme id
        :returns: A :class:`list` of
            :class:`skosprovider_sqlalchemy.models.Thing` instances.
        """
        all_results = self.session.execute(
            select(Thing)
            .options(joinedload(Thing.labels))
            .filter(Thing.conceptscheme_id == conceptscheme_id)
        ).unique().scalars().all()
        return all_results

    def save(self, conceptscheme):
        """
        Merge a conceptscheme into the session and flush it.

        :param conceptscheme: conceptscheme to save
        :return: saved conceptscheme, i.e. the instance returned by
            ``session.merge``. This is the object that is attached to the
            session; when ``conceptscheme`` was already part of the session
            it is that same object.
        """
        # merge() does not attach the instance it is given; it copies the
        # state onto a session-bound instance and returns that one, so that
        # is what has to be handed back to the caller.
        merged = self.session.merge(conceptscheme)
        self.session.flush()
        return merged
|
144
|
|
|
|
|
145
|
|
|
|
|
146
|
|
|
class SkosManager(DataManager):
    """
    A :class:`DataManager` for
    :class:`Concepts and Collections <skosprovider_sqlalchemy.models.Thing>.`
    """

    def __init__(self, session):
        super().__init__(session)

    def get_thing(self, concept_id, conceptscheme_id):
        """
        Look up one thing by its concept id within a conceptscheme.

        :param concept_id: a concept id
        :param conceptscheme_id: a conceptscheme id
        :return: the selected thing (Concept or Collection)
        """
        stmt = select(Thing).where(
            Thing.concept_id == concept_id,
            Thing.conceptscheme_id == conceptscheme_id,
        )
        return self.session.execute(stmt).scalar_one()

    def save(self, thing):
        """
        Add a thing to the session and flush it.

        :param thing: thing to save
        :return: saved thing
        """
        self.session.add(thing)
        self.session.flush()
        return thing

    def change_type(self, thing, concept_id, conceptscheme_id, new_type, uri):
        """
        Replace a thing with a new, empty thing of another type.

        The given thing is deleted and flushed first. After that a new
        Concept (when ``new_type`` is ``'concept'``) or Collection (any other
        value) is created with the given identifiers and saved.

        :param thing: the thing to replace
        :param concept_id: concept id for the new thing
        :param conceptscheme_id: conceptscheme id for the new thing
        :param new_type: type to set on the new thing
        :param uri: uri for the new thing
        :return: the newly saved thing
        """
        self.delete_thing(thing)
        self.session.flush()
        if new_type == 'concept':
            replacement = Concept()
        else:
            replacement = Collection()
        replacement.type = new_type
        replacement.concept_id = concept_id
        replacement.conceptscheme_id = conceptscheme_id
        replacement.uri = uri
        self.save(replacement)
        return replacement

    def delete_thing(self, thing):
        """
        Mark a thing for deletion in the session (no flush is done here).

        :param thing: the thing to delete
        """
        self.session.delete(thing)

    def get_by_list_type(self, list_type):
        """
        Select everything of the given list type.

        :param list_type: a specific list type; it is passed directly to
            ``select()``
        :return: all results for the specific list type
        """
        result = self.session.execute(select(list_type))
        return result.scalars().all()

    def get_match_type(self, match_type):
        """
        :param match_type: name of a match type
        :return: the MatchType with that name
        """
        stmt = select(MatchType).where(MatchType.name == match_type)
        return self.session.execute(stmt).scalar_one()

    def get_match(self, uri, matchtype_id, concept_id):
        """
        :param uri: uri of the match
        :param matchtype_id: id of the match type
        :param concept_id: id of the concept the match belongs to
        :return: the Match for this combination
        """
        stmt = select(Match).where(
            Match.uri == uri,
            Match.matchtype_id == matchtype_id,
            Match.concept_id == concept_id,
        )
        return self.session.execute(stmt).scalar_one()

    def get_all_label_types(self):
        """
        :return: list of all label types
        """
        result = self.session.execute(select(LabelType))
        return result.scalars().all()

    def get_next_cid(self, conceptscheme_id, id_generation_strategy):
        """
        Produce a concept id for a new thing in a conceptscheme.

        :param conceptscheme_id: a conceptscheme id
        :param id_generation_strategy: an :class:`IDGenerationStrategy`;
            NUMERIC gives the highest concept id (cast to integer) in the
            scheme plus one, or 1 when there is none; GUID gives a random
            uuid4 string
        :return: the next concept id
        :raises ValueError: for any other strategy
        """
        if id_generation_strategy == IDGenerationStrategy.NUMERIC:
            stmt = select(
                func.max(sa.cast(Thing.concept_id, sa.Integer))
            ).filter_by(conceptscheme_id=conceptscheme_id)
            highest = self.session.execute(stmt).scalar_one()
            if not highest:
                return 1
            return highest + 1
        if id_generation_strategy == IDGenerationStrategy.GUID:
            return str(uuid.uuid4())
        raise ValueError("unsupported id_generation_strategy")
|
236
|
|
|
|
|
237
|
|
|
|
|
238
|
|
|
class LanguagesManager(DataManager):
    """
    A :class:`DataManager` for
    :class:`Languages <skosprovider_sqlalchemy.models.Language>.`
    """

    def __init__(self, session):
        super().__init__(session)

    def get(self, language_id):
        """
        :param language_id: id of a language
        :return: the language with that id
        """
        stmt = select(Language).where(Language.id == language_id)
        return self.session.execute(stmt).scalar_one()

    def save(self, language):
        """
        Add a language to the session and flush it.

        :param language: language to save
        :return: saved language
        """
        self.session.add(language)
        self.session.flush()
        return language

    def delete(self, language):
        """
        Mark a language for deletion in the session (no flush is done here).

        :param language: the language to delete
        """
        self.session.delete(language)

    def get_all(self):
        """
        :return: list of all languages
        """
        result = self.session.execute(select(Language))
        return result.scalars().all()

    def get_all_sorted(self, sort_coll, sort_desc):
        """
        Get all languages ordered by one column.

        :param sort_coll: sort on this column
        :param sort_desc: descending or not
        :return: sorted list of languages
        """
        ordering = desc(sort_coll) if sort_desc else sort_coll
        stmt = select(Language).order_by(ordering)
        return self.session.execute(stmt).scalars().all()

    def count_languages(self, language_tag):
        """
        :param language_tag: the language id to look for
        :return: the number of languages whose id equals ``language_tag``
        """
        stmt = select(func.count(Language.id)).where(
            Language.id == language_tag
        )
        return self.session.execute(stmt).scalar_one()
|
300
|
|
|
|
|
301
|
|
|
|
|
302
|
|
|
class AuditManager(DataManager):
    """
    A data manager for logging the visit.
    """

    def save(self, visit_log):
        """
        Save a certain visit by adding it to the session and flushing.

        :param visit_log: log of visit to save
        :return: The saved visit log
        """
        self.session.add(visit_log)
        self.session.flush()
        return visit_log

    @popular_concepts.cache_on_arguments(expiration_time=86400)
    def get_most_popular_concepts_for_conceptscheme(
        self, conceptscheme_id, max_results=5, period='last_month'
    ):
        """
        Get the most popular concepts for a conceptscheme.

        Visits are counted per concept id from the first day of the period
        onwards and the concepts with the highest counts are returned first.
        The call goes through ``popular_concepts.cache_on_arguments`` with an
        expiration time of 86400 (presumably seconds, i.e. one day).

        :param conceptscheme_id: id of the conceptscheme
        :param max_results: maximum number of results, default 5
        :param period: 'last_day' or 'last_week' or 'last_month' or
            'last_year', default 'last_month'
        :return: List of the most popular concepts of a conceptscheme over a
            certain period, as dictionaries with the keys ``concept_id`` and
            ``scheme_id``
        """
        start_date = self._get_first_day(period)
        rows = self.session.execute(
            select(
                ConceptVisitLog.concept_id,
                func.count(ConceptVisitLog.concept_id).label('count')
            )
            .filter(
                # The conceptscheme id is compared as a string.
                ConceptVisitLog.conceptscheme_id == str(conceptscheme_id),
                ConceptVisitLog.visited_at >= start_date
            )
            .group_by(ConceptVisitLog.concept_id)
            .order_by(desc('count'))
            .limit(max_results)
        ).all()
        return [
            {'concept_id': row.concept_id, 'scheme_id': conceptscheme_id}
            for row in rows
        ]

    @staticmethod
    def _get_first_day(period):
        """
        Get the first day of a certain period until now.

        A period other than the four listed values subtracts nothing, so
        today's date is returned in that case.

        :param period: 'last_day' or 'last_week' or 'last_month' or 'last_year'
        :return: (string) the first day of the period, formatted as
            ``YYYY-MM-DD``
        """
        today = date.today()
        # Only the unit that matches the period is non-zero.
        start_date = today - dateutil.relativedelta.relativedelta(
            days=1 if period == 'last_day' else 0,
            weeks=1 if period == 'last_week' else 0,
            months=1 if period == 'last_month' else 0,
            years=1 if period == 'last_year' else 0
        )
        return start_date.strftime("%Y-%m-%d")
|
364
|
|
|
|
|
365
|
|
|
|
|
366
|
|
|
class CountsManager(DataManager):
    """
    A data manager that deals with triple counts.
    """

    def save(self, counts):
        """
        Save a certain counts object by adding it to the session and flushing.

        :param atramhasis.data.models.ConceptschemeCounts counts: Counts object to save

        :return: The saved count
        """
        self.session.add(counts)
        self.session.flush()
        return counts

    def get_most_recent_count_for_scheme(self, conceptscheme_id):
        """
        Get the newest counts object of a conceptscheme.

        The counts are ordered by ``counted_at`` descending and only the
        first row is fetched. Because the result is read with
        ``scalar_one()``, a conceptscheme without any counts still raises
        instead of returning ``None``.

        :param conceptscheme_id: a conceptscheme id
        :return: the most recent
            :class:`atramhasis.data.models.ConceptschemeCounts` of the scheme
        """
        recent = self.session.execute(
            select(ConceptschemeCounts)
            .filter(ConceptschemeCounts.conceptscheme_id == conceptscheme_id)
            .order_by(desc('counted_at'))
            # Without the limit scalar_one() fails as soon as a scheme has
            # been counted more than once.
            .limit(1)
        ).scalar_one()
        return recent
|
390
|
|
|
|
|
391
|
|
|
|
|
392
|
|
|
class ProviderDataManager(DataManager):
    """A data manager for managing Providers."""

    def get_provider_by_id(self, provider_id) -> Provider:
        """
        Retrieve a single provider from the database.

        :param provider_id: id of the provider
        :return: The provider with the given id
        """
        stmt = select(Provider).where(Provider.id == provider_id)
        return self.session.execute(stmt).scalar_one()

    def get_all_providers(self) -> List[Provider]:
        """
        Retrieve all providers from the database.

        :return: All providers
        """
        result = self.session.execute(select(Provider))
        return result.scalars().all()
|
408
|
|
|
|