forked from ThePalaceProject/library-registry
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathauthentication_document.py
487 lines (433 loc) · 18.4 KB
/
authentication_document.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
import json
from collections import defaultdict
from flask_babel import lazy_gettext as _
from sqlalchemy.orm.exc import MultipleResultsFound, NoResultFound
from sqlalchemy.orm.session import Session
from model import Audience, CollectionSummary, Place, ServiceArea, get_one_or_create
from problem_details import INVALID_INTEGRATION_DOCUMENT
class AuthenticationDocument:
"""Parse an Authentication For OPDS document, including the
Library Simplified-specific extensions, extracting all the information
that's of interest to the library registry.
"""
ANONYMOUS_ACCESS_REL = "https://librarysimplified.org/rel/auth/anonymous"
AUTHENTICATION_DOCUMENT_REL = "http://opds-spec.org/auth/document"
MEDIA_TYPE = "application/vnd.opds.authentication.v1.0+json"
COVERAGE_EVERYWHERE = "everywhere"
# The list of color schemes supported by SimplyE.
SIMPLYE_COLOR_SCHEMES = [
"red",
"blue",
"gray",
"gold",
"green",
"teal",
"purple",
]
PUBLIC_AUDIENCE = "public"
AUDIENCES = [
PUBLIC_AUDIENCE,
"educational-primary",
"educational-secondary",
"research",
"print-disability",
"other",
]
def __init__(
self,
_db,
id,
title,
authentication,
service_description,
color_scheme,
collection_size,
public_key,
audiences,
service_area,
focus_area,
links,
place_class=Place,
):
self.id = id
self.title = title
self.authentication = authentication
self.service_description = service_description
self.color_scheme = color_scheme
self.collection_size = collection_size
self.public_key = public_key
self.audiences = audiences or [self.PUBLIC_AUDIENCE]
self.service_area, self.focus_area = self.parse_service_and_focus_area(
_db, service_area, focus_area, place_class
)
self.links = links
self.website = self.extract_link(rel="alternate", require_type="text/html")
self.online_registration = self.has_link(rel="register")
self.root = self.extract_link(
rel="start", prefer_type="application/atom+xml;profile=opds-catalog"
)
logo = self.extract_link(rel="logo")
self.logo = None
self.logo_link = None
if logo:
data = logo.get("href", "")
if data and data.startswith("data:"):
self.logo = data
else:
self.logo_link = logo
self.anonymous_access = False
for flow in self.authentication_flows:
if flow.get("type") == self.ANONYMOUS_ACCESS_REL:
self.anonymous_access = True
break
@property
def authentication_flows(self):
"""Return all valid authentication flows in this document."""
for i in self.authentication:
if not isinstance(i, dict):
# Not a valid authentication flow.
continue
yield i
def extract_link(self, rel, require_type=None, prefer_type=None):
"""Find a link with the given link relation in the main authentication
document.
Does not consider links found in the authentication flows.
:param rel: The link must use this as the link relation.
:param require_type: The link must have this as its type.
:param prefer_type: A link with this type is better than a link of
some other type.
"""
return self._extract_link(self.links, rel, require_type, prefer_type)
def has_link(self, rel):
"""Is there a link with this link relation anywhere in the document?
This checks both the main document and the authentication flows.
:rel: The link must have this link relation.
:return: True if there is a link with the link relation in the document,
False otherwise.
"""
if self._extract_link(self.links, rel):
return True
# We couldn't find a matching link in the main set of
# links, but maybe there's a matching link associated with
# a particular authentication flow.
for flow in self.authentication_flows:
if self._extract_link(flow.get("links", []), rel):
return True
return False
@classmethod
def parse_service_and_focus_area(
cls, _db, service_area, focus_area, place_class=Place
):
if service_area:
service_area = cls.parse_coverage(
_db, service_area, place_class=place_class
)
else:
service_area = [], {}, {}
if focus_area:
focus_area = cls.parse_coverage(_db, focus_area, place_class=place_class)
else:
focus_area = service_area
return service_area, focus_area
@classmethod
def parse_coverage(cls, _db, coverage, place_class=Place):
"""Derive Place objects from an Authentication For OPDS coverage
object (i.e. a value for `service_area` or `focus_area`)
:param coverage: An Authentication For OPDS coverage object.
:param place_class: In unit tests, pass in a mock replacement
for the Place class here.
:return: A 3-tuple (places, unknown, ambiguous).
`places` is a list of Place model objects.
`unknown` is a coverage object representing the subset of
`coverage` that had no corresponding Place objects. This
object will not be used for any purpose except error display.
`ambiguous` is a coverage object representing the subset of
`coverage` that had more than one corresponding Place
object. This object will not be used for any purpose except
error display.
"""
place_objs = []
unknown = defaultdict(list)
ambiguous = defaultdict(list)
if coverage == cls.COVERAGE_EVERYWHERE:
# This library covers the entire universe! No need to
# parse anything.
place_objs.append(place_class.everywhere(_db))
coverage = dict() # Do no more processing
elif not isinstance(coverage, dict):
# The coverage is not in { nation: place } format.
# Convert it into that format using the default nation.
default_nation = place_class.default_nation(_db)
if default_nation:
coverage = {default_nation.abbreviated_name: coverage}
else:
# Oops, that's not going to work. We don't know which
# nation this place is in. Return a coverage object
# that makes it semi-clear what the problem is.
unknown["??"] = coverage
coverage = dict() # Do no more processing
for nation, places in list(coverage.items()):
try:
nation_obj = place_class.lookup_one_by_name(
_db,
nation,
place_type=Place.NATION,
)
if places == cls.COVERAGE_EVERYWHERE:
# This library covers an entire nation.
place_objs.append(nation_obj)
else:
# This library covers a list of places within a
# nation.
if isinstance(places, str):
# This is invalid -- you're supposed to always
# pass in a list -- but we can support it.
places = [places]
for place in places:
try:
place_obj = nation_obj.lookup_inside(place)
if place_obj:
# We found it.
place_objs.append(place_obj)
else:
# We couldn't find any place with this name.
unknown[nation].append(place)
except MultipleResultsFound:
# The place was ambiguously named.
ambiguous[nation].append(place)
except MultipleResultsFound:
# A nation was ambiguously named -- not very likely.
ambiguous[nation] = places
except NoResultFound:
# Either this isn't a recognized nation
# or we don't have a geography for it.
unknown[nation] = places
return place_objs, unknown, ambiguous
@classmethod
def _extract_link(cls, links, rel, require_type=None, prefer_type=None):
if require_type and prefer_type:
raise ValueError(
"At most one of require_type and prefer_type may be specified."
)
if not links:
# There are no links, period.
return None
good_enough = None
if not isinstance(links, list):
# Invalid links object; ignore it.
return
for link in links:
if rel != link.get("rel"):
continue
if not require_type and not prefer_type:
# Any link with this relation will work. Return the
# first one we see.
return link
# Beyond this point, either require_type or prefer_type is
# set, so the type of the link becomes relevant.
type = link.get("type", "")
if type:
if (
require_type
and type.startswith(require_type)
or prefer_type
and type.startswith(prefer_type)
):
# If we have a require_type, this means we have
# met the requirement. If we have a prefer_type,
# we will not find a better link than this
# one. Return it immediately.
return link
if not require_type and not good_enough:
# We would prefer a link of a certain type, but if it
# turns out there is no such link, we will accept the
# first link of the given type.
good_enough = link
return good_enough
@classmethod
def from_string(cls, _db, s, place_class=Place):
data = json.loads(s)
return cls.from_dict(_db, data, place_class)
@classmethod
def from_dict(cls, _db, data, place_class=Place):
return AuthenticationDocument(
_db,
id=data.get("id", None),
title=data.get("title", data.get("name", None)),
authentication=data.get("authentication", []),
service_description=data.get("service_description", None),
color_scheme=data.get("color_scheme"),
collection_size=data.get("collection_size"),
public_key=data.get("public_key"),
audiences=data.get("audience"),
service_area=data.get("service_area"),
focus_area=data.get("focus_area"),
links=data.get("links", []),
place_class=place_class,
)
def update_library(self, library):
"""Modify a library to reflect the current state of this
AuthenticationDocument.
:param library: A Library.
:return: A ProblemDetail if there's a problem, otherwise None.
"""
library.name = self.title
library.description = self.service_description
library.online_registration = self.online_registration
library.anonymous_access = self.anonymous_access
problem = self.update_audiences(library)
if not problem:
problem = self.update_service_areas(library)
if not problem:
problem = self.update_collection_size(library)
return problem
def update_audiences(self, library):
return self._update_audiences(library, self.audiences)
@classmethod
def _update_audiences(self, library, audiences):
if not audiences:
# Most of the libraries in this system are open to at
# least some subset of the general public.
audiences = [Audience.PUBLIC]
if isinstance(audiences, str):
# This is invalid but we can easily support it.
audiences = [audiences]
if not isinstance(audiences, list):
return INVALID_INTEGRATION_DOCUMENT.detailed(
_("'audience' must be a list: %(audiences)r", audiences=audiences)
)
# Unrecognized audiences become Audience.OTHER.
filtered_audiences = set()
for audience in audiences:
if audience in Audience.KNOWN_AUDIENCES:
filtered_audiences.add(audience)
else:
filtered_audiences.add(Audience.OTHER)
audiences = filtered_audiences
audience_objs = []
_db = Session.object_session(library)
for audience in audiences:
audience_obj = Audience.lookup(_db, audience)
audience_objs.append(audience_obj)
library.audiences = audience_objs
def update_service_areas(self, library):
"""Update a library's ServiceAreas based on the contents of this
document.
"""
return self.set_service_areas(library, self.service_area, self.focus_area)
@classmethod
def set_service_areas(cls, library, service_area, focus_area):
"""Replace a library's ServiceAreas with specific new values."""
service_areas = []
# What service_area or focus_area looks like when
# no input was specified.
empty = [[], {}, {}]
if focus_area == empty and service_area == empty:
# A library can't lose its entire coverage area -- it's
# more likely that the coverage area was grandfathered in
# and it just isn't set on the remote side.
#
# Do nothing.
return
if focus_area == empty and service_area != empty or service_area == focus_area:
# Service area and focus area are the same, either because
# they were defined that way explicitly or because focus
# area was not specified.
#
# Register the service area as the focus area and call it
# a day.
problem = cls._update_service_areas(
library, service_area, ServiceArea.FOCUS, service_areas
)
if problem:
return problem
else:
# Service area and focus area are different.
problem = cls._update_service_areas(
library, service_area, ServiceArea.ELIGIBILITY, service_areas
)
if problem:
return problem
problem = cls._update_service_areas(
library, focus_area, ServiceArea.FOCUS, service_areas
)
if problem:
return problem
# Delete any ServiceAreas associated with the given library
# which are not mentioned in the list we just gathered.
library.service_areas = service_areas
@classmethod
def _update_service_areas(cls, library, areas, type, service_areas):
"""Update a Library's ServiceAreas with a new set based on
`areas`.
:param library: A Library.
:param areas: A list [place_objs, unknown, ambiguous]
of the sort returned by `parse_coverage()`.
:param type: A value to use for `ServiceAreas.type`.
:param service_areas: All ServiceAreas that became associated
with the Library will be inserted into this list.
:return: A ProblemDetailDocument if any of the service areas could
not be transformed into Place objects. Otherwise, None.
"""
_db = Session.object_session(library)
places, unknown, ambiguous = areas
if unknown or ambiguous:
msgs = []
if unknown:
msgs.append(
str(
_(
"The following service area was unknown: %(service_area)s.",
service_area=json.dumps(unknown),
)
)
)
if ambiguous:
msgs.append(
str(
_(
"The following service area was ambiguous: %(service_area)s.",
service_area=json.dumps(ambiguous),
)
)
)
return INVALID_INTEGRATION_DOCUMENT.detailed(" ".join(msgs))
for place in places:
service_area, is_new = get_one_or_create(
_db, ServiceArea, library_id=library.id, place_id=place.id, type=type
)
service_areas.append(service_area)
def update_collection_size(self, library):
return self._update_collection_size(library, self.collection_size)
@classmethod
def _update_collection_size(self, library, sizes):
if isinstance(sizes, str) or isinstance(sizes, int):
# A single collection with no known language.
sizes = {None: sizes}
if sizes is None:
# No collections are specified.
sizes = {}
if not isinstance(sizes, dict):
return INVALID_INTEGRATION_DOCUMENT.detailed(
_(
"'collection_size' must be a number or an object mapping language codes to numbers"
)
)
new_collections = set()
unknown_size = 0
try:
for language, size in list(sizes.items()):
summary = CollectionSummary.set(library, language, size)
if summary.language is None:
unknown_size += summary.size
new_collections.add(summary)
if unknown_size:
# We found one or more collections in languages we
# didn't recognize. Set the total size of this collection
# as the size of a collection with unknown language.
new_collections.add(CollectionSummary.set(library, None, unknown_size))
except ValueError as e:
return INVALID_INTEGRATION_DOCUMENT.detailed(str(e))
# Destroy any CollectionSummaries representing collections
# no longer associated with this library.
library.collections = list(new_collections)