From 8402fae95ebf909b8f455c207de50acd90c56517 Mon Sep 17 00:00:00 2001 From: Ward Van Heddeghem Date: Thu, 22 Feb 2024 17:50:18 +0100 Subject: [PATCH 1/7] Fix forgotten inlline return --- src/mijnbib/login_handlers.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/mijnbib/login_handlers.py b/src/mijnbib/login_handlers.py index bbb5d73..0805b3a 100644 --- a/src/mijnbib/login_handlers.py +++ b/src/mijnbib/login_handlers.py @@ -125,7 +125,7 @@ def _log_in(self): ) if "/mijn-bibliotheek/overzicht" in oauth_location_url: _log.info("Already authenticated. No need to log in again.") - return + return response # better for extensibility (i.e. sOlid) # (2) Authorize based on Location url (get session id) response = self._s.get(oauth_location_url, allow_redirects=False) From 6b68a72befc2db42792077dd40cf06880466df1f Mon Sep 17 00:00:00 2001 From: Ward Van Heddeghem Date: Mon, 26 Feb 2024 19:14:09 +0100 Subject: [PATCH 2/7] Raise tempsiteerror at login when 5xx (part 3) --- src/mijnbib/login_handlers.py | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/src/mijnbib/login_handlers.py b/src/mijnbib/login_handlers.py index 0805b3a..5b37814 100644 --- a/src/mijnbib/login_handlers.py +++ b/src/mijnbib/login_handlers.py @@ -164,6 +164,10 @@ def _log_in(self): _log.debug(f"login (3) hint : {hint}") if response.status_code == 200: raise AuthenticationError("Login not accepted. Correct credentials?") + if response.status_code >= 500: # we've observed 500 + raise TemporarySiteError( + f"Expected status code 303 during log in. Got '{response.status_code}'" + ) if response.status_code != 303: raise IncompatibleSourceError( f"Expected status code 303 during log in. Got '{response.status_code}'", From 8b6f7815c0c9fd52233d3ab1fb0bbfea8be46f1f Mon Sep 17 00:00:00 2001 From: "Laptop-Ward-o2o\\Ward" Date: Tue, 5 Mar 2024 13:29:00 +0100 Subject: [PATCH 3/7] Workaround for changed login page (by form. Oauth is still broken) --- src/mijnbib/login_handlers.py | 2 ++ tests/test_mijnbibliotheek.py | 7 +++++++ 2 files changed, 9 insertions(+) diff --git a/src/mijnbib/login_handlers.py b/src/mijnbib/login_handlers.py index 5b37814..c4e5a4f 100644 --- a/src/mijnbib/login_handlers.py +++ b/src/mijnbib/login_handlers.py @@ -45,6 +45,8 @@ def _log_in(self): _log.debug("Opening login page ... ") response = self._br.open(self._url, timeout=TIMEOUT) html_string_start_page = response.read().decode("utf-8") # type:ignore + # TODO Workaround for mechanize.BrowserStateError: not viewing HTML + self._br._factory.is_html = True self._br.select_form(nr=0) self._br["email"] = self._username self._br["password"] = self._pwd diff --git a/tests/test_mijnbibliotheek.py b/tests/test_mijnbibliotheek.py index 588d084..5fd0304 100644 --- a/tests/test_mijnbibliotheek.py +++ b/tests/test_mijnbibliotheek.py @@ -19,9 +19,16 @@ def creds_config(scope="module"): yield dict(**config.defaults()) +class X(str): + pass + + class FakeMechanizeBrowser: def __init__(self, form_response: str) -> None: self._form_response = form_response.encode("utf8") + # trick for nested prop, from https://stackoverflow.com/a/35190607/50899 + self._factory = X("_factory") + self._factory.is_html = None # can be whatever def __setitem__(self, key, value): pass From 6e6d2a711cdcb8e6cdc00810bd29afe09cef852c Mon Sep 17 00:00:00 2001 From: Ward Van Heddeghem Date: Tue, 5 Mar 2024 21:30:55 +0100 Subject: [PATCH 4/7] Extend info on content-type workaround --- src/mijnbib/login_handlers.py | 6 +++++- 1 file changed, 5 insertions(+), 1 deletion(-) diff --git a/src/mijnbib/login_handlers.py b/src/mijnbib/login_handlers.py index c4e5a4f..47d4ae9 100644 --- a/src/mijnbib/login_handlers.py +++ b/src/mijnbib/login_handlers.py @@ -45,7 +45,11 @@ def _log_in(self): _log.debug("Opening login page ... ") response = self._br.open(self._url, timeout=TIMEOUT) html_string_start_page = response.read().decode("utf-8") # type:ignore - # TODO Workaround for mechanize.BrowserStateError: not viewing HTML + # Workaround for mechanize.BrowserStateError: not viewing HTML + # because suddenly (March 2024) Content-Type header is "application/octet-stream;charset=UTF-8" + # which is not recognized as html by mechanize + # Alternative is to configure the browser instance with + # self._br.set_header("Accept", "text/html") self._br._factory.is_html = True self._br.select_form(nr=0) self._br["email"] = self._username From ffa85e675613e62f1d02631f964f7bc54120893a Mon Sep 17 00:00:00 2001 From: Ward Van Heddeghem Date: Tue, 5 Mar 2024 22:28:20 +0100 Subject: [PATCH 5/7] Add some debug separators --- src/mijnbib/login_handlers.py | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/src/mijnbib/login_handlers.py b/src/mijnbib/login_handlers.py index 47d4ae9..da4f26a 100644 --- a/src/mijnbib/login_handlers.py +++ b/src/mijnbib/login_handlers.py @@ -106,6 +106,7 @@ def _log_in(self): # GET https://gent.bibliotheek.be/mijn-bibliotheek/aanmelden # example response: # header Location: https://mijn.bibliotheek.be/openbibid/rest/auth/authorize?hint=login&oauth_callback=https://gent.bibliotheek.be/my-library/login/callback&oauth_token=5abee3c0f5c04beead64d8e625ead0e7&uilang=nl + _log.debug("----") response = self._s.get(self._url, allow_redirects=False) _log.debug(f"login (1) status code : {response.status_code}") _log.debug(f"login (1) headers : {response.headers}") @@ -134,6 +135,7 @@ def _log_in(self): return response # better for extensibility (i.e. sOlid) # (2) Authorize based on Location url (get session id) + _log.debug("----") response = self._s.get(oauth_location_url, allow_redirects=False) _log.debug(f"login (2) status code : {response.status_code}") _log.debug(f"login (2) headers : {response.headers}") @@ -155,6 +157,7 @@ def _log_in(self): "email": self._username, "password": self._pwd, } + _log.debug("----") response = self._s.post(url, data=data, allow_redirects=False) _log.debug(f"login (3) status code : {response.status_code}") _log.debug(f"login (3) headers : {response.headers}") @@ -181,6 +184,7 @@ def _log_in(self): ) # (4) Call login callback based on Location url + _log.debug("----") response = self._s.get(login_location_url, allow_redirects=False) _log.debug(f"login (4) status code : {response.status_code}") _log.debug(f"login (4) headers : {response.headers}") From 943aa5475ff670e77b7cae58adb6cd06b0fb4831 Mon Sep 17 00:00:00 2001 From: Ward Van Heddeghem Date: Tue, 5 Mar 2024 22:38:43 +0100 Subject: [PATCH 6/7] Bump to v0.5.5 and oauth remark in readme --- README.md | 6 ++++-- changelog.md | 5 +++++ pyproject.toml | 2 +- 3 files changed, 10 insertions(+), 3 deletions(-) diff --git a/README.md b/README.md index 56f6d0c..7a48741 100644 --- a/README.md +++ b/README.md @@ -58,12 +58,14 @@ Tenslotte, via de commandline kan je de module ook als volgt aanroepen: ## Opmerkingen - **Authenticatie**. Inloggen bij de bibliotheek.be website gebeurt standaard - via een webformulier. Het is ook mogelijk om de snellere `oauth` manier te - gebruiken; dit is nog experimenteel. + via een webformulier. Het is ook mogelijk om de `oauth` manier te gebruiken; + maar dit is nog experimenteel. mb = MijnBibliotheek(username, password, login_by="oauth") accounts = mb.get_accounts() + ! Opmerking: De oauth flow is sinds maart 2024 broken, en vereist nog een aanpassing. + - **Foutafhandeling**. Afhankelijk van de toepassing, kan het aangeraden zijn om foutafhandeling te voorzien. Het bestand `errors.py` bevat de lijst van Mijnbib-specifieke exceptions. De docstrings van de publieke methods bevatten diff --git a/changelog.md b/changelog.md index d7a58a5..f72f621 100644 --- a/changelog.md +++ b/changelog.md @@ -2,6 +2,11 @@ new: new feature / impr: improvement / fix: bug fix +## v0.5.5 - 2024-03-05 + +- fix: broken login (form) because of change at site. + Note: alternative oauth login still broken. + ## v0.5.4 - 2024-02-21 - impr: improve extensibility of oauth login handler diff --git a/pyproject.toml b/pyproject.toml index 6526e7c..5bc2857 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta" [project] name = "mijnbib" -version = "0.5.4" +version = "0.5.5" description = "Python API voor de website mijn.bibliotheek.be" readme = "README.md" authors = [{ name = "Ward Van Heddeghem", email = "wardvh@fastmail.fm" }] From 93b4ea2f5c089f87ebeedcf50174ee93f7cb2eb0 Mon Sep 17 00:00:00 2001 From: Ward Van Heddeghem Date: Tue, 5 Mar 2024 22:41:30 +0100 Subject: [PATCH 7/7] Update changelog with forgotten change --- changelog.md | 1 + 1 file changed, 1 insertion(+) diff --git a/changelog.md b/changelog.md index f72f621..fc72f3b 100644 --- a/changelog.md +++ b/changelog.md @@ -6,6 +6,7 @@ new: new feature / impr: improvement / fix: bug fix - fix: broken login (form) because of change at site. Note: alternative oauth login still broken. +- impr: raise TemporarySiteError at oauth login when 5xx (part 3) ## v0.5.4 - 2024-02-21