From b849eb382f49d1a6e94defcf974dc70bdab71c79 Mon Sep 17 00:00:00 2001
From: Maciej Urbanski <maciej.rooter.urbanski@reef.pl>
Date: Sat, 16 Mar 2024 17:18:50 +0100
Subject: [PATCH 1/2] `b2 ls` without arguments now lists all buckets

---
 b2/_internal/_cli/b2args.py       | 34 ++++++++++++----
 b2/_internal/_utils/uri.py        | 48 ++++++++++++++++------
 b2/_internal/b2v3/registry.py     | 12 +++++-
 b2/_internal/console_tool.py      | 63 ++++++++++++++++++++++-------
 changelog.d/+ls_buckets.added.md  |  1 +
 test/unit/_utils/test_uri.py      | 23 +++++++----
 test/unit/console_tool/test_ls.py | 66 +++++++++++++++++++++++++++++++
 7 files changed, 204 insertions(+), 43 deletions(-)
 create mode 100644 changelog.d/+ls_buckets.added.md
 create mode 100644 test/unit/console_tool/test_ls.py

diff --git a/b2/_internal/_cli/b2args.py b/b2/_internal/_cli/b2args.py
index 7ddb47899..b27cd7686 100644
--- a/b2/_internal/_cli/b2args.py
+++ b/b2/_internal/_cli/b2args.py
@@ -11,6 +11,7 @@
 Utility functions for adding b2-specific arguments to an argparse parser.
 """
 import argparse
+import functools
 
 from b2._internal._cli.arg_parser_types import wrap_with_argument_type_error
 from b2._internal._cli.argcompleters import b2uri_file_completer
@@ -30,21 +31,40 @@ def b2id_or_file_like_b2_uri(value: str) -> B2URIBase:
 
 
 B2ID_OR_B2_URI_ARG_TYPE = wrap_with_argument_type_error(parse_b2_uri)
+B2ID_OR_B2_URI_OR_ALL_BUCKETS_ARG_TYPE = wrap_with_argument_type_error(
+    functools.partial(parse_b2_uri, allow_all_buckets=True)
+)
 B2ID_OR_FILE_LIKE_B2_URI_ARG_TYPE = wrap_with_argument_type_error(b2id_or_file_like_b2_uri)
 
 
-def add_b2id_or_b2_uri_argument(parser: argparse.ArgumentParser, name="B2_URI"):
+def add_b2id_or_b2_uri_argument(
+    parser: argparse.ArgumentParser, name="B2_URI", *, allow_all_buckets: bool = False
+):
     """
     Add B2 URI (b2:// or b2id://) as an argument to the parser.
     B2 URI can point to a bucket optionally with a object name prefix (directory)
     or a file-like object.
+
+    If allow_all_buckets is True, the argument will accept B2 URI pointing to all buckets.
     """
-    parser.add_argument(
-        name,
-        type=B2ID_OR_B2_URI_ARG_TYPE,
-        help="B2 URI pointing to a bucket, directory or a file."
-        "e.g. b2://yourBucket, b2://yourBucket/file.txt, b2://yourBucket/folderName/, or b2id://fileId",
-    ).completer = b2uri_file_completer
+    if allow_all_buckets:
+        argument_spec = parser.add_argument(
+            name,
+            type=B2ID_OR_B2_URI_OR_ALL_BUCKETS_ARG_TYPE,
+            default=None,
+            nargs="?",
+            help="B2 URI pointing to a bucket, directory, file or all buckets. "
+            "e.g. b2://yourBucket, b2://yourBucket/file.txt, b2://yourBucket/folderName/, b2id://fileId, or b2://",
+        )
+    else:
+        argument_spec = parser.add_argument(
+            name,
+            type=B2ID_OR_B2_URI_ARG_TYPE,
+            help="B2 URI pointing to a bucket, directory or a file. "
+            "e.g. b2://yourBucket, b2://yourBucket/file.txt, b2://yourBucket/folderName/, or b2id://fileId",
+        )
+
+    argument_spec.completer = b2uri_file_completer
 
 
 def add_b2id_or_file_like_b2_uri_argument(parser: argparse.ArgumentParser, name="B2_URI"):
diff --git a/b2/_internal/_utils/uri.py b/b2/_internal/_utils/uri.py
index 7e0962e32..cdee5f60e 100644
--- a/b2/_internal/_utils/uri.py
+++ b/b2/_internal/_utils/uri.py
@@ -39,15 +39,13 @@ class B2URI(B2URIBase):
     there is no such thing as "directory" in B2, but it is possible to mimic it by using object names with non-trailing
     slashes.
     To make it possible, it is highly discouraged to use trailing slashes in object names.
+
+    Please note `path` attribute should exclude prefixing slash, i.e. `path` should be empty string for the root of the bucket.
     """
 
     bucket_name: str
     path: str = ""
 
-    def __post_init__(self):
-        path = removeprefix(self.path, "/")
-        self.__dict__["path"] = path  # hack for a custom init in frozen dataclass
-
     def __str__(self) -> str:
         return f"b2://{self.bucket_name}/{self.path}"
 
@@ -82,30 +80,56 @@ def __str__(self) -> str:
         return f"b2id://{self.file_id}"
 
 
-def parse_uri(uri: str) -> Path | B2URI | B2FileIdURI:
+def parse_uri(uri: str, *, allow_all_buckets: bool = False) -> Path | B2URI | B2FileIdURI:
+    """
+    Parse URI.
+
+    :param uri: string to parse
+    :param allow_all_buckets: if True, allow `b2://` without a bucket name to refer to all buckets
+    :return: B2 URI or Path
+    :raises ValueError: if the URI is invalid
+    """
+    if not uri:
+        raise ValueError("URI cannot be empty")
     parsed = urllib.parse.urlsplit(uri)
     if parsed.scheme == "":
         return pathlib.Path(uri)
-    return _parse_b2_uri(uri, parsed)
+    return _parse_b2_uri(uri, parsed, allow_all_buckets=allow_all_buckets)
+
 
+def parse_b2_uri(uri: str, *, allow_all_buckets: bool = False) -> B2URI | B2FileIdURI:
+    """
+    Parse B2 URI.
 
-def parse_b2_uri(uri: str) -> B2URI | B2FileIdURI:
+    :param uri: string to parse
+    :param allow_all_buckets: if True, allow `b2://` without a bucket name to refer to all buckets
+    :return: B2 URI
+    :raises ValueError: if the URI is invalid
+    """
     parsed = urllib.parse.urlsplit(uri)
-    return _parse_b2_uri(uri, parsed)
+    return _parse_b2_uri(uri, parsed, allow_all_buckets=allow_all_buckets)
 
 
-def _parse_b2_uri(uri, parsed: urllib.parse.SplitResult) -> B2URI | B2FileIdURI:
+def _parse_b2_uri(
+    uri, parsed: urllib.parse.SplitResult, allow_all_buckets: bool = False
+) -> B2URI | B2FileIdURI:
     if parsed.scheme in ("b2", "b2id"):
+        path = urllib.parse.urlunsplit(parsed._replace(scheme="", netloc=""))
         if not parsed.netloc:
+            if allow_all_buckets:
+                if path:
+                    raise ValueError(
+                        f"Invalid B2 URI: all buckets URI doesn't allow non-empty path, but {path!r} was provided"
+                    )
+                return B2URI(bucket_name="")
             raise ValueError(f"Invalid B2 URI: {uri!r}")
         elif parsed.password or parsed.username:
             raise ValueError(
-                "Invalid B2 URI: credentials passed using `user@password:` syntax are not supported in URI"
+                "Invalid B2 URI: credentials passed using `user@password:` syntax is not supported in URI"
             )
 
         if parsed.scheme == "b2":
-            path = urllib.parse.urlunsplit(parsed._replace(scheme="", netloc=""))
-            return B2URI(bucket_name=parsed.netloc, path=path)
+            return B2URI(bucket_name=parsed.netloc, path=removeprefix(path, "/"))
         elif parsed.scheme == "b2id":
             return B2FileIdURI(file_id=parsed.netloc)
     else:
diff --git a/b2/_internal/b2v3/registry.py b/b2/_internal/b2v3/registry.py
index c603a1767..09ad7bd51 100644
--- a/b2/_internal/b2v3/registry.py
+++ b/b2/_internal/b2v3/registry.py
@@ -32,24 +32,32 @@ class Ls(B2URIBucketNFolderNameArgMixin, BaseLs):
         {NAME} ls --recursive --withWildcard bucketName "*.[ct]sv"
 
 
-    List all info.txt files from buckets bX, where X is any character:
+    List all info.txt files from directories `b?`, where `?` is any character:
 
     .. code-block::
 
         {NAME} ls --recursive --withWildcard bucketName "b?/info.txt"
 
 
-    List all pdf files from buckets b0 to b9 (including sub-directories):
+    List all pdf files from directories b0 to b9 (including sub-directories):
 
     .. code-block::
 
         {NAME} ls --recursive --withWildcard bucketName "b[0-9]/*.pdf"
 
 
+    List all buckets:
+
+    .. code-block::
+
+        {NAME} ls
+
     Requires capability:
 
     - **listFiles**
+    - **listBuckets** (if bucket name is not provided)
     """
+    ALLOW_ALL_BUCKETS = True
 
 
 B2.register_subcommand(AuthorizeAccount)
diff --git a/b2/_internal/console_tool.py b/b2/_internal/console_tool.py
index eda3eb733..7b91bec10 100644
--- a/b2/_internal/console_tool.py
+++ b/b2/_internal/console_tool.py
@@ -15,6 +15,7 @@
 import tempfile
 
 from b2._internal._cli.autocomplete_cache import AUTOCOMPLETE  # noqa
+from b2._internal._utils.python_compat import removeprefix
 
 AUTOCOMPLETE.autocomplete_from_cache()
 
@@ -657,23 +658,30 @@ def get_b2_uri_from_arg(self, args: argparse.Namespace) -> B2URIBase:
 
 
 class B2URIBucketNFolderNameArgMixin:
+    ALLOW_ALL_BUCKETS: bool = False
+
     @classmethod
     def _setup_parser(cls, parser):
-        parser.add_argument('bucketName').completer = bucket_name_completer
+        parser.add_argument(
+            'bucketName',
+            nargs='?' if cls.ALLOW_ALL_BUCKETS else None,
+        ).completer = bucket_name_completer
         parser.add_argument('folderName', nargs='?').completer = file_name_completer
         super()._setup_parser(parser)
 
     def get_b2_uri_from_arg(self, args: argparse.Namespace) -> B2URI:
-        return B2URI(args.bucketName, args.folderName or '')
+        return B2URI(removeprefix(args.bucketName or '', "b2://"), args.folderName or '')
 
 
 class B2IDOrB2URIMixin:
+    ALLOW_ALL_BUCKETS: bool = False
+
     @classmethod
     def _setup_parser(cls, parser):
-        add_b2id_or_b2_uri_argument(parser)
+        add_b2id_or_b2_uri_argument(parser, allow_all_buckets=cls.ALLOW_ALL_BUCKETS)
         super()._setup_parser(parser)
 
-    def get_b2_uri_from_arg(self, args: argparse.Namespace) -> B2URI:
+    def get_b2_uri_from_arg(self, args: argparse.Namespace) -> B2URI | B2FileIdURI:
         return args.B2_URI
 
 
@@ -2063,13 +2071,17 @@ def _setup_parser(cls, parser):
         super()._setup_parser(parser)
 
     def _run(self, args):
-        buckets = self.api.list_buckets()
-        if args.json:
-            self._print_json(list(buckets))
+        return self.__class__.run_list_buckets(self, json_=args.json)
+
+    @classmethod
+    def run_list_buckets(cls, command: Command, *, json_: bool) -> int:
+        buckets = command.api.list_buckets()
+        if json_:
+            command._print_json(list(buckets))
             return 0
 
         for b in buckets:
-            self._print('%s  %-10s  %s' % (b.id_, b.type_, b.name))
+            command._print(f'{b.id_}  {b.type_:<10}  {b.name}')
         return 0
 
 
@@ -2236,8 +2248,8 @@ def _setup_parser(cls, parser):
         )
         super()._setup_parser(parser)
 
-    def _print_files(self, args):
-        generator = self._get_ls_generator(args)
+    def _print_files(self, args, b2_uri: B2URI | None = None):
+        generator = self._get_ls_generator(args, b2_uri=b2_uri)
 
         for file_version, folder_name in generator:
             self._print_file_version(args, file_version, folder_name)
@@ -2253,9 +2265,9 @@ def _print_file_version(
             name = escape_control_chars(name)
         self._print(name)
 
-    def _get_ls_generator(self, args):
+    def _get_ls_generator(self, args, b2_uri: B2URI | None = None):
+        b2_uri = b2_uri or self.get_b2_uri_from_arg(args)
         try:
-            b2_uri = self.get_b2_uri_from_arg(args)
             yield from self.api.list_file_versions_by_uri(
                 b2_uri,
                 latest_only=not args.versions,
@@ -2303,9 +2315,21 @@ def _setup_parser(cls, parser):
         super()._setup_parser(parser)
 
     def _run(self, args):
+        b2_uri = self.get_b2_uri_from_arg(args)
+        if args.long and args.json:
+            raise CommandError('Cannot use --long and --json options together')
+
+        if not b2_uri or b2_uri == B2URI(""):
+            for option_name in ('long', 'recursive', 'replication'):
+                if getattr(args, option_name, False):
+                    raise CommandError(
+                        f'Cannot use --{option_name} option without specifying a bucket name'
+                    )
+            return ListBuckets.run_list_buckets(self, json_=args.json)
+
         if args.json:
             i = -1
-            for i, (file_version, _) in enumerate(self._get_ls_generator(args)):
+            for i, (file_version, _) in enumerate(self._get_ls_generator(args, b2_uri=b2_uri)):
                 if i:
                     self._print(',', end='')
                 else:
@@ -2380,24 +2404,33 @@ class Ls(B2IDOrB2URIMixin, BaseLs):
         {NAME} ls --recursive --withWildcard "b2://bucketName/*.[ct]sv"
 
 
-    List all info.txt files from buckets bX, where X is any character:
+    List all info.txt files from directories named `b?`, where `?` is any character:
 
     .. code-block::
 
         {NAME} ls --recursive --withWildcard "b2://bucketName/b?/info.txt"
 
 
-    List all pdf files from buckets b0 to b9 (including sub-directories):
+    List all pdf files from directories b0 to b9 (including sub-directories):
 
     .. code-block::
 
         {NAME} ls --recursive --withWildcard "b2://bucketName/b[0-9]/*.pdf"
 
 
+    List all buckets:
+
+    .. code-block::
+
+        {NAME} ls
+
+
     Requires capability:
 
     - **listFiles**
+    - **listBuckets** (if bucket name is not provided)
     """
+    ALLOW_ALL_BUCKETS = True
 
 
 class BaseRm(ThreadsMixin, AbstractLsCommand, metaclass=ABCMeta):
diff --git a/changelog.d/+ls_buckets.added.md b/changelog.d/+ls_buckets.added.md
new file mode 100644
index 000000000..4437346af
--- /dev/null
+++ b/changelog.d/+ls_buckets.added.md
@@ -0,0 +1 @@
+Add support for calling `b2 ls` without arguments to list all buckets.
diff --git a/test/unit/_utils/test_uri.py b/test/unit/_utils/test_uri.py
index 34b706dec..2099d208f 100644
--- a/test/unit/_utils/test_uri.py
+++ b/test/unit/_utils/test_uri.py
@@ -16,14 +16,13 @@
 
 class TestB2URI:
     def test__str__(self):
-        uri = B2URI(bucket_name="testbucket", path="/path/to/file")
+        uri = B2URI(bucket_name="testbucket", path="path/to/file")
         assert str(uri) == "b2://testbucket/path/to/file"
 
     @pytest.mark.parametrize(
         "path, expected",
         [
             ("", True),
-            ("/", True),
             ("path/", True),
             ("path/subpath", None),
         ],
@@ -31,11 +30,10 @@ def test__str__(self):
     def test_is_dir(self, path, expected):
         assert B2URI("bucket", path).is_dir() is expected
 
-    def test__bucket_uris_is_normalized(self):
+    def test__bucket_uris_are_normalized(self):
         alternatives = [
             B2URI("bucket"),
             B2URI("bucket", ""),
-            B2URI("bucket", "/"),
         ]
         assert len(set(alternatives)) == 1
         assert {str(uri) for uri in alternatives} == {"b2://bucket/"}  # normalized
@@ -44,7 +42,6 @@ def test__bucket_uris_is_normalized(self):
         "path, expected_uri_str",
         [
             ("", "b2://bucket/"),
-            ("/", "b2://bucket/"),
             ("path/", "b2://bucket/path/"),
             ("path/subpath", "b2://bucket/path/subpath"),
         ],
@@ -64,6 +61,8 @@ def test_b2fileuri_str():
     [
         ("some/local/path", Path("some/local/path")),
         ("./some/local/path", Path("some/local/path")),
+        ("b2://bucket", B2URI(bucket_name="bucket")),
+        ("b2://bucket/", B2URI(bucket_name="bucket")),
         ("b2://bucket/path/to/dir/", B2URI(bucket_name="bucket", path="path/to/dir/")),
         ("b2id://file123", B2FileIdURI(file_id="file123")),
         ("b2://bucket/wild[card]", B2URI(bucket_name="bucket", path="wild[card]")),
@@ -75,20 +74,30 @@ def test_parse_uri(uri, expected):
     assert parse_uri(uri) == expected
 
 
+def test_parse_uri__allow_all_buckets():
+    assert parse_uri("b2://", allow_all_buckets=True) == B2URI("")
+    with pytest.raises(ValueError) as exc_info:
+        parse_uri("b2:///", allow_all_buckets=True)
+    assert "Invalid B2 URI: all buckets URI doesn't allow non-empty path, but '/' was provided" == str(
+        exc_info.value
+    )
+
+
 @pytest.mark.parametrize(
     "uri, expected_exception_message",
     [
+        ("", "URI cannot be empty"),
         # Test cases for invalid B2 URIs (missing netloc part)
         ("b2://", "Invalid B2 URI: 'b2://'"),
         ("b2id://", "Invalid B2 URI: 'b2id://'"),
         # Test cases for B2 URIs with credentials
         (
             "b2://user@password:bucket/path",
-            "Invalid B2 URI: credentials passed using `user@password:` syntax are not supported in URI",
+            "Invalid B2 URI: credentials passed using `user@password:` syntax is not supported in URI",
         ),
         (
             "b2id://user@password:file123",
-            "Invalid B2 URI: credentials passed using `user@password:` syntax are not supported in URI",
+            "Invalid B2 URI: credentials passed using `user@password:` syntax is not supported in URI",
         ),
         # Test cases for unsupported URI schemes
         ("unknown://bucket/path", "Unsupported URI scheme: 'unknown'"),
diff --git a/test/unit/console_tool/test_ls.py b/test/unit/console_tool/test_ls.py
new file mode 100644
index 000000000..360c22f62
--- /dev/null
+++ b/test/unit/console_tool/test_ls.py
@@ -0,0 +1,66 @@
+######################################################################
+#
+# File: test/unit/console_tool/test_ls.py
+#
+# Copyright 2024 Backblaze Inc. All Rights Reserved.
+#
+# License https://www.backblaze.com/using_b2_code.html
+#
+######################################################################
+######################################################################
+#
+# File: test/unit/console_tool/test_download_file.py
+#
+# Copyright 2023 Backblaze Inc. All Rights Reserved.
+#
+# License https://www.backblaze.com/using_b2_code.html
+#
+######################################################################
+
+import pytest
+
+
+def test_ls__without_bucket_name(b2_cli, bucket_info):
+    expected_output = "bucket_0  allPublic   my-bucket\n"
+
+    b2_cli.run(["ls"], expected_stdout=expected_output)
+    b2_cli.run(["ls", "b2://"], expected_stdout=expected_output)
+
+
+def test_ls__without_bucket_name__json(b2_cli, bucket_info):
+    expected_output = [
+        {
+            "accountId": "account-0",
+            "bucketId": "bucket_0",
+            "bucketInfo": {},
+            "bucketName": "my-bucket",
+            "bucketType": "allPublic",
+            "corsRules": [],
+            "defaultRetention": {
+                "mode": None
+            },
+            "defaultServerSideEncryption": {
+                "mode": "none"
+            },
+            "isFileLockEnabled": False,
+            "lifecycleRules": [],
+            "options": [],
+            "replication": {
+                "asReplicationDestination": None,
+                "asReplicationSource": None,
+            },
+            "revision": 1,
+        }
+    ]
+
+    b2_cli.run(["ls", "--json"], expected_json_in_stdout=expected_output)
+    b2_cli.run(["ls", "--json", "b2://"], expected_json_in_stdout=expected_output)
+
+
+@pytest.mark.parametrize("flag", ["--long", "--recursive", "--replication"])
+def test_ls__without_bucket_name__option_not_supported(b2_cli, bucket_info, flag):
+    b2_cli.run(
+        ["ls", flag],
+        expected_stderr=f"ERROR: Cannot use {flag} option without specifying a bucket name\n",
+        expected_status=1,
+    )

From 02a9e10f2091cb948a19ba522b50d3f157848eb6 Mon Sep 17 00:00:00 2001
From: Maciej Urbanski <maciej.rooter.urbanski@reef.pl>
Date: Sat, 16 Mar 2024 18:00:32 +0100
Subject: [PATCH 2/2] make autocomplete cache test fail easier to debug

---
 b2/_internal/_cli/autocomplete_cache.py   |  6 +++++-
 test/unit/_cli/test_autocomplete_cache.py | 14 +++++++++-----
 2 files changed, 14 insertions(+), 6 deletions(-)

diff --git a/b2/_internal/_cli/autocomplete_cache.py b/b2/_internal/_cli/autocomplete_cache.py
index ca0e517d3..73c75dfcd 100644
--- a/b2/_internal/_cli/autocomplete_cache.py
+++ b/b2/_internal/_cli/autocomplete_cache.py
@@ -100,7 +100,9 @@ def __init__(
     def _is_autocomplete_run(self) -> bool:
         return '_ARGCOMPLETE' in os.environ
 
-    def autocomplete_from_cache(self, uncached_args: dict | None = None) -> None:
+    def autocomplete_from_cache(
+        self, uncached_args: dict | None = None, raise_exc: bool = False
+    ) -> None:
         if not self._is_autocomplete_run():
             return
 
@@ -111,6 +113,8 @@ def autocomplete_from_cache(self, uncached_args: dict | None = None) -> None:
                 parser = self._unpickle(pickle_data)
                 argcomplete.autocomplete(parser, **(uncached_args or {}))
         except Exception:
+            if raise_exc:
+                raise
             # Autocomplete from cache failed but maybe we can autocomplete from scratch
             return
 
diff --git a/test/unit/_cli/test_autocomplete_cache.py b/test/unit/_cli/test_autocomplete_cache.py
index f3cf164f9..4ce1ad738 100644
--- a/test/unit/_cli/test_autocomplete_cache.py
+++ b/test/unit/_cli/test_autocomplete_cache.py
@@ -94,9 +94,14 @@ def argcomplete_result():
     return exit.code, output.getvalue()
 
 
-def cached_complete_result(cache: autocomplete_cache.AutocompleteCache):
+def cached_complete_result(cache: autocomplete_cache.AutocompleteCache, raise_exc: bool = True):
     exit, output = Exit(), io.StringIO()
-    cache.autocomplete_from_cache(uncached_args={'exit_method': exit, 'output_stream': output})
+    cache.autocomplete_from_cache(
+        uncached_args={
+            'exit_method': exit,
+            'output_stream': output
+        }, raise_exc=raise_exc
+    )
     return exit.code, output.getvalue()
 
 
@@ -307,6 +312,5 @@ def test_that_autocomplete_cache_loading_does_not_load_b2sdk(autocomplete_runner
         assert exit == 0
         assert 'get-bucket' in uncached_output
 
-        exit, output = cached_complete_result(cache)
-        assert exit == 0
-        assert output == uncached_output
+        exit, output = cached_complete_result(cache, raise_exc=True)
+        assert (exit, output) == (0, uncached_output)