From 08d7bab3ffa831bde7131151712a54154a6073e6 Mon Sep 17 00:00:00 2001 From: Dana Sherson Date: Sat, 25 Nov 2023 21:30:33 +1300 Subject: [PATCH] Update from writing doc --- .github/workflows/ci.yml | 2 +- .rubocop.yml | 5 +- lib/path_list.rb | 395 ++++----------------------------------- spec/path_list_spec.rb | 10 +- spec/spec_helper.rb | 2 +- 5 files changed, 44 insertions(+), 370 deletions(-) diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml index 3539cac..f90cdf7 100644 --- a/.github/workflows/ci.yml +++ b/.github/workflows/ci.yml @@ -7,7 +7,7 @@ jobs: strategy: fail-fast: false matrix: - ruby: [2.7, '3.0', 3.1, 3.2, ruby-head, jruby-9.4, jruby-head] + ruby: ['3.0', 3.1, 3.2, ruby-head, jruby-9.4, jruby-head] platform: [ubuntu, windows, macos] continue-on-error: ${{ endsWith(matrix.ruby, 'head') }} runs-on: ${{matrix.platform}}-latest diff --git a/.rubocop.yml b/.rubocop.yml index d4df66c..37e7806 100644 --- a/.rubocop.yml +++ b/.rubocop.yml @@ -175,8 +175,11 @@ Style/Alias: Style/CollectionMethods: Enabled: true +Style/Documentation: + Enabled: false + Style/DocumentationMethod: - Enabled: true + Enabled: false # this can mess with the balance of symmetric cases Style/IfInsideElse: diff --git a/lib/path_list.rb b/lib/path_list.rb index 61f8d79..a01da15 100644 --- a/lib/path_list.rb +++ b/lib/path_list.rb @@ -1,26 +1,5 @@ # frozen_string_literal: true -# Build a `PathList` by chaining {#gitignore} {#only}, {#ignore}, -# and combining these chains with {#union}, or {#intersection} -# -# - Yield each of the files not ignored by your PathList with {#each} or any other enumerable methods. -# - Test if a file path would be yielded by this PathList with {#include?}. -# - Test if a file or directory path would hypothetically be matchable by your PathList with {#match?} -# -# **Note:** If you want use the same PathList match rules more than once, -# save the pathlist to a variable to avoid having to read and parse the patterns over and over again -# -# @example -# PathList.gitignore.each { |file| puts "#{file} is not ignored by git" } -# PathList.gitignore.filter_map { |file| ::File.read(file) if ::File.readable?(file) } -# PathList.only('*.rb', '!config/').each { |file| puts "#{file} is a ruby file not in the config directory" } -# PathList.ignore(patterns_from_file: '.dockerignore').each { |file| puts "#{file} would be copied with COPY" } -# PathList.intersection(PathList.gitignore, PathList.union(PathList.only('*.rb'), PathList.only('*.py'))) -# -# PathList.gitignore.include?("is/this/file/gitignored") -# PathList.gitignore.match?("is/this") -# PathList.gitignore.match?("is/this/hypothetical/directory", directory: true) -# class PathList class Error < StandardError; end @@ -28,6 +7,31 @@ class Error < StandardError; end Autoloader.autoload(self) include ::Enumerable + extend ::Enumerable + + class << self + def gitignore(root: nil, config: true) + new.gitignore(root: root, config: config) + end + + def ignore(*patterns, patterns_from_file: nil, format: :gitignore, root: nil) + new.ignore(*patterns, patterns_from_file: patterns_from_file, format: format, root: root) + end + + def only(*patterns, patterns_from_file: nil, format: :gitignore, root: nil) + new.only(*patterns, patterns_from_file: patterns_from_file, format: format, root: root) + end + + def union(path_list, *path_lists) + path_list.union(*path_lists) + end + + def intersection(path_list, *path_lists) + path_list.intersection(*path_lists) + end + + alias_method :all, :new + end def initialize @matcher = Matcher::Allow @@ -35,128 +39,10 @@ def initialize @file_matcher = nil end - # @!group Gitignore methods - - # Return a new PathList that filters files using .gitignore files. - # - # This matcher aims for fidelity with `git ls-files`, - # reading the configured core.excludesFile and .gitignore files in subdirectories - # - # @param root [String, Pathname, #to_s, nil] - # The git repo root. When nil, PathList will search up from the current directory like git does for a directory - # containing `.git/`. If it doesn't find anything, it will default to the current directory. - # @param config [Boolean] - # Whether to load the configured `core.excludesFile`. - # When this is false this will only load patterns in `.gitignore` files in the `root:` directory and its children, - # and the `.git/info/exclude` file in the `root:` directory. When true it will also load config files in all the - # locations that git would also look, to find the core.excludesFile. - # @return [PathList] - # a new PathList - # @example - # PathList.only('*.rb').gitignore # can be chained - # PathList.gitignore(root: Dir.pwd) # don't look for a .git directory - # PathList.gitignore(root: '../../') # the project root is two directories up - # PathList.gitignore(config: false) # don't look for a configured core.excludesFile - # @see #gitignore - # @see https://git-scm.com/docs/gitignore#_pattern_format - def self.gitignore(root: nil, config: true) - new.gitignore(root: root, config: config) - end - - # Return a new PathList that filters files using .gitignore files. - # - # This matcher aims for fidelity with `git ls-files`, - # reading the configured core.excludesFile and .gitignore files in subdirectories - # - # @param root [String, Pathname, #to_s, nil] - # The git repo root. When nil, PathList will search up from the current directory like git does for a directory - # containing `.git/`. If it doesn't find anything, it will default to the current directory. - # @param config [Boolean] - # Whether to load the configured `core.excludesFile`. - # When this is false this will only load patterns in `.gitignore` files in the `root:` directory and its children, - # and the `.git/info/exclude` file in the `root:` directory. When true it will also load config files in all the - # locations that git would also look, to find the core.excludesFile. - # @return [PathList] - # a new PathList - # @example - # PathList.only('*.rb').gitignore # can be chained - # PathList.gitignore(root: Dir.pwd) # don't look for a .git directory - # PathList.gitignore(root: '../../') # the project root is two directories up - # PathList.gitignore(config: false) # don't look for a configured core.excludesFile - # @see .gitignore - # @see https://git-scm.com/docs/gitignore#_pattern_format def gitignore(root: nil, config: true) new_and_matcher(Gitignore.build(root: root, config: config)) end - # @!group Ignore methods - - # Return a new PathList that filters out files using the given patterns. - # - # @overload ignore(*patterns, format: :gitignore, root: nil) - # @param patterns [Array] - # The list of patterns. Within an array, or as a line-separated string. - # The individual pattern format depends on the `format:` param - # @param root [String, Pathname, #to_s, nil] - # The root for any patterns that need it (e.g. gitignore patterns starting with `/`), - # defaults to the current directory when nil. - # @param format [:gitignore, :glob_gitignore, :exact, :shebang] - # The format of the rules - # @return [PathList] - # a new PathList - # @overload ignore(patterns_from_file:, format: :gitignore, root: nil) - # @param patterns_from_file [String, Pathname, #to_s] - # A file to read the list of patterns from, with each pattern on its own line - # @param root [String, Pathname, #to_s, nil] - # The root for any patterns that need it (e.g. gitignore patterns starting with `/`), - # when nil, defaults to the directory containing the patterns_from_file file. - # @param format [:gitignore, :glob_gitignore, :exact, :shebang] - # The format of the patterns, see {PatternParser::Gitignore}, - # {PatternParser::GlobGitignore}, - # {PatternParser::ExactPath}, - # {PatternParser::Shebang} - # @return [PathList] - # a new PathList - # @example - # PathList.ignore('*.md', root: './docs').ignore(patterns_from_file: '.dockerignore') - # PathList.ignore('/bin').ignore("ruby", format: :shebang) - # PathList.gitignore.ignore('spec', format: :exact) - # @see #ignore - def self.ignore(*patterns, patterns_from_file: nil, format: :gitignore, root: nil) - new.ignore(*patterns, patterns_from_file: patterns_from_file, format: format, root: root) - end - - # Return a new PathList that filters out files using the given patterns. - # - # @overload ignore(*patterns, format: :gitignore, root: nil) - # @param patterns [Array] - # The list of patterns. Within an array, or as a line-separated string. - # The individual pattern format depends on the `format:` param - # @param root [String, Pathname, #to_s, nil] - # The root for any patterns that need it (e.g. gitignore patterns starting with `/`), - # defaults to the current directory when nil. - # @param format [:gitignore, :glob_gitignore, :exact, :shebang] - # The format of the patterns, see {PatternParser::Gitignore}, - # {PatternParser::GlobGitignore}, - # {PatternParser::ExactPath}, - # {PatternParser::Shebang} - # @return [PathList] - # a new PathList - # @overload ignore(patterns_from_file:, format: :gitignore, root: nil) - # @param patterns_from_file [String, Pathname, #to_s] - # A file to read the list of patterns from, with each pattern on its own line - # @param root [String, Pathname, #to_s, nil] - # The root for any patterns that need it (e.g. gitignore patterns starting with `/`), - # when nil, defaults to the directory containing the patterns_from_file file. - # @param format [:gitignore, :glob_gitignore, :exact, :shebang] - # The format of the rules - # @return [PathList] - # a new PathList - # @example - # PathList.ignore('*.md', root: './docs').ignore(patterns_from_file: '.dockerignore') - # PathList.ignore('/bin').ignore("ruby", format: :shebang) - # PathList.gitignore.ignore('spec', format: :exact) - # @see .ignore def ignore(*patterns, patterns_from_file: nil, format: :gitignore, root: nil) new_and_matcher( PatternParser.build( @@ -165,74 +51,6 @@ def ignore(*patterns, patterns_from_file: nil, format: :gitignore, root: nil) ) end - # @!group Only methods - - # Return a new PathList that selects only those files that match given patterns. - # - # @overload only(*patterns, format: :gitignore, root: nil) - # @param patterns [Array, Array>, String] - # The list of patterns. Within an array, or as a line-separated string. - # The individual pattern format depends on the `format:` param - # @param root [String, Pathname, #to_s, nil] - # The root for any patterns that need it (e.g. gitignore-style patterns starting with `/`), - # defaults to the current directory when nil. - # @param format [:gitignore, :glob_gitignore, :exact, :shebang] - # The format of the patterns, see {PatternParser::Gitignore}, - # {PatternParser::GlobGitignore}, - # {PatternParser::ExactPath}, - # {PatternParser::Shebang} - # @return [PathList] - # a new PathList - # @overload only(patterns_from_file:, format: :gitignore, root: nil) - # @param patterns_from_file [String, Pathname, #to_s] - # A file to read the list of patterns from, with each pattern on its own line - # @param root [String, Pathname, #to_s, nil] - # The root for any patterns that need it (e.g. gitignore-style patterns starting with `/`), - # when nil, defaults to the directory containing the patterns_from_file file. - # @param format [:gitignore, :glob_gitignore, :exact, :shebang] - # The format of the rules - # @return [PathList] - # a new PathList - # @example - # PathList.only('*.md', root: './docs').ignore('CHANGELOG.md') - # PathList.only(patterns_from_file: './files_to_copy.txt', exact: true) - # PathList.only(['bin', 'lib', 'exe', 'README.md', 'LICENSE']) - # @see #only - def self.only(*patterns, patterns_from_file: nil, format: :gitignore, root: nil) - new.only(*patterns, patterns_from_file: patterns_from_file, format: format, root: root) - end - - # Return a new PathList that selects only those files that match given patterns. - # - # @overload only(*patterns, format: :gitignore, root: nil) - # @param patterns [Array, Array>, String] - # The list of patterns. Within an array, or as a line-separated string. - # The individual pattern format depends on the `format:` param - # @param root [String, Pathname, #to_s, nil] - # The root for any patterns that need it (e.g. gitignore-style patterns starting with `/`), - # defaults to the current directory when nil. - # @param format [:gitignore, :glob_gitignore, :exact, :shebang] - # The format of the patterns, see {PatternParser::Gitignore}, - # {PatternParser::GlobGitignore}, - # {PatternParser::ExactPath}, - # {PatternParser::Shebang} - # @return [PathList] - # a new PathList - # @overload only(patterns_from_file:, format: :gitignore, root: nil) - # @param patterns_from_file [String, Pathname, #to_s] - # A file to read the list of patterns from, with each pattern on its own line - # @param root [String, Pathname, #to_s, nil] - # The root for any patterns that need it (e.g. gitignore-style patterns starting with `/`), - # when nil, defaults to the directory containing the patterns_from_file file. - # @param format [:gitignore, :glob_gitignore, :exact, :shebang] - # The format of the rules - # @return [PathList] - # a new PathList - # @example - # PathList.only('*.md', root: './docs').ignore('CHANGELOG.md') - # PathList.only(patterns_from_file: './files_to_copy.txt', exact: true) - # PathList.only(['bin', 'lib', 'exe', 'README.md', 'LICENSE']) - # @see .only def only(*patterns, patterns_from_file: nil, format: :gitignore, root: nil) new_and_matcher( PatternParser.build( @@ -241,126 +59,26 @@ def only(*patterns, patterns_from_file: nil, format: :gitignore, root: nil) ) end - # @!group Union methods - - # Return a new PathList that matches any of path_lists. - # - # @param path_lists [*PathList] - # @return [PathList] - # a new PathList - # @example - # PathList.union(PathList.only("*.ts"), PathList.only("*.tsx")) - # # is equivalent to - # PathList.only(["*.ts", "*.tsx"]) - # @see #union - # @see #| - def self.union(path_list, *path_lists) - path_list.union(*path_lists) - end - - # Return a new PathList that matches the receiver OR any of path_lists. - # - # @param path_lists [*PathList] - # @return [PathList] - # a new PathList - # @example - # PathList.gitignore.only(["*.js", "*.jsx"]).union(PathList.only("*.ts"), PathList.only("*.tsx")) - # # is equivalent to - # PathList.gitignore.only(["*.js", "*.jsx", "*.ts", "*.tsx"]) - # @see .union - # @see #| - def union(*path_lists) + def union(path_list, *path_lists) new_with_matcher( - Matcher::Any.build([@matcher, *path_lists.map { |l| l.matcher }]) # rubocop:disable Style/SymbolProc + Matcher::Any.build([@matcher, path_list.matcher, *path_lists.map { |l| l.matcher }]) # rubocop:disable Style/SymbolProc ) end - # Return a new PathList that matches the receiver OR other. - # - # @param other [PathList] - # @return [PathList] - # a new PathList - # @example - # PathList.gitignore.only("*.rb") | PathList.only("*.sh") - # # is equivalent to - # PathList.gitignore.only(["*.rb", "*.sh"]) - # @see .union - # @see #union def |(other) union(other) end - # @!group Intersection methods - - # Return a new PathList that matches all of path_lists. - # - # @param path_lists [*PathList] - # @return [PathList] - # a new PathList - # @example - # PathList.intersection(PathList.only("*.rb"), PathList.ignore("/vendor/")) - # # is equivalent to - # PathList.only("*.rb").ignore("/vendor/") - # @see #intersection - # @see #& - def self.intersection(*path_lists) - new.intersection(*path_lists) - end - - # Return a new PathList that matches the receiver AND all of path_lists. - # - # @param path_lists [*PathList] - # @return [PathList] - # a new PathList - # @example - # PathList.gitignore.intersection(PathList.only("*.rb"), PathList.ignore("/vendor/")) - # # is equivalent to - # PathList.gitignore.only("*.rb").ignore("/vendor/") - # @see .intersection - # @see #& - def intersection(*path_lists) - new_and_matcher(Matcher::All.build(path_lists.map { |l| l.matcher })) # rubocop:disable Style/SymbolProc + def intersection(path_list, *path_lists) + new_with_matcher( + Matcher::All.build([@matcher, path_list.matcher, path_lists.map { |l| l.matcher }]) # rubocop:disable Style/SymbolProc + ) end - # Return a new PathList that matchers the receiver AND other. - # - # @param other [PathList] - # @return [PathList] - # a new PathList - # @example - # PathList.gitignore.only("*.rb") & PathList.ignore("/vendor/") - # # is equivalent to - # PathList.gitignore.only("*.rb").ignore("/vendor/") - # @see .intersection - # @see #intersection def &(other) intersection(other) end - # @!group Querying methods - - # Check if a single path would be yielded by {#each} - # This will always be false if the path is a directory, or doesn't exist. - # If you want to match directories or hypothetical paths, use {#match?} - # @see #match? - # @param [String, Pathname, #to_s] path - # relative or absolute path to check - # @return [Boolean] - # @example - # PathList.include?("relative/path") - # PathList.include?("./relative/path") - # PathList.include?("/absolute/path") - # PathList.include?("~/user/path") - # PathList.include?(Pathname.new("/stdlib/pathname")) - # - # # because this is aliased as `===` - # # PathList can be used in case statements. - # case my_path - # when PathList.gitignore - # "would be matched by git ls-files" - # when PathList.only("*.rb") - # "would be matched by Dir.glob('**/*.rb')" - # end def include?(path) full_path = CanonicalPath.full_path(path) candidate = Candidate.new(full_path) @@ -372,37 +90,10 @@ def include?(path) alias_method :member?, :include? alias_method :===, :include? - # @return [Proc] - # {#include?} as a proc - # @see #include? - # @example - # ["my/path", "my/other/path"].select(&PathList.gitignore) def to_proc method(:include?).to_proc end - # Looser than {#include?}, it also returns true for directories that could - # theoretically contain files in the PathList, or even for paths that don't - # exist but could hypothetically match the PathList. - # @see #include? - # - # @param [String, Pathname, #to_s] path - # relative or absolute path to check - # @param [nil, true, false] directory - # override whether to match this file as a directory or not. - # When `nil`, will check the filesystem for what this path actually is, - # before defaulting to `false` if the path is inaccessible or nonexistent. - # @param [String, nil] content - # override the content of the file when checking shebang rules. - # When nil, will check the filesystem for the actual first line if necessary, - # defaulting to an empty string if the path is inaccessible or nonexistent. - # @return [Boolean] - # @example - # PathList.include?('my_directory/my_file') # given this returns true - # PathList.include?('my_directory') # returns false, as it's a directory, not a file that would be yielded by each. - # PathList.match?('my_directory') # returns true, because it *could contain* 'my_file' - # PathList.match?('my_directory/my_file', directory: true) # you can lie about whether a file is a directory - # PathList.match?('my_directory/my_file', content: '#!/bin/ruby') # you can also just lie about the content def match?(path, directory: nil, content: nil) full_path = CanonicalPath.full_path(path) content = content.slice(/\A#!.*$/) || '' if content @@ -412,28 +103,8 @@ def match?(path, directory: nil, content: nil) @matcher.match(candidate) == :allow end - # yields each of the filenames not ignored by the `PathList` in a non-specific order, recursively. - # - # This works like git ls-files, in that it only returns files, not directories, - # and it treats symlinks as regular files, even symlinks to directories. - # - # This `each` method allows all `Enumerable` methods to work, `#to_a` or `#filter_map` or etc. - # - # Will return an `Enumerator` when not given a block. - # - # @param [String, Pathname, #to_s] root (Dir.pwd) - # relative or absolute path to start from - # @yieldparam [String] path - # relative path from `root` - # @return [self, Enumerator] - # @example - # PathList.gitignore.each { |path| puts "#{path} is not ignored by git" } - # PathList.gitignore.each("./within/a/subdirectory") { |path| puts path } - # PathList.each("/") { |path| puts path } # traverse a whole filesystem? - # PathList.gitignore.each.with_object({}) { |path, hash| hash[path] = true } - # PathList.gitignore.each("./within/a/subdirectory").select { |path| ::File.symlink?(path) } - def each(root = '.', &block) - return enum_for(:each, root) unless block + def each(root: '.', &block) + return enum_for(:each, root: root) unless block root = CanonicalPath.full_path(root) root_candidate = Candidate.new(root) diff --git a/spec/path_list_spec.rb b/spec/path_list_spec.rb index dac45c1..8d61ba8 100644 --- a/spec/path_list_spec.rb +++ b/spec/path_list_spec.rb @@ -38,18 +38,18 @@ end it 'copes with being given fs root' do - whatever_file_we_get = subject.each('/').first + whatever_file_we_get = subject.each(root: '/').first expect(whatever_file_we_get).not_to start_with('/') # use symlink? because it could be a symlink to nowhere and File.exist? would return false expect { File.symlink?("/#{whatever_file_we_get}") || File.exist?("/#{whatever_file_we_get}") }.not_to raise_error end it 'copes with being given nonsense root' do - expect(subject.each('nonsense').to_a).to be_empty + expect(subject.each(root: 'nonsense').to_a).to be_empty end context 'when given root as a child dir' do - subject(:to_a) { described_class.new.each(Dir.pwd + '/bar').to_a } + subject(:to_a) { described_class.new.each(root: Dir.pwd + '/bar').to_a } it 'returns relative to the root' do create_file_list 'bar/foo', 'bar/baz', 'fez', 'baz/foo', 'baz/baz' @@ -66,7 +66,7 @@ gitignore 'baz' Dir.chdir('bar') do - expect(subject.each('../').to_a).to contain_exactly('bar/foo', 'fez', '.gitignore') + expect(subject.each(root: '../').to_a).to contain_exactly('bar/foo', 'fez', '.gitignore') end end end @@ -115,7 +115,7 @@ end context 'when given root with a trailing slash' do - subject(:to_a) { described_class.new.each(Dir.pwd + '/bar/').to_a } + subject(:to_a) { described_class.new.each(root: Dir.pwd + '/bar/').to_a } it 'returns relative to the root' do create_file_list 'bar/foo', 'bar/baz', 'fez', 'baz/foo', 'baz/bar' diff --git a/spec/spec_helper.rb b/spec/spec_helper.rb index 19dca2e..10ebaef 100644 --- a/spec/spec_helper.rb +++ b/spec/spec_helper.rb @@ -23,7 +23,7 @@ def warn(msg) # leftovers:allow require 'simplecov' if ENV['COVERAGE'] require_relative '../lib/path_list' -PathList.only('support/**/*.rb', root: __dir__).each(__dir__) do |file| +PathList.only('support/**/*.rb', root: __dir__).each(root: __dir__) do |file| require_relative file end