Skip to content

Commit

Permalink
Merge pull request #135 from Kobzol/cache-dir
Browse files Browse the repository at this point in the history
Cache information about file type
  • Loading branch information
the8472 authored Jan 2, 2024
2 parents 7b29204 + e1981f2 commit 4172399
Show file tree
Hide file tree
Showing 2 changed files with 98 additions and 19 deletions.
88 changes: 69 additions & 19 deletions src/lib.rs
Original file line number Diff line number Diff line change
Expand Up @@ -73,7 +73,9 @@ use std::cmp;
use std::error::Error;
use std::fmt;
use std::fs;
use std::fs::DirEntry;
use std::io;
use std::ops::Deref;
use std::path::{self, Component, Path, PathBuf};
use std::str::FromStr;

Expand All @@ -96,8 +98,8 @@ pub struct Paths {
dir_patterns: Vec<Pattern>,
require_dir: bool,
options: MatchOptions,
todo: Vec<Result<(PathBuf, usize), GlobError>>,
scope: Option<PathBuf>,
todo: Vec<Result<(PathWrapper, usize), GlobError>>,
scope: Option<PathWrapper>,
}

/// Return an iterator that produces all the `Path`s that match the given
Expand Down Expand Up @@ -242,6 +244,7 @@ pub fn glob_with(pattern: &str, options: MatchOptions) -> Result<Paths, PatternE
}

let scope = root.map_or_else(|| PathBuf::from("."), to_scope);
let scope = PathWrapper::from_path(scope);

let mut dir_patterns = Vec::new();
let components =
Expand Down Expand Up @@ -323,8 +326,52 @@ impl fmt::Display for GlobError {
}
}

fn is_dir(p: &Path) -> bool {
fs::metadata(p).map(|m| m.is_dir()).unwrap_or(false)
#[derive(Debug)]
struct PathWrapper {
path: PathBuf,
is_directory: bool,
}

impl PathWrapper {
fn from_dir_entry(path: PathBuf, e: DirEntry) -> Self {
let is_directory = e
.file_type()
.ok()
.and_then(|file_type| {
// We need to use fs::metadata to resolve the actual path
// if it's a symlink.
if file_type.is_symlink() {
None
} else {
Some(file_type.is_dir())
}
})
.or_else(|| fs::metadata(&path).map(|m| m.is_dir()).ok())
.unwrap_or(false);
Self { path, is_directory }
}
fn from_path(path: PathBuf) -> Self {
let is_directory = fs::metadata(&path).map(|m| m.is_dir()).unwrap_or(false);
Self { path, is_directory }
}

fn into_path(self) -> PathBuf {
self.path
}
}

impl Deref for PathWrapper {
type Target = Path;

fn deref(&self) -> &Self::Target {
self.path.deref()
}
}

impl AsRef<Path> for PathWrapper {
fn as_ref(&self) -> &Path {
self.path.as_ref()
}
}

/// An alias for a glob iteration result.
Expand Down Expand Up @@ -363,10 +410,10 @@ impl Iterator for Paths {
// idx -1: was already checked by fill_todo, maybe path was '.' or
// '..' that we can't match here because of normalization.
if idx == !0 as usize {
if self.require_dir && !is_dir(&path) {
if self.require_dir && !path.is_directory {
continue;
}
return Some(Ok(path));
return Some(Ok(path.into_path()));
}

if self.dir_patterns[idx].is_recursive {
Expand All @@ -379,7 +426,7 @@ impl Iterator for Paths {
next += 1;
}

if is_dir(&path) {
if path.is_directory {
// the path is a directory, so it's a match

// push this directory's contents
Expand All @@ -394,7 +441,7 @@ impl Iterator for Paths {
if next == self.dir_patterns.len() - 1 {
// pattern ends in recursive pattern, so return this
// directory as a result
return Some(Ok(path));
return Some(Ok(path.into_path()));
} else {
// advanced to the next pattern for this path
idx = next + 1;
Expand Down Expand Up @@ -427,8 +474,8 @@ impl Iterator for Paths {
// *AND* its children so we don't need to check the
// children

if !self.require_dir || is_dir(&path) {
return Some(Ok(path));
if !self.require_dir || path.is_directory {
return Some(Ok(path.into_path()));
}
} else {
fill_todo(
Expand Down Expand Up @@ -817,10 +864,10 @@ impl Pattern {
// special-casing patterns to match `.` and `..`, and avoiding `readdir()`
// calls when there are no metacharacters in the pattern.
fn fill_todo(
todo: &mut Vec<Result<(PathBuf, usize), GlobError>>,
todo: &mut Vec<Result<(PathWrapper, usize), GlobError>>,
patterns: &[Pattern],
idx: usize,
path: &Path,
path: &PathWrapper,
options: MatchOptions,
) {
// convert a pattern that's just many Char(_) to a string
Expand All @@ -836,7 +883,7 @@ fn fill_todo(
Some(s)
}

let add = |todo: &mut Vec<_>, next_path: PathBuf| {
let add = |todo: &mut Vec<_>, next_path: PathWrapper| {
if idx + 1 == patterns.len() {
// We know it's good, so don't make the iterator match this path
// against the pattern again. In particular, it can't match
Expand All @@ -848,8 +895,8 @@ fn fill_todo(
};

let pattern = &patterns[idx];
let is_dir = is_dir(path);
let curdir = path == Path::new(".");
let is_dir = path.is_directory;
let curdir = path.as_ref() == Path::new(".");
match pattern_as_str(pattern) {
Some(s) => {
// This pattern component doesn't have any metacharacters, so we
Expand All @@ -863,6 +910,7 @@ fn fill_todo(
} else {
path.join(&s)
};
let next_path = PathWrapper::from_path(next_path);
if (special && is_dir)
|| (!special
&& (fs::metadata(&next_path).is_ok()
Expand All @@ -875,19 +923,21 @@ fn fill_todo(
let dirs = fs::read_dir(path).and_then(|d| {
d.map(|e| {
e.map(|e| {
if curdir {
let path = if curdir {
PathBuf::from(e.path().file_name().unwrap())
} else {
e.path()
}
};
PathWrapper::from_dir_entry(path, e)
})
})
.collect::<Result<Vec<_>, _>>()
});
match dirs {
Ok(mut children) => {
if options.require_literal_leading_dot {
children.retain(|x| !x.file_name().unwrap().to_str().unwrap().starts_with("."));
children
.retain(|x| !x.file_name().unwrap().to_str().unwrap().starts_with("."));
}
children.sort_by(|p1, p2| p2.file_name().cmp(&p1.file_name()));
todo.extend(children.into_iter().map(|x| Ok((x, idx))));
Expand All @@ -900,7 +950,7 @@ fn fill_todo(
if !pattern.tokens.is_empty() && pattern.tokens[0] == Char('.') {
for &special in &[".", ".."] {
if pattern.matches_with(special, options) {
add(todo, path.join(special));
add(todo, PathWrapper::from_path(path.join(special)));
}
}
}
Expand Down
29 changes: 29 additions & 0 deletions tests/glob-std.rs
Original file line number Diff line number Diff line change
Expand Up @@ -44,6 +44,19 @@ fn main() {
}
}

fn mk_symlink_dir(original: &str, link: &str) {
#[cfg(unix)]
{
use std::os::unix::fs::symlink;
symlink(original, link).unwrap();
}
#[cfg(windows)]
{
use std::os::windows::fs::symlink_dir;
symlink_dir(original, link).unwrap();
}
}

fn glob_vec(pattern: &str) -> Vec<PathBuf> {
glob(pattern).unwrap().map(|r| r.unwrap()).collect()
}
Expand Down Expand Up @@ -99,6 +112,22 @@ fn main() {
mk_file("r/three", true);
mk_file("r/three/c.md", false);

mk_file("dirsym", true);
mk_symlink_dir(root.path().join("r").to_str().unwrap(), "dirsym/link");

assert_eq!(
glob_vec("dirsym/**/*.md"),
vec!(
PathBuf::from("dirsym/link/another/a.md"),
PathBuf::from("dirsym/link/current_dir.md"),
PathBuf::from("dirsym/link/one/a.md"),
PathBuf::from("dirsym/link/one/another/a.md"),
PathBuf::from("dirsym/link/one/another/deep/spelunking.md"),
PathBuf::from("dirsym/link/three/c.md"),
PathBuf::from("dirsym/link/two/b.md")
)
);

// all recursive entities
assert_eq!(
glob_vec("r/**"),
Expand Down

0 comments on commit 4172399

Please sign in to comment.