| 1 | /*! | 
| 2 | Crate `walkdir` provides an efficient and cross platform implementation | 
|---|
| 3 | of recursive directory traversal. Several options are exposed to control | 
|---|
| 4 | iteration, such as whether to follow symbolic links (default off), limit the | 
|---|
| 5 | maximum number of simultaneous open file descriptors and the ability to | 
|---|
| 6 | efficiently skip descending into directories. | 
|---|
| 7 |  | 
|---|
| 8 | To use this crate, add `walkdir` as a dependency to your project's | 
|---|
| 9 | `Cargo.toml`: | 
|---|
| 10 |  | 
|---|
| 11 | ```toml | 
|---|
| 12 | [dependencies] | 
|---|
| 13 | walkdir = "2" | 
|---|
| 14 | ``` | 
|---|
| 15 |  | 
|---|
| 16 | # From the top | 
|---|
| 17 |  | 
|---|
| 18 | The [`WalkDir`] type builds iterators. The [`DirEntry`] type describes values | 
|---|
| 19 | yielded by the iterator. Finally, the [`Error`] type is a small wrapper around | 
|---|
| 20 | [`std::io::Error`] with additional information, such as if a loop was detected | 
|---|
| 21 | while following symbolic links (not enabled by default). | 
|---|
| 22 |  | 
|---|
| 23 | [`WalkDir`]: struct.WalkDir.html | 
|---|
| 24 | [`DirEntry`]: struct.DirEntry.html | 
|---|
| 25 | [`Error`]: struct.Error.html | 
|---|
| 26 | [`std::io::Error`]: https://doc.rust-lang.org/stable/std/io/struct.Error.html | 
|---|
| 27 |  | 
|---|
| 28 | # Example | 
|---|
| 29 |  | 
|---|
| 30 | The following code recursively iterates over the directory given and prints | 
|---|
| 31 | the path for each entry: | 
|---|
| 32 |  | 
|---|
| 33 | ```no_run | 
|---|
| 34 | use walkdir::WalkDir; | 
|---|
| 35 | # use walkdir::Error; | 
|---|
| 36 |  | 
|---|
| 37 | # fn try_main() -> Result<(), Error> { | 
|---|
| 38 | for entry in WalkDir::new( "foo") { | 
|---|
| 39 | println!( "{}", entry?.path().display()); | 
|---|
| 40 | } | 
|---|
| 41 | # Ok(()) | 
|---|
| 42 | # } | 
|---|
| 43 | ``` | 
|---|
| 44 |  | 
|---|
| 45 | Or, if you'd like to iterate over all entries and ignore any errors that | 
|---|
| 46 | may arise, use [`filter_map`]. (e.g., This code below will silently skip | 
|---|
| 47 | directories that the owner of the running process does not have permission to | 
|---|
| 48 | access.) | 
|---|
| 49 |  | 
|---|
| 50 | ```no_run | 
|---|
| 51 | use walkdir::WalkDir; | 
|---|
| 52 |  | 
|---|
| 53 | for entry in WalkDir::new( "foo").into_iter().filter_map(|e| e.ok()) { | 
|---|
| 54 | println!( "{}", entry.path().display()); | 
|---|
| 55 | } | 
|---|
| 56 | ``` | 
|---|
| 57 |  | 
|---|
| 58 | [`filter_map`]: https://doc.rust-lang.org/stable/std/iter/trait.Iterator.html#method.filter_map | 
|---|
| 59 |  | 
|---|
| 60 | # Example: follow symbolic links | 
|---|
| 61 |  | 
|---|
| 62 | The same code as above, except [`follow_links`] is enabled: | 
|---|
| 63 |  | 
|---|
| 64 | ```no_run | 
|---|
| 65 | use walkdir::WalkDir; | 
|---|
| 66 | # use walkdir::Error; | 
|---|
| 67 |  | 
|---|
| 68 | # fn try_main() -> Result<(), Error> { | 
|---|
| 69 | for entry in WalkDir::new( "foo").follow_links(true) { | 
|---|
| 70 | println!( "{}", entry?.path().display()); | 
|---|
| 71 | } | 
|---|
| 72 | # Ok(()) | 
|---|
| 73 | # } | 
|---|
| 74 | ``` | 
|---|
| 75 |  | 
|---|
| 76 | [`follow_links`]: struct.WalkDir.html#method.follow_links | 
|---|
| 77 |  | 
|---|
| 78 | # Example: skip hidden files and directories on unix | 
|---|
| 79 |  | 
|---|
| 80 | This uses the [`filter_entry`] iterator adapter to avoid yielding hidden files | 
|---|
| 81 | and directories efficiently (i.e. without recursing into hidden directories): | 
|---|
| 82 |  | 
|---|
| 83 | ```no_run | 
|---|
| 84 | use walkdir::{DirEntry, WalkDir}; | 
|---|
| 85 | # use walkdir::Error; | 
|---|
| 86 |  | 
|---|
| 87 | fn is_hidden(entry: &DirEntry) -> bool { | 
|---|
| 88 | entry.file_name() | 
|---|
| 89 | .to_str() | 
|---|
| 90 | .map(|s| s.starts_with( ".")) | 
|---|
| 91 | .unwrap_or(false) | 
|---|
| 92 | } | 
|---|
| 93 |  | 
|---|
| 94 | # fn try_main() -> Result<(), Error> { | 
|---|
| 95 | let walker = WalkDir::new( "foo").into_iter(); | 
|---|
| 96 | for entry in walker.filter_entry(|e| !is_hidden(e)) { | 
|---|
| 97 | println!( "{}", entry?.path().display()); | 
|---|
| 98 | } | 
|---|
| 99 | # Ok(()) | 
|---|
| 100 | # } | 
|---|
| 101 | ``` | 
|---|
| 102 |  | 
|---|
| 103 | [`filter_entry`]: struct.IntoIter.html#method.filter_entry | 
|---|
| 104 | */ | 
|---|
| 105 |  | 
|---|
| 106 | #![ deny(missing_docs)] | 
|---|
| 107 | #![ allow(unknown_lints)] | 
|---|
| 108 |  | 
|---|
| 109 | #[ cfg(doctest)] | 
|---|
| 110 | doc_comment::doctest!( "../README.md"); | 
|---|
| 111 |  | 
|---|
| 112 | use std::cmp::{min, Ordering}; | 
|---|
| 113 | use std::fmt; | 
|---|
| 114 | use std::fs::{self, ReadDir}; | 
|---|
| 115 | use std::io; | 
|---|
| 116 | use std::iter; | 
|---|
| 117 | use std::path::{Path, PathBuf}; | 
|---|
| 118 | use std::result; | 
|---|
| 119 | use std::vec; | 
|---|
| 120 |  | 
|---|
| 121 | use same_file::Handle; | 
|---|
| 122 |  | 
|---|
| 123 | pub use crate::dent::DirEntry; | 
|---|
| 124 | #[ cfg(unix)] | 
|---|
| 125 | pub use crate::dent::DirEntryExt; | 
|---|
| 126 | pub use crate::error::Error; | 
|---|
| 127 |  | 
|---|
| 128 | mod dent; | 
|---|
| 129 | mod error; | 
|---|
| 130 | #[ cfg(test)] | 
|---|
| 131 | mod tests; | 
|---|
| 132 | mod util; | 
|---|
| 133 |  | 
|---|
| 134 | /// Like try, but for iterators that return [`Option<Result<_, _>>`]. | 
|---|
| 135 | /// | 
|---|
| 136 | /// [`Option<Result<_, _>>`]: https://doc.rust-lang.org/stable/std/option/enum.Option.html | 
|---|
| 137 | macro_rules! itry { | 
|---|
| 138 | ($e:expr) => { | 
|---|
| 139 | match $e { | 
|---|
| 140 | Ok(v) => v, | 
|---|
| 141 | Err(err) => return Some(Err(From::from(err))), | 
|---|
| 142 | } | 
|---|
| 143 | }; | 
|---|
| 144 | } | 
|---|
| 145 |  | 
|---|
| 146 | /// A result type for walkdir operations. | 
|---|
| 147 | /// | 
|---|
| 148 | /// Note that this result type embeds the error type in this crate. This | 
|---|
| 149 | /// is only useful if you care about the additional information provided by | 
|---|
| 150 | /// the error (such as the path associated with the error or whether a loop | 
|---|
| 151 | /// was dectected). If you want things to Just Work, then you can use | 
|---|
| 152 | /// [`io::Result`] instead since the error type in this package will | 
|---|
| 153 | /// automatically convert to an [`io::Result`] when using the [`try!`] macro. | 
|---|
| 154 | /// | 
|---|
| 155 | /// [`io::Result`]: https://doc.rust-lang.org/stable/std/io/type.Result.html | 
|---|
| 156 | /// [`try!`]: https://doc.rust-lang.org/stable/std/macro.try.html | 
|---|
| 157 | pub type Result<T> = ::std::result::Result<T, Error>; | 
|---|
| 158 |  | 
|---|
| 159 | /// A builder to create an iterator for recursively walking a directory. | 
|---|
| 160 | /// | 
|---|
| 161 | /// Results are returned in depth first fashion, with directories yielded | 
|---|
| 162 | /// before their contents. If [`contents_first`] is true, contents are yielded | 
|---|
| 163 | /// before their directories. The order is unspecified but if [`sort_by`] is | 
|---|
| 164 | /// given, directory entries are sorted according to this function. Directory | 
|---|
| 165 | /// entries `.` and `..` are always omitted. | 
|---|
| 166 | /// | 
|---|
| 167 | /// If an error occurs at any point during iteration, then it is returned in | 
|---|
| 168 | /// place of its corresponding directory entry and iteration continues as | 
|---|
| 169 | /// normal. If an error occurs while opening a directory for reading, then it | 
|---|
| 170 | /// is not descended into (but the error is still yielded by the iterator). | 
|---|
| 171 | /// Iteration may be stopped at any time. When the iterator is destroyed, all | 
|---|
| 172 | /// resources associated with it are freed. | 
|---|
| 173 | /// | 
|---|
| 174 | /// [`contents_first`]: struct.WalkDir.html#method.contents_first | 
|---|
| 175 | /// [`sort_by`]: struct.WalkDir.html#method.sort_by | 
|---|
| 176 | /// | 
|---|
| 177 | /// # Usage | 
|---|
| 178 | /// | 
|---|
| 179 | /// This type implements [`IntoIterator`] so that it may be used as the subject | 
|---|
| 180 | /// of a `for` loop. You may need to call [`into_iter`] explicitly if you want | 
|---|
| 181 | /// to use iterator adapters such as [`filter_entry`]. | 
|---|
| 182 | /// | 
|---|
| 183 | /// Idiomatic use of this type should use method chaining to set desired | 
|---|
| 184 | /// options. For example, this only shows entries with a depth of `1`, `2` or | 
|---|
| 185 | /// `3` (relative to `foo`): | 
|---|
| 186 | /// | 
|---|
| 187 | /// ```no_run | 
|---|
| 188 | /// use walkdir::WalkDir; | 
|---|
| 189 | /// # use walkdir::Error; | 
|---|
| 190 | /// | 
|---|
| 191 | /// # fn try_main() -> Result<(), Error> { | 
|---|
| 192 | /// for entry in WalkDir::new( "foo").min_depth(1).max_depth(3) { | 
|---|
| 193 | ///     println!( "{}", entry?.path().display()); | 
|---|
| 194 | /// } | 
|---|
| 195 | /// # Ok(()) | 
|---|
| 196 | /// # } | 
|---|
| 197 | /// ``` | 
|---|
| 198 | /// | 
|---|
| 199 | /// [`IntoIterator`]: https://doc.rust-lang.org/stable/std/iter/trait.IntoIterator.html | 
|---|
| 200 | /// [`into_iter`]: https://doc.rust-lang.org/nightly/core/iter/trait.IntoIterator.html#tymethod.into_iter | 
|---|
| 201 | /// [`filter_entry`]: struct.IntoIter.html#method.filter_entry | 
|---|
| 202 | /// | 
|---|
| 203 | /// Note that the iterator by default includes the top-most directory. Since | 
|---|
| 204 | /// this is the only directory yielded with depth `0`, it is easy to ignore it | 
|---|
| 205 | /// with the [`min_depth`] setting: | 
|---|
| 206 | /// | 
|---|
| 207 | /// ```no_run | 
|---|
| 208 | /// use walkdir::WalkDir; | 
|---|
| 209 | /// # use walkdir::Error; | 
|---|
| 210 | /// | 
|---|
| 211 | /// # fn try_main() -> Result<(), Error> { | 
|---|
| 212 | /// for entry in WalkDir::new( "foo").min_depth(1) { | 
|---|
| 213 | ///     println!( "{}", entry?.path().display()); | 
|---|
| 214 | /// } | 
|---|
| 215 | /// # Ok(()) | 
|---|
| 216 | /// # } | 
|---|
| 217 | /// ``` | 
|---|
| 218 | /// | 
|---|
| 219 | /// [`min_depth`]: struct.WalkDir.html#method.min_depth | 
|---|
| 220 | /// | 
|---|
| 221 | /// This will only return descendents of the `foo` directory and not `foo` | 
|---|
| 222 | /// itself. | 
|---|
| 223 | /// | 
|---|
| 224 | /// # Loops | 
|---|
| 225 | /// | 
|---|
| 226 | /// This iterator (like most/all recursive directory iterators) assumes that | 
|---|
| 227 | /// no loops can be made with *hard* links on your file system. In particular, | 
|---|
| 228 | /// this would require creating a hard link to a directory such that it creates | 
|---|
| 229 | /// a loop. On most platforms, this operation is illegal. | 
|---|
| 230 | /// | 
|---|
| 231 | /// Note that when following symbolic/soft links, loops are detected and an | 
|---|
| 232 | /// error is reported. | 
|---|
| 233 | #[ derive(Debug)] | 
|---|
| 234 | pub struct WalkDir { | 
|---|
| 235 | opts: WalkDirOptions, | 
|---|
| 236 | root: PathBuf, | 
|---|
| 237 | } | 
|---|
| 238 |  | 
|---|
| 239 | struct WalkDirOptions { | 
|---|
| 240 | follow_links: bool, | 
|---|
| 241 | follow_root_links: bool, | 
|---|
| 242 | max_open: usize, | 
|---|
| 243 | min_depth: usize, | 
|---|
| 244 | max_depth: usize, | 
|---|
| 245 | sorter: Option< | 
|---|
| 246 | Box< | 
|---|
| 247 | dyn FnMut(&DirEntry, &DirEntry) -> Ordering | 
|---|
| 248 | + Send | 
|---|
| 249 | + Sync | 
|---|
| 250 | + 'static, | 
|---|
| 251 | >, | 
|---|
| 252 | >, | 
|---|
| 253 | contents_first: bool, | 
|---|
| 254 | same_file_system: bool, | 
|---|
| 255 | } | 
|---|
| 256 |  | 
|---|
| 257 | impl fmt::Debug for WalkDirOptions { | 
|---|
| 258 | fn fmt( | 
|---|
| 259 | &self, | 
|---|
| 260 | f: &mut fmt::Formatter<'_>, | 
|---|
| 261 | ) -> result::Result<(), fmt::Error> { | 
|---|
| 262 | let sorter_str: &'static str = if self.sorter.is_some() { | 
|---|
| 263 | // FnMut isn't `Debug` | 
|---|
| 264 | "Some(...)" | 
|---|
| 265 | } else { | 
|---|
| 266 | "None" | 
|---|
| 267 | }; | 
|---|
| 268 | f&mut DebugStruct<'_, '_>.debug_struct( "WalkDirOptions") | 
|---|
| 269 | .field( "follow_links", &self.follow_links) | 
|---|
| 270 | .field( "follow_root_link", &self.follow_root_links) | 
|---|
| 271 | .field( "max_open", &self.max_open) | 
|---|
| 272 | .field( "min_depth", &self.min_depth) | 
|---|
| 273 | .field( "max_depth", &self.max_depth) | 
|---|
| 274 | .field( "sorter", &sorter_str) | 
|---|
| 275 | .field( "contents_first", &self.contents_first) | 
|---|
| 276 | .field(name: "same_file_system", &self.same_file_system) | 
|---|
| 277 | .finish() | 
|---|
| 278 | } | 
|---|
| 279 | } | 
|---|
| 280 |  | 
|---|
| 281 | impl WalkDir { | 
|---|
| 282 | /// Create a builder for a recursive directory iterator starting at the | 
|---|
| 283 | /// file path `root`. If `root` is a directory, then it is the first item | 
|---|
| 284 | /// yielded by the iterator. If `root` is a file, then it is the first | 
|---|
| 285 | /// and only item yielded by the iterator. If `root` is a symlink, then it | 
|---|
| 286 | /// is always followed for the purposes of directory traversal. (A root | 
|---|
| 287 | /// `DirEntry` still obeys its documentation with respect to symlinks and | 
|---|
| 288 | /// the `follow_links` setting.) | 
|---|
| 289 | pub fn new<P: AsRef<Path>>(root: P) -> Self { | 
|---|
| 290 | WalkDir { | 
|---|
| 291 | opts: WalkDirOptions { | 
|---|
| 292 | follow_links: false, | 
|---|
| 293 | follow_root_links: true, | 
|---|
| 294 | max_open: 10, | 
|---|
| 295 | min_depth: 0, | 
|---|
| 296 | max_depth: ::std::usize::MAX, | 
|---|
| 297 | sorter: None, | 
|---|
| 298 | contents_first: false, | 
|---|
| 299 | same_file_system: false, | 
|---|
| 300 | }, | 
|---|
| 301 | root: root.as_ref().to_path_buf(), | 
|---|
| 302 | } | 
|---|
| 303 | } | 
|---|
| 304 |  | 
|---|
| 305 | /// Set the minimum depth of entries yielded by the iterator. | 
|---|
| 306 | /// | 
|---|
| 307 | /// The smallest depth is `0` and always corresponds to the path given | 
|---|
| 308 | /// to the `new` function on this type. Its direct descendents have depth | 
|---|
| 309 | /// `1`, and their descendents have depth `2`, and so on. | 
|---|
| 310 | pub fn min_depth(mut self, depth: usize) -> Self { | 
|---|
| 311 | self.opts.min_depth = depth; | 
|---|
| 312 | if self.opts.min_depth > self.opts.max_depth { | 
|---|
| 313 | self.opts.min_depth = self.opts.max_depth; | 
|---|
| 314 | } | 
|---|
| 315 | self | 
|---|
| 316 | } | 
|---|
| 317 |  | 
|---|
| 318 | /// Set the maximum depth of entries yield by the iterator. | 
|---|
| 319 | /// | 
|---|
| 320 | /// The smallest depth is `0` and always corresponds to the path given | 
|---|
| 321 | /// to the `new` function on this type. Its direct descendents have depth | 
|---|
| 322 | /// `1`, and their descendents have depth `2`, and so on. | 
|---|
| 323 | /// | 
|---|
| 324 | /// Note that this will not simply filter the entries of the iterator, but | 
|---|
| 325 | /// it will actually avoid descending into directories when the depth is | 
|---|
| 326 | /// exceeded. | 
|---|
| 327 | pub fn max_depth(mut self, depth: usize) -> Self { | 
|---|
| 328 | self.opts.max_depth = depth; | 
|---|
| 329 | if self.opts.max_depth < self.opts.min_depth { | 
|---|
| 330 | self.opts.max_depth = self.opts.min_depth; | 
|---|
| 331 | } | 
|---|
| 332 | self | 
|---|
| 333 | } | 
|---|
| 334 |  | 
|---|
| 335 | /// Follow symbolic links. By default, this is disabled. | 
|---|
| 336 | /// | 
|---|
| 337 | /// When `yes` is `true`, symbolic links are followed as if they were | 
|---|
| 338 | /// normal directories and files. If a symbolic link is broken or is | 
|---|
| 339 | /// involved in a loop, an error is yielded. | 
|---|
| 340 | /// | 
|---|
| 341 | /// When enabled, the yielded [`DirEntry`] values represent the target of | 
|---|
| 342 | /// the link while the path corresponds to the link. See the [`DirEntry`] | 
|---|
| 343 | /// type for more details. | 
|---|
| 344 | /// | 
|---|
| 345 | /// [`DirEntry`]: struct.DirEntry.html | 
|---|
| 346 | pub fn follow_links(mut self, yes: bool) -> Self { | 
|---|
| 347 | self.opts.follow_links = yes; | 
|---|
| 348 | self | 
|---|
| 349 | } | 
|---|
| 350 |  | 
|---|
| 351 | /// Follow symbolic links if these are the root of the traversal. | 
|---|
| 352 | /// By default, this is enabled. | 
|---|
| 353 | /// | 
|---|
| 354 | /// When `yes` is `true`, symbolic links on root paths are followed | 
|---|
| 355 | /// which is effective if the symbolic link points to a directory. | 
|---|
| 356 | /// If a symbolic link is broken or is involved in a loop, an error is yielded | 
|---|
| 357 | /// as the first entry of the traversal. | 
|---|
| 358 | /// | 
|---|
| 359 | /// When enabled, the yielded [`DirEntry`] values represent the target of | 
|---|
| 360 | /// the link while the path corresponds to the link. See the [`DirEntry`] | 
|---|
| 361 | /// type for more details, and all future entries will be contained within | 
|---|
| 362 | /// the resolved directory behind the symbolic link of the root path. | 
|---|
| 363 | /// | 
|---|
| 364 | /// [`DirEntry`]: struct.DirEntry.html | 
|---|
| 365 | pub fn follow_root_links(mut self, yes: bool) -> Self { | 
|---|
| 366 | self.opts.follow_root_links = yes; | 
|---|
| 367 | self | 
|---|
| 368 | } | 
|---|
| 369 |  | 
|---|
| 370 | /// Set the maximum number of simultaneously open file descriptors used | 
|---|
| 371 | /// by the iterator. | 
|---|
| 372 | /// | 
|---|
| 373 | /// `n` must be greater than or equal to `1`. If `n` is `0`, then it is set | 
|---|
| 374 | /// to `1` automatically. If this is not set, then it defaults to some | 
|---|
| 375 | /// reasonably low number. | 
|---|
| 376 | /// | 
|---|
| 377 | /// This setting has no impact on the results yielded by the iterator | 
|---|
| 378 | /// (even when `n` is `1`). Instead, this setting represents a trade off | 
|---|
| 379 | /// between scarce resources (file descriptors) and memory. Namely, when | 
|---|
| 380 | /// the maximum number of file descriptors is reached and a new directory | 
|---|
| 381 | /// needs to be opened to continue iteration, then a previous directory | 
|---|
| 382 | /// handle is closed and has its unyielded entries stored in memory. In | 
|---|
| 383 | /// practice, this is a satisfying trade off because it scales with respect | 
|---|
| 384 | /// to the *depth* of your file tree. Therefore, low values (even `1`) are | 
|---|
| 385 | /// acceptable. | 
|---|
| 386 | /// | 
|---|
| 387 | /// Note that this value does not impact the number of system calls made by | 
|---|
| 388 | /// an exhausted iterator. | 
|---|
| 389 | /// | 
|---|
| 390 | /// # Platform behavior | 
|---|
| 391 | /// | 
|---|
| 392 | /// On Windows, if `follow_links` is enabled, then this limit is not | 
|---|
| 393 | /// respected. In particular, the maximum number of file descriptors opened | 
|---|
| 394 | /// is proportional to the depth of the directory tree traversed. | 
|---|
| 395 | pub fn max_open(mut self, mut n: usize) -> Self { | 
|---|
| 396 | if n == 0 { | 
|---|
| 397 | n = 1; | 
|---|
| 398 | } | 
|---|
| 399 | self.opts.max_open = n; | 
|---|
| 400 | self | 
|---|
| 401 | } | 
|---|
| 402 |  | 
|---|
| 403 | /// Set a function for sorting directory entries with a comparator | 
|---|
| 404 | /// function. | 
|---|
| 405 | /// | 
|---|
| 406 | /// If a compare function is set, the resulting iterator will return all | 
|---|
| 407 | /// paths in sorted order. The compare function will be called to compare | 
|---|
| 408 | /// entries from the same directory. | 
|---|
| 409 | /// | 
|---|
| 410 | /// ```rust,no_run | 
|---|
| 411 | /// use std::cmp; | 
|---|
| 412 | /// use std::ffi::OsString; | 
|---|
| 413 | /// use walkdir::WalkDir; | 
|---|
| 414 | /// | 
|---|
| 415 | /// WalkDir::new( "foo").sort_by(|a,b| a.file_name().cmp(b.file_name())); | 
|---|
| 416 | /// ``` | 
|---|
| 417 | pub fn sort_by<F>(mut self, cmp: F) -> Self | 
|---|
| 418 | where | 
|---|
| 419 | F: FnMut(&DirEntry, &DirEntry) -> Ordering + Send + Sync + 'static, | 
|---|
| 420 | { | 
|---|
| 421 | self.opts.sorter = Some(Box::new(cmp)); | 
|---|
| 422 | self | 
|---|
| 423 | } | 
|---|
| 424 |  | 
|---|
| 425 | /// Set a function for sorting directory entries with a key extraction | 
|---|
| 426 | /// function. | 
|---|
| 427 | /// | 
|---|
| 428 | /// If a compare function is set, the resulting iterator will return all | 
|---|
| 429 | /// paths in sorted order. The compare function will be called to compare | 
|---|
| 430 | /// entries from the same directory. | 
|---|
| 431 | /// | 
|---|
| 432 | /// ```rust,no_run | 
|---|
| 433 | /// use std::cmp; | 
|---|
| 434 | /// use std::ffi::OsString; | 
|---|
| 435 | /// use walkdir::WalkDir; | 
|---|
| 436 | /// | 
|---|
| 437 | /// WalkDir::new( "foo").sort_by_key(|a| a.file_name().to_owned()); | 
|---|
| 438 | /// ``` | 
|---|
| 439 | pub fn sort_by_key<K, F>(self, mut cmp: F) -> Self | 
|---|
| 440 | where | 
|---|
| 441 | F: FnMut(&DirEntry) -> K + Send + Sync + 'static, | 
|---|
| 442 | K: Ord, | 
|---|
| 443 | { | 
|---|
| 444 | self.sort_by(move |a, b| cmp(a).cmp(&cmp(b))) | 
|---|
| 445 | } | 
|---|
| 446 |  | 
|---|
| 447 | /// Sort directory entries by file name, to ensure a deterministic order. | 
|---|
| 448 | /// | 
|---|
| 449 | /// This is a convenience function for calling `Self::sort_by()`. | 
|---|
| 450 | /// | 
|---|
| 451 | /// ```rust,no_run | 
|---|
| 452 | /// use walkdir::WalkDir; | 
|---|
| 453 | /// | 
|---|
| 454 | /// WalkDir::new( "foo").sort_by_file_name(); | 
|---|
| 455 | /// ``` | 
|---|
| 456 | pub fn sort_by_file_name(self) -> Self { | 
|---|
| 457 | self.sort_by(|a, b| a.file_name().cmp(b.file_name())) | 
|---|
| 458 | } | 
|---|
| 459 |  | 
|---|
| 460 | /// Yield a directory's contents before the directory itself. By default, | 
|---|
| 461 | /// this is disabled. | 
|---|
| 462 | /// | 
|---|
| 463 | /// When `yes` is `false` (as is the default), the directory is yielded | 
|---|
| 464 | /// before its contents are read. This is useful when, e.g. you want to | 
|---|
| 465 | /// skip processing of some directories. | 
|---|
| 466 | /// | 
|---|
| 467 | /// When `yes` is `true`, the iterator yields the contents of a directory | 
|---|
| 468 | /// before yielding the directory itself. This is useful when, e.g. you | 
|---|
| 469 | /// want to recursively delete a directory. | 
|---|
| 470 | /// | 
|---|
| 471 | /// # Example | 
|---|
| 472 | /// | 
|---|
| 473 | /// Assume the following directory tree: | 
|---|
| 474 | /// | 
|---|
| 475 | /// ```text | 
|---|
| 476 | /// foo/ | 
|---|
| 477 | ///   abc/ | 
|---|
| 478 | ///     qrs | 
|---|
| 479 | ///     tuv | 
|---|
| 480 | ///   def/ | 
|---|
| 481 | /// ``` | 
|---|
| 482 | /// | 
|---|
| 483 | /// With contents_first disabled (the default), the following code visits | 
|---|
| 484 | /// the directory tree in depth-first order: | 
|---|
| 485 | /// | 
|---|
| 486 | /// ```no_run | 
|---|
| 487 | /// use walkdir::WalkDir; | 
|---|
| 488 | /// | 
|---|
| 489 | /// for entry in WalkDir::new( "foo") { | 
|---|
| 490 | ///     let entry = entry.unwrap(); | 
|---|
| 491 | ///     println!( "{}", entry.path().display()); | 
|---|
| 492 | /// } | 
|---|
| 493 | /// | 
|---|
| 494 | /// // foo | 
|---|
| 495 | /// // foo/abc | 
|---|
| 496 | /// // foo/abc/qrs | 
|---|
| 497 | /// // foo/abc/tuv | 
|---|
| 498 | /// // foo/def | 
|---|
| 499 | /// ``` | 
|---|
| 500 | /// | 
|---|
| 501 | /// With contents_first enabled: | 
|---|
| 502 | /// | 
|---|
| 503 | /// ```no_run | 
|---|
| 504 | /// use walkdir::WalkDir; | 
|---|
| 505 | /// | 
|---|
| 506 | /// for entry in WalkDir::new( "foo").contents_first(true) { | 
|---|
| 507 | ///     let entry = entry.unwrap(); | 
|---|
| 508 | ///     println!( "{}", entry.path().display()); | 
|---|
| 509 | /// } | 
|---|
| 510 | /// | 
|---|
| 511 | /// // foo/abc/qrs | 
|---|
| 512 | /// // foo/abc/tuv | 
|---|
| 513 | /// // foo/abc | 
|---|
| 514 | /// // foo/def | 
|---|
| 515 | /// // foo | 
|---|
| 516 | /// ``` | 
|---|
| 517 | pub fn contents_first(mut self, yes: bool) -> Self { | 
|---|
| 518 | self.opts.contents_first = yes; | 
|---|
| 519 | self | 
|---|
| 520 | } | 
|---|
| 521 |  | 
|---|
| 522 | /// Do not cross file system boundaries. | 
|---|
| 523 | /// | 
|---|
| 524 | /// When this option is enabled, directory traversal will not descend into | 
|---|
| 525 | /// directories that are on a different file system from the root path. | 
|---|
| 526 | /// | 
|---|
| 527 | /// Currently, this option is only supported on Unix and Windows. If this | 
|---|
| 528 | /// option is used on an unsupported platform, then directory traversal | 
|---|
| 529 | /// will immediately return an error and will not yield any entries. | 
|---|
| 530 | pub fn same_file_system(mut self, yes: bool) -> Self { | 
|---|
| 531 | self.opts.same_file_system = yes; | 
|---|
| 532 | self | 
|---|
| 533 | } | 
|---|
| 534 | } | 
|---|
| 535 |  | 
|---|
| 536 | impl IntoIterator for WalkDir { | 
|---|
| 537 | type Item = Result<DirEntry>; | 
|---|
| 538 | type IntoIter = IntoIter; | 
|---|
| 539 |  | 
|---|
| 540 | fn into_iter(self) -> IntoIter { | 
|---|
| 541 | IntoIter { | 
|---|
| 542 | opts: self.opts, | 
|---|
| 543 | start: Some(self.root), | 
|---|
| 544 | stack_list: vec![], | 
|---|
| 545 | stack_path: vec![], | 
|---|
| 546 | oldest_opened: 0, | 
|---|
| 547 | depth: 0, | 
|---|
| 548 | deferred_dirs: vec![], | 
|---|
| 549 | root_device: None, | 
|---|
| 550 | } | 
|---|
| 551 | } | 
|---|
| 552 | } | 
|---|
| 553 |  | 
|---|
| 554 | /// An iterator for recursively descending into a directory. | 
|---|
| 555 | /// | 
|---|
| 556 | /// A value with this type must be constructed with the [`WalkDir`] type, which | 
|---|
| 557 | /// uses a builder pattern to set options such as min/max depth, max open file | 
|---|
| 558 | /// descriptors and whether the iterator should follow symbolic links. After | 
|---|
| 559 | /// constructing a `WalkDir`, call [`.into_iter()`] at the end of the chain. | 
|---|
| 560 | /// | 
|---|
| 561 | /// The order of elements yielded by this iterator is unspecified. | 
|---|
| 562 | /// | 
|---|
| 563 | /// [`WalkDir`]: struct.WalkDir.html | 
|---|
| 564 | /// [`.into_iter()`]: struct.WalkDir.html#into_iter.v | 
|---|
| 565 | #[ derive(Debug)] | 
|---|
| 566 | pub struct IntoIter { | 
|---|
| 567 | /// Options specified in the builder. Depths, max fds, etc. | 
|---|
| 568 | opts: WalkDirOptions, | 
|---|
| 569 | /// The start path. | 
|---|
| 570 | /// | 
|---|
| 571 | /// This is only `Some(...)` at the beginning. After the first iteration, | 
|---|
| 572 | /// this is always `None`. | 
|---|
| 573 | start: Option<PathBuf>, | 
|---|
| 574 | /// A stack of open (up to max fd) or closed handles to directories. | 
|---|
| 575 | /// An open handle is a plain [`fs::ReadDir`] while a closed handle is | 
|---|
| 576 | /// a `Vec<fs::DirEntry>` corresponding to the as-of-yet consumed entries. | 
|---|
| 577 | /// | 
|---|
| 578 | /// [`fs::ReadDir`]: https://doc.rust-lang.org/stable/std/fs/struct.ReadDir.html | 
|---|
| 579 | stack_list: Vec<DirList>, | 
|---|
| 580 | /// A stack of file paths. | 
|---|
| 581 | /// | 
|---|
| 582 | /// This is *only* used when [`follow_links`] is enabled. In all other | 
|---|
| 583 | /// cases this stack is empty. | 
|---|
| 584 | /// | 
|---|
| 585 | /// [`follow_links`]: struct.WalkDir.html#method.follow_links | 
|---|
| 586 | stack_path: Vec<Ancestor>, | 
|---|
| 587 | /// An index into `stack_list` that points to the oldest open directory | 
|---|
| 588 | /// handle. If the maximum fd limit is reached and a new directory needs to | 
|---|
| 589 | /// be read, the handle at this index is closed before the new directory is | 
|---|
| 590 | /// opened. | 
|---|
| 591 | oldest_opened: usize, | 
|---|
| 592 | /// The current depth of iteration (the length of the stack at the | 
|---|
| 593 | /// beginning of each iteration). | 
|---|
| 594 | depth: usize, | 
|---|
| 595 | /// A list of DirEntries corresponding to directories, that are | 
|---|
| 596 | /// yielded after their contents has been fully yielded. This is only | 
|---|
| 597 | /// used when `contents_first` is enabled. | 
|---|
| 598 | deferred_dirs: Vec<DirEntry>, | 
|---|
| 599 | /// The device of the root file path when the first call to `next` was | 
|---|
| 600 | /// made. | 
|---|
| 601 | /// | 
|---|
| 602 | /// If the `same_file_system` option isn't enabled, then this is always | 
|---|
| 603 | /// `None`. Conversely, if it is enabled, this is always `Some(...)` after | 
|---|
| 604 | /// handling the root path. | 
|---|
| 605 | root_device: Option<u64>, | 
|---|
| 606 | } | 
|---|
| 607 |  | 
|---|
| 608 | /// An ancestor is an item in the directory tree traversed by walkdir, and is | 
|---|
| 609 | /// used to check for loops in the tree when traversing symlinks. | 
|---|
| 610 | #[ derive(Debug)] | 
|---|
| 611 | struct Ancestor { | 
|---|
| 612 | /// The path of this ancestor. | 
|---|
| 613 | path: PathBuf, | 
|---|
| 614 | /// An open file to this ancesor. This is only used on Windows where | 
|---|
| 615 | /// opening a file handle appears to be quite expensive, so we choose to | 
|---|
| 616 | /// cache it. This comes at the cost of not respecting the file descriptor | 
|---|
| 617 | /// limit set by the user. | 
|---|
| 618 | #[ cfg(windows)] | 
|---|
| 619 | handle: Handle, | 
|---|
| 620 | } | 
|---|
| 621 |  | 
|---|
| 622 | impl Ancestor { | 
|---|
| 623 | /// Create a new ancestor from the given directory path. | 
|---|
| 624 | #[ cfg(windows)] | 
|---|
| 625 | fn new(dent: &DirEntry) -> io::Result<Ancestor> { | 
|---|
| 626 | let handle = Handle::from_path(dent.path())?; | 
|---|
| 627 | Ok(Ancestor { path: dent.path().to_path_buf(), handle }) | 
|---|
| 628 | } | 
|---|
| 629 |  | 
|---|
| 630 | /// Create a new ancestor from the given directory path. | 
|---|
| 631 | #[ cfg(not(windows))] | 
|---|
| 632 | fn new(dent: &DirEntry) -> io::Result<Ancestor> { | 
|---|
| 633 | Ok(Ancestor { path: dent.path().to_path_buf() }) | 
|---|
| 634 | } | 
|---|
| 635 |  | 
|---|
| 636 | /// Returns true if and only if the given open file handle corresponds to | 
|---|
| 637 | /// the same directory as this ancestor. | 
|---|
| 638 | #[ cfg(windows)] | 
|---|
| 639 | fn is_same(&self, child: &Handle) -> io::Result<bool> { | 
|---|
| 640 | Ok(child == &self.handle) | 
|---|
| 641 | } | 
|---|
| 642 |  | 
|---|
| 643 | /// Returns true if and only if the given open file handle corresponds to | 
|---|
| 644 | /// the same directory as this ancestor. | 
|---|
| 645 | #[ cfg(not(windows))] | 
|---|
| 646 | fn is_same(&self, child: &Handle) -> io::Result<bool> { | 
|---|
| 647 | Ok(child == &Handle::from_path(&self.path)?) | 
|---|
| 648 | } | 
|---|
| 649 | } | 
|---|
| 650 |  | 
|---|
| 651 | /// A sequence of unconsumed directory entries. | 
|---|
| 652 | /// | 
|---|
| 653 | /// This represents the opened or closed state of a directory handle. When | 
|---|
| 654 | /// open, future entries are read by iterating over the raw `fs::ReadDir`. | 
|---|
| 655 | /// When closed, all future entries are read into memory. Iteration then | 
|---|
| 656 | /// proceeds over a [`Vec<fs::DirEntry>`]. | 
|---|
| 657 | /// | 
|---|
| 658 | /// [`fs::ReadDir`]: https://doc.rust-lang.org/stable/std/fs/struct.ReadDir.html | 
|---|
| 659 | /// [`Vec<fs::DirEntry>`]: https://doc.rust-lang.org/stable/std/vec/struct.Vec.html | 
|---|
| 660 | #[ derive(Debug)] | 
|---|
| 661 | enum DirList { | 
|---|
| 662 | /// An opened handle. | 
|---|
| 663 | /// | 
|---|
| 664 | /// This includes the depth of the handle itself. | 
|---|
| 665 | /// | 
|---|
| 666 | /// If there was an error with the initial [`fs::read_dir`] call, then it | 
|---|
| 667 | /// is stored here. (We use an [`Option<...>`] to make yielding the error | 
|---|
| 668 | /// exactly once simpler.) | 
|---|
| 669 | /// | 
|---|
| 670 | /// [`fs::read_dir`]: https://doc.rust-lang.org/stable/std/fs/fn.read_dir.html | 
|---|
| 671 | /// [`Option<...>`]: https://doc.rust-lang.org/stable/std/option/enum.Option.html | 
|---|
| 672 | Opened { depth: usize, it: result::Result<ReadDir, Option<Error>> }, | 
|---|
| 673 | /// A closed handle. | 
|---|
| 674 | /// | 
|---|
| 675 | /// All remaining directory entries are read into memory. | 
|---|
| 676 | Closed(vec::IntoIter<Result<DirEntry>>), | 
|---|
| 677 | } | 
|---|
| 678 |  | 
|---|
| 679 | impl Iterator for IntoIter { | 
|---|
| 680 | type Item = Result<DirEntry>; | 
|---|
| 681 | /// Advances the iterator and returns the next value. | 
|---|
| 682 | /// | 
|---|
| 683 | /// # Errors | 
|---|
| 684 | /// | 
|---|
| 685 | /// If the iterator fails to retrieve the next value, this method returns | 
|---|
| 686 | /// an error value. The error will be wrapped in an Option::Some. | 
|---|
| 687 | fn next(&mut self) -> Option<Result<DirEntry>> { | 
|---|
| 688 | if let Some(start) = self.start.take() { | 
|---|
| 689 | if self.opts.same_file_system { | 
|---|
| 690 | let result = util::device_num(&start) | 
|---|
| 691 | .map_err(|e| Error::from_path(0, start.clone(), e)); | 
|---|
| 692 | self.root_device = Some(itry!(result)); | 
|---|
| 693 | } | 
|---|
| 694 | let dent = itry!(DirEntry::from_path(0, start, false)); | 
|---|
| 695 | if let Some(result) = self.handle_entry(dent) { | 
|---|
| 696 | return Some(result); | 
|---|
| 697 | } | 
|---|
| 698 | } | 
|---|
| 699 | while !self.stack_list.is_empty() { | 
|---|
| 700 | self.depth = self.stack_list.len(); | 
|---|
| 701 | if let Some(dentry) = self.get_deferred_dir() { | 
|---|
| 702 | return Some(Ok(dentry)); | 
|---|
| 703 | } | 
|---|
| 704 | if self.depth > self.opts.max_depth { | 
|---|
| 705 | // If we've exceeded the max depth, pop the current dir | 
|---|
| 706 | // so that we don't descend. | 
|---|
| 707 | self.pop(); | 
|---|
| 708 | continue; | 
|---|
| 709 | } | 
|---|
| 710 | // Unwrap is safe here because we've verified above that | 
|---|
| 711 | // `self.stack_list` is not empty | 
|---|
| 712 | let next = self | 
|---|
| 713 | .stack_list | 
|---|
| 714 | .last_mut() | 
|---|
| 715 | .expect( "BUG: stack should be non-empty") | 
|---|
| 716 | .next(); | 
|---|
| 717 | match next { | 
|---|
| 718 | None => self.pop(), | 
|---|
| 719 | Some(Err(err)) => return Some(Err(err)), | 
|---|
| 720 | Some(Ok(dent)) => { | 
|---|
| 721 | if let Some(result) = self.handle_entry(dent) { | 
|---|
| 722 | return Some(result); | 
|---|
| 723 | } | 
|---|
| 724 | } | 
|---|
| 725 | } | 
|---|
| 726 | } | 
|---|
| 727 | if self.opts.contents_first { | 
|---|
| 728 | self.depth = self.stack_list.len(); | 
|---|
| 729 | if let Some(dentry) = self.get_deferred_dir() { | 
|---|
| 730 | return Some(Ok(dentry)); | 
|---|
| 731 | } | 
|---|
| 732 | } | 
|---|
| 733 | None | 
|---|
| 734 | } | 
|---|
| 735 | } | 
|---|
| 736 |  | 
|---|
| 737 | impl IntoIter { | 
|---|
| 738 | /// Skips the current directory. | 
|---|
| 739 | /// | 
|---|
| 740 | /// This causes the iterator to stop traversing the contents of the least | 
|---|
| 741 | /// recently yielded directory. This means any remaining entries in that | 
|---|
| 742 | /// directory will be skipped (including sub-directories). | 
|---|
| 743 | /// | 
|---|
| 744 | /// Note that the ergonomics of this method are questionable since it | 
|---|
| 745 | /// borrows the iterator mutably. Namely, you must write out the looping | 
|---|
| 746 | /// condition manually. For example, to skip hidden entries efficiently on | 
|---|
| 747 | /// unix systems: | 
|---|
| 748 | /// | 
|---|
| 749 | /// ```no_run | 
|---|
| 750 | /// use walkdir::{DirEntry, WalkDir}; | 
|---|
| 751 | /// | 
|---|
| 752 | /// fn is_hidden(entry: &DirEntry) -> bool { | 
|---|
| 753 | ///     entry.file_name() | 
|---|
| 754 | ///          .to_str() | 
|---|
| 755 | ///          .map(|s| s.starts_with( ".")) | 
|---|
| 756 | ///          .unwrap_or(false) | 
|---|
| 757 | /// } | 
|---|
| 758 | /// | 
|---|
| 759 | /// let mut it = WalkDir::new( "foo").into_iter(); | 
|---|
| 760 | /// loop { | 
|---|
| 761 | ///     let entry = match it.next() { | 
|---|
| 762 | ///         None => break, | 
|---|
| 763 | ///         Some(Err(err)) => panic!( "ERROR: {}", err), | 
|---|
| 764 | ///         Some(Ok(entry)) => entry, | 
|---|
| 765 | ///     }; | 
|---|
| 766 | ///     if is_hidden(&entry) { | 
|---|
| 767 | ///         if entry.file_type().is_dir() { | 
|---|
| 768 | ///             it.skip_current_dir(); | 
|---|
| 769 | ///         } | 
|---|
| 770 | ///         continue; | 
|---|
| 771 | ///     } | 
|---|
| 772 | ///     println!( "{}", entry.path().display()); | 
|---|
| 773 | /// } | 
|---|
| 774 | /// ``` | 
|---|
| 775 | /// | 
|---|
| 776 | /// You may find it more convenient to use the [`filter_entry`] iterator | 
|---|
| 777 | /// adapter. (See its documentation for the same example functionality as | 
|---|
| 778 | /// above.) | 
|---|
| 779 | /// | 
|---|
| 780 | /// [`filter_entry`]: #method.filter_entry | 
|---|
| 781 | pub fn skip_current_dir(&mut self) { | 
|---|
| 782 | if !self.stack_list.is_empty() { | 
|---|
| 783 | self.pop(); | 
|---|
| 784 | } | 
|---|
| 785 | } | 
|---|
| 786 |  | 
|---|
| 787 | /// Yields only entries which satisfy the given predicate and skips | 
|---|
| 788 | /// descending into directories that do not satisfy the given predicate. | 
|---|
| 789 | /// | 
|---|
| 790 | /// The predicate is applied to all entries. If the predicate is | 
|---|
| 791 | /// true, iteration carries on as normal. If the predicate is false, the | 
|---|
| 792 | /// entry is ignored and if it is a directory, it is not descended into. | 
|---|
| 793 | /// | 
|---|
| 794 | /// This is often more convenient to use than [`skip_current_dir`]. For | 
|---|
| 795 | /// example, to skip hidden files and directories efficiently on unix | 
|---|
| 796 | /// systems: | 
|---|
| 797 | /// | 
|---|
| 798 | /// ```no_run | 
|---|
| 799 | /// use walkdir::{DirEntry, WalkDir}; | 
|---|
| 800 | /// # use walkdir::Error; | 
|---|
| 801 | /// | 
|---|
| 802 | /// fn is_hidden(entry: &DirEntry) -> bool { | 
|---|
| 803 | ///     entry.file_name() | 
|---|
| 804 | ///          .to_str() | 
|---|
| 805 | ///          .map(|s| s.starts_with( ".")) | 
|---|
| 806 | ///          .unwrap_or(false) | 
|---|
| 807 | /// } | 
|---|
| 808 | /// | 
|---|
| 809 | /// # fn try_main() -> Result<(), Error> { | 
|---|
| 810 | /// for entry in WalkDir::new( "foo") | 
|---|
| 811 | ///                      .into_iter() | 
|---|
| 812 | ///                      .filter_entry(|e| !is_hidden(e)) { | 
|---|
| 813 | ///     println!( "{}", entry?.path().display()); | 
|---|
| 814 | /// } | 
|---|
| 815 | /// # Ok(()) | 
|---|
| 816 | /// # } | 
|---|
| 817 | /// ``` | 
|---|
| 818 | /// | 
|---|
| 819 | /// Note that the iterator will still yield errors for reading entries that | 
|---|
| 820 | /// may not satisfy the predicate. | 
|---|
| 821 | /// | 
|---|
| 822 | /// Note that entries skipped with [`min_depth`] and [`max_depth`] are not | 
|---|
| 823 | /// passed to this predicate. | 
|---|
| 824 | /// | 
|---|
| 825 | /// Note that if the iterator has `contents_first` enabled, then this | 
|---|
| 826 | /// method is no different than calling the standard `Iterator::filter` | 
|---|
| 827 | /// method (because directory entries are yielded after they've been | 
|---|
| 828 | /// descended into). | 
|---|
| 829 | /// | 
|---|
| 830 | /// [`skip_current_dir`]: #method.skip_current_dir | 
|---|
| 831 | /// [`min_depth`]: struct.WalkDir.html#method.min_depth | 
|---|
| 832 | /// [`max_depth`]: struct.WalkDir.html#method.max_depth | 
|---|
| 833 | pub fn filter_entry<P>(self, predicate: P) -> FilterEntry<Self, P> | 
|---|
| 834 | where | 
|---|
| 835 | P: FnMut(&DirEntry) -> bool, | 
|---|
| 836 | { | 
|---|
| 837 | FilterEntry { it: self, predicate } | 
|---|
| 838 | } | 
|---|
| 839 |  | 
|---|
| 840 | fn handle_entry( | 
|---|
| 841 | &mut self, | 
|---|
| 842 | mut dent: DirEntry, | 
|---|
| 843 | ) -> Option<Result<DirEntry>> { | 
|---|
| 844 | if self.opts.follow_links && dent.file_type().is_symlink() { | 
|---|
| 845 | dent = itry!(self.follow(dent)); | 
|---|
| 846 | } | 
|---|
| 847 | let is_normal_dir = !dent.file_type().is_symlink() && dent.is_dir(); | 
|---|
| 848 | if is_normal_dir { | 
|---|
| 849 | if self.opts.same_file_system && dent.depth() > 0 { | 
|---|
| 850 | if itry!(self.is_same_file_system(&dent)) { | 
|---|
| 851 | itry!(self.push(&dent)); | 
|---|
| 852 | } | 
|---|
| 853 | } else { | 
|---|
| 854 | itry!(self.push(&dent)); | 
|---|
| 855 | } | 
|---|
| 856 | } else if dent.depth() == 0 | 
|---|
| 857 | && dent.file_type().is_symlink() | 
|---|
| 858 | && self.opts.follow_root_links | 
|---|
| 859 | { | 
|---|
| 860 | // As a special case, if we are processing a root entry, then we | 
|---|
| 861 | // always follow it even if it's a symlink and follow_links is | 
|---|
| 862 | // false. We are careful to not let this change the semantics of | 
|---|
| 863 | // the DirEntry however. Namely, the DirEntry should still respect | 
|---|
| 864 | // the follow_links setting. When it's disabled, it should report | 
|---|
| 865 | // itself as a symlink. When it's enabled, it should always report | 
|---|
| 866 | // itself as the target. | 
|---|
| 867 | let md = itry!(fs::metadata(dent.path()).map_err(|err| { | 
|---|
| 868 | Error::from_path(dent.depth(), dent.path().to_path_buf(), err) | 
|---|
| 869 | })); | 
|---|
| 870 | if md.file_type().is_dir() { | 
|---|
| 871 | itry!(self.push(&dent)); | 
|---|
| 872 | } | 
|---|
| 873 | } | 
|---|
| 874 | if is_normal_dir && self.opts.contents_first { | 
|---|
| 875 | self.deferred_dirs.push(dent); | 
|---|
| 876 | None | 
|---|
| 877 | } else if self.skippable() { | 
|---|
| 878 | None | 
|---|
| 879 | } else { | 
|---|
| 880 | Some(Ok(dent)) | 
|---|
| 881 | } | 
|---|
| 882 | } | 
|---|
| 883 |  | 
|---|
| 884 | fn get_deferred_dir(&mut self) -> Option<DirEntry> { | 
|---|
| 885 | if self.opts.contents_first { | 
|---|
| 886 | if self.depth < self.deferred_dirs.len() { | 
|---|
| 887 | // Unwrap is safe here because we've guaranteed that | 
|---|
| 888 | // `self.deferred_dirs.len()` can never be less than 1 | 
|---|
| 889 | let deferred: DirEntry = self | 
|---|
| 890 | .deferred_dirs | 
|---|
| 891 | .pop() | 
|---|
| 892 | .expect( "BUG: deferred_dirs should be non-empty"); | 
|---|
| 893 | if !self.skippable() { | 
|---|
| 894 | return Some(deferred); | 
|---|
| 895 | } | 
|---|
| 896 | } | 
|---|
| 897 | } | 
|---|
| 898 | None | 
|---|
| 899 | } | 
|---|
| 900 |  | 
|---|
| 901 | fn push(&mut self, dent: &DirEntry) -> Result<()> { | 
|---|
| 902 | // Make room for another open file descriptor if we've hit the max. | 
|---|
| 903 | let free = | 
|---|
| 904 | self.stack_list.len().checked_sub(self.oldest_opened).unwrap(); | 
|---|
| 905 | if free == self.opts.max_open { | 
|---|
| 906 | self.stack_list[self.oldest_opened].close(); | 
|---|
| 907 | } | 
|---|
| 908 | // Open a handle to reading the directory's entries. | 
|---|
| 909 | let rd = fs::read_dir(dent.path()).map_err(|err| { | 
|---|
| 910 | Some(Error::from_path(self.depth, dent.path().to_path_buf(), err)) | 
|---|
| 911 | }); | 
|---|
| 912 | let mut list = DirList::Opened { depth: self.depth, it: rd }; | 
|---|
| 913 | if let Some(ref mut cmp) = self.opts.sorter { | 
|---|
| 914 | let mut entries: Vec<_> = list.collect(); | 
|---|
| 915 | entries.sort_by(|a, b| match (a, b) { | 
|---|
| 916 | (&Ok(ref a), &Ok(ref b)) => cmp(a, b), | 
|---|
| 917 | (&Err(_), &Err(_)) => Ordering::Equal, | 
|---|
| 918 | (&Ok(_), &Err(_)) => Ordering::Greater, | 
|---|
| 919 | (&Err(_), &Ok(_)) => Ordering::Less, | 
|---|
| 920 | }); | 
|---|
| 921 | list = DirList::Closed(entries.into_iter()); | 
|---|
| 922 | } | 
|---|
| 923 | if self.opts.follow_links { | 
|---|
| 924 | let ancestor = Ancestor::new(&dent) | 
|---|
| 925 | .map_err(|err| Error::from_io(self.depth, err))?; | 
|---|
| 926 | self.stack_path.push(ancestor); | 
|---|
| 927 | } | 
|---|
| 928 | // We push this after stack_path since creating the Ancestor can fail. | 
|---|
| 929 | // If it fails, then we return the error and won't descend. | 
|---|
| 930 | self.stack_list.push(list); | 
|---|
| 931 | // If we had to close out a previous directory stream, then we need to | 
|---|
| 932 | // increment our index the oldest still-open stream. We do this only | 
|---|
| 933 | // after adding to our stack, in order to ensure that the oldest_opened | 
|---|
| 934 | // index remains valid. The worst that can happen is that an already | 
|---|
| 935 | // closed stream will be closed again, which is a no-op. | 
|---|
| 936 | // | 
|---|
| 937 | // We could move the close of the stream above into this if-body, but | 
|---|
| 938 | // then we would have more than the maximum number of file descriptors | 
|---|
| 939 | // open at a particular point in time. | 
|---|
| 940 | if free == self.opts.max_open { | 
|---|
| 941 | // Unwrap is safe here because self.oldest_opened is guaranteed to | 
|---|
| 942 | // never be greater than `self.stack_list.len()`, which implies | 
|---|
| 943 | // that the subtraction won't underflow and that adding 1 will | 
|---|
| 944 | // never overflow. | 
|---|
| 945 | self.oldest_opened = self.oldest_opened.checked_add(1).unwrap(); | 
|---|
| 946 | } | 
|---|
| 947 | Ok(()) | 
|---|
| 948 | } | 
|---|
| 949 |  | 
|---|
| 950 | fn pop(&mut self) { | 
|---|
| 951 | self.stack_list.pop().expect( "BUG: cannot pop from empty stack"); | 
|---|
| 952 | if self.opts.follow_links { | 
|---|
| 953 | self.stack_path.pop().expect( "BUG: list/path stacks out of sync"); | 
|---|
| 954 | } | 
|---|
| 955 | // If everything in the stack is already closed, then there is | 
|---|
| 956 | // room for at least one more open descriptor and it will | 
|---|
| 957 | // always be at the top of the stack. | 
|---|
| 958 | self.oldest_opened = min(self.oldest_opened, self.stack_list.len()); | 
|---|
| 959 | } | 
|---|
| 960 |  | 
|---|
| 961 | fn follow(&self, mut dent: DirEntry) -> Result<DirEntry> { | 
|---|
| 962 | dent = | 
|---|
| 963 | DirEntry::from_path(self.depth, dent.path().to_path_buf(), true)?; | 
|---|
| 964 | // The only way a symlink can cause a loop is if it points | 
|---|
| 965 | // to a directory. Otherwise, it always points to a leaf | 
|---|
| 966 | // and we can omit any loop checks. | 
|---|
| 967 | if dent.is_dir() { | 
|---|
| 968 | self.check_loop(dent.path())?; | 
|---|
| 969 | } | 
|---|
| 970 | Ok(dent) | 
|---|
| 971 | } | 
|---|
| 972 |  | 
|---|
| 973 | fn check_loop<P: AsRef<Path>>(&self, child: P) -> Result<()> { | 
|---|
| 974 | let hchild = Handle::from_path(&child) | 
|---|
| 975 | .map_err(|err| Error::from_io(self.depth, err))?; | 
|---|
| 976 | for ancestor in self.stack_path.iter().rev() { | 
|---|
| 977 | let is_same = ancestor | 
|---|
| 978 | .is_same(&hchild) | 
|---|
| 979 | .map_err(|err| Error::from_io(self.depth, err))?; | 
|---|
| 980 | if is_same { | 
|---|
| 981 | return Err(Error::from_loop( | 
|---|
| 982 | self.depth, | 
|---|
| 983 | &ancestor.path, | 
|---|
| 984 | child.as_ref(), | 
|---|
| 985 | )); | 
|---|
| 986 | } | 
|---|
| 987 | } | 
|---|
| 988 | Ok(()) | 
|---|
| 989 | } | 
|---|
| 990 |  | 
|---|
| 991 | fn is_same_file_system(&mut self, dent: &DirEntry) -> Result<bool> { | 
|---|
| 992 | let dent_device = util::device_num(dent.path()) | 
|---|
| 993 | .map_err(|err| Error::from_entry(dent, err))?; | 
|---|
| 994 | Ok(self | 
|---|
| 995 | .root_device | 
|---|
| 996 | .map(|d| d == dent_device) | 
|---|
| 997 | .expect( "BUG: called is_same_file_system without root device")) | 
|---|
| 998 | } | 
|---|
| 999 |  | 
|---|
| 1000 | fn skippable(&self) -> bool { | 
|---|
| 1001 | self.depth < self.opts.min_depth || self.depth > self.opts.max_depth | 
|---|
| 1002 | } | 
|---|
| 1003 | } | 
|---|
| 1004 |  | 
|---|
| 1005 | impl iter::FusedIterator for IntoIter {} | 
|---|
| 1006 |  | 
|---|
| 1007 | impl DirList { | 
|---|
| 1008 | fn close(&mut self) { | 
|---|
| 1009 | if let DirList::Opened { .. } = *self { | 
|---|
| 1010 | *self = DirList::Closed(self.collect::<Vec<_>>().into_iter()); | 
|---|
| 1011 | } | 
|---|
| 1012 | } | 
|---|
| 1013 | } | 
|---|
| 1014 |  | 
|---|
| 1015 | impl Iterator for DirList { | 
|---|
| 1016 | type Item = Result<DirEntry>; | 
|---|
| 1017 |  | 
|---|
| 1018 | #[ inline(always)] | 
|---|
| 1019 | fn next(&mut self) -> Option<Result<DirEntry>> { | 
|---|
| 1020 | match *self { | 
|---|
| 1021 | DirList::Closed(ref mut it: &mut IntoIter>) => it.next(), | 
|---|
| 1022 | DirList::Opened { depth: usize, ref mut it: &mut Result> } => match *it { | 
|---|
| 1023 | Err(ref mut err: &mut Option) => err.take().map(Err), | 
|---|
| 1024 | Ok(ref mut rd: &mut ReadDir) => rd.next().map(|r: Result| match r { | 
|---|
| 1025 | Ok(r: DirEntry) => DirEntry::from_entry(depth:depth + 1, &r), | 
|---|
| 1026 | Err(err: Error) => Err(Error::from_io(depth:depth + 1, err)), | 
|---|
| 1027 | }), | 
|---|
| 1028 | }, | 
|---|
| 1029 | } | 
|---|
| 1030 | } | 
|---|
| 1031 | } | 
|---|
| 1032 |  | 
|---|
| 1033 | /// A recursive directory iterator that skips entries. | 
|---|
| 1034 | /// | 
|---|
| 1035 | /// Values of this type are created by calling [`.filter_entry()`] on an | 
|---|
| 1036 | /// `IntoIter`, which is formed by calling [`.into_iter()`] on a `WalkDir`. | 
|---|
| 1037 | /// | 
|---|
| 1038 | /// Directories that fail the predicate `P` are skipped. Namely, they are | 
|---|
| 1039 | /// never yielded and never descended into. | 
|---|
| 1040 | /// | 
|---|
| 1041 | /// Entries that are skipped with the [`min_depth`] and [`max_depth`] options | 
|---|
| 1042 | /// are not passed through this filter. | 
|---|
| 1043 | /// | 
|---|
| 1044 | /// If opening a handle to a directory resulted in an error, then it is yielded | 
|---|
| 1045 | /// and no corresponding call to the predicate is made. | 
|---|
| 1046 | /// | 
|---|
| 1047 | /// Type parameter `I` refers to the underlying iterator and `P` refers to the | 
|---|
| 1048 | /// predicate, which is usually `FnMut(&DirEntry) -> bool`. | 
|---|
| 1049 | /// | 
|---|
| 1050 | /// [`.filter_entry()`]: struct.IntoIter.html#method.filter_entry | 
|---|
| 1051 | /// [`.into_iter()`]: struct.WalkDir.html#into_iter.v | 
|---|
| 1052 | /// [`min_depth`]: struct.WalkDir.html#method.min_depth | 
|---|
| 1053 | /// [`max_depth`]: struct.WalkDir.html#method.max_depth | 
|---|
| 1054 | #[ derive(Debug)] | 
|---|
| 1055 | pub struct FilterEntry<I, P> { | 
|---|
| 1056 | it: I, | 
|---|
| 1057 | predicate: P, | 
|---|
| 1058 | } | 
|---|
| 1059 |  | 
|---|
| 1060 | impl<P> Iterator for FilterEntry<IntoIter, P> | 
|---|
| 1061 | where | 
|---|
| 1062 | P: FnMut(&DirEntry) -> bool, | 
|---|
| 1063 | { | 
|---|
| 1064 | type Item = Result<DirEntry>; | 
|---|
| 1065 |  | 
|---|
| 1066 | /// Advances the iterator and returns the next value. | 
|---|
| 1067 | /// | 
|---|
| 1068 | /// # Errors | 
|---|
| 1069 | /// | 
|---|
| 1070 | /// If the iterator fails to retrieve the next value, this method returns | 
|---|
| 1071 | /// an error value. The error will be wrapped in an `Option::Some`. | 
|---|
| 1072 | fn next(&mut self) -> Option<Result<DirEntry>> { | 
|---|
| 1073 | loop { | 
|---|
| 1074 | let dent = match self.it.next() { | 
|---|
| 1075 | None => return None, | 
|---|
| 1076 | Some(result) => itry!(result), | 
|---|
| 1077 | }; | 
|---|
| 1078 | if !(self.predicate)(&dent) { | 
|---|
| 1079 | if dent.is_dir() { | 
|---|
| 1080 | self.it.skip_current_dir(); | 
|---|
| 1081 | } | 
|---|
| 1082 | continue; | 
|---|
| 1083 | } | 
|---|
| 1084 | return Some(Ok(dent)); | 
|---|
| 1085 | } | 
|---|
| 1086 | } | 
|---|
| 1087 | } | 
|---|
| 1088 |  | 
|---|
| 1089 | impl<P> iter::FusedIterator for FilterEntry<IntoIter, P> where | 
|---|
| 1090 | P: FnMut(&DirEntry) -> bool | 
|---|
| 1091 | { | 
|---|
| 1092 | } | 
|---|
| 1093 |  | 
|---|
| 1094 | impl<P> FilterEntry<IntoIter, P> | 
|---|
| 1095 | where | 
|---|
| 1096 | P: FnMut(&DirEntry) -> bool, | 
|---|
| 1097 | { | 
|---|
| 1098 | /// Yields only entries which satisfy the given predicate and skips | 
|---|
| 1099 | /// descending into directories that do not satisfy the given predicate. | 
|---|
| 1100 | /// | 
|---|
| 1101 | /// The predicate is applied to all entries. If the predicate is | 
|---|
| 1102 | /// true, iteration carries on as normal. If the predicate is false, the | 
|---|
| 1103 | /// entry is ignored and if it is a directory, it is not descended into. | 
|---|
| 1104 | /// | 
|---|
| 1105 | /// This is often more convenient to use than [`skip_current_dir`]. For | 
|---|
| 1106 | /// example, to skip hidden files and directories efficiently on unix | 
|---|
| 1107 | /// systems: | 
|---|
| 1108 | /// | 
|---|
| 1109 | /// ```no_run | 
|---|
| 1110 | /// use walkdir::{DirEntry, WalkDir}; | 
|---|
| 1111 | /// # use walkdir::Error; | 
|---|
| 1112 | /// | 
|---|
| 1113 | /// fn is_hidden(entry: &DirEntry) -> bool { | 
|---|
| 1114 | ///     entry.file_name() | 
|---|
| 1115 | ///          .to_str() | 
|---|
| 1116 | ///          .map(|s| s.starts_with( ".")) | 
|---|
| 1117 | ///          .unwrap_or(false) | 
|---|
| 1118 | /// } | 
|---|
| 1119 | /// | 
|---|
| 1120 | /// # fn try_main() -> Result<(), Error> { | 
|---|
| 1121 | /// for entry in WalkDir::new( "foo") | 
|---|
| 1122 | ///                      .into_iter() | 
|---|
| 1123 | ///                      .filter_entry(|e| !is_hidden(e)) { | 
|---|
| 1124 | ///     println!( "{}", entry?.path().display()); | 
|---|
| 1125 | /// } | 
|---|
| 1126 | /// # Ok(()) | 
|---|
| 1127 | /// # } | 
|---|
| 1128 | /// ``` | 
|---|
| 1129 | /// | 
|---|
| 1130 | /// Note that the iterator will still yield errors for reading entries that | 
|---|
| 1131 | /// may not satisfy the predicate. | 
|---|
| 1132 | /// | 
|---|
| 1133 | /// Note that entries skipped with [`min_depth`] and [`max_depth`] are not | 
|---|
| 1134 | /// passed to this predicate. | 
|---|
| 1135 | /// | 
|---|
| 1136 | /// Note that if the iterator has `contents_first` enabled, then this | 
|---|
| 1137 | /// method is no different than calling the standard `Iterator::filter` | 
|---|
| 1138 | /// method (because directory entries are yielded after they've been | 
|---|
| 1139 | /// descended into). | 
|---|
| 1140 | /// | 
|---|
| 1141 | /// [`skip_current_dir`]: #method.skip_current_dir | 
|---|
| 1142 | /// [`min_depth`]: struct.WalkDir.html#method.min_depth | 
|---|
| 1143 | /// [`max_depth`]: struct.WalkDir.html#method.max_depth | 
|---|
| 1144 | pub fn filter_entry(self, predicate: P) -> FilterEntry<Self, P> { | 
|---|
| 1145 | FilterEntry { it: self, predicate } | 
|---|
| 1146 | } | 
|---|
| 1147 |  | 
|---|
| 1148 | /// Skips the current directory. | 
|---|
| 1149 | /// | 
|---|
| 1150 | /// This causes the iterator to stop traversing the contents of the least | 
|---|
| 1151 | /// recently yielded directory. This means any remaining entries in that | 
|---|
| 1152 | /// directory will be skipped (including sub-directories). | 
|---|
| 1153 | /// | 
|---|
| 1154 | /// Note that the ergonomics of this method are questionable since it | 
|---|
| 1155 | /// borrows the iterator mutably. Namely, you must write out the looping | 
|---|
| 1156 | /// condition manually. For example, to skip hidden entries efficiently on | 
|---|
| 1157 | /// unix systems: | 
|---|
| 1158 | /// | 
|---|
| 1159 | /// ```no_run | 
|---|
| 1160 | /// use walkdir::{DirEntry, WalkDir}; | 
|---|
| 1161 | /// | 
|---|
| 1162 | /// fn is_hidden(entry: &DirEntry) -> bool { | 
|---|
| 1163 | ///     entry.file_name() | 
|---|
| 1164 | ///          .to_str() | 
|---|
| 1165 | ///          .map(|s| s.starts_with( ".")) | 
|---|
| 1166 | ///          .unwrap_or(false) | 
|---|
| 1167 | /// } | 
|---|
| 1168 | /// | 
|---|
| 1169 | /// let mut it = WalkDir::new( "foo").into_iter(); | 
|---|
| 1170 | /// loop { | 
|---|
| 1171 | ///     let entry = match it.next() { | 
|---|
| 1172 | ///         None => break, | 
|---|
| 1173 | ///         Some(Err(err)) => panic!( "ERROR: {}", err), | 
|---|
| 1174 | ///         Some(Ok(entry)) => entry, | 
|---|
| 1175 | ///     }; | 
|---|
| 1176 | ///     if is_hidden(&entry) { | 
|---|
| 1177 | ///         if entry.file_type().is_dir() { | 
|---|
| 1178 | ///             it.skip_current_dir(); | 
|---|
| 1179 | ///         } | 
|---|
| 1180 | ///         continue; | 
|---|
| 1181 | ///     } | 
|---|
| 1182 | ///     println!( "{}", entry.path().display()); | 
|---|
| 1183 | /// } | 
|---|
| 1184 | /// ``` | 
|---|
| 1185 | /// | 
|---|
| 1186 | /// You may find it more convenient to use the [`filter_entry`] iterator | 
|---|
| 1187 | /// adapter. (See its documentation for the same example functionality as | 
|---|
| 1188 | /// above.) | 
|---|
| 1189 | /// | 
|---|
| 1190 | /// [`filter_entry`]: #method.filter_entry | 
|---|
| 1191 | pub fn skip_current_dir(&mut self) { | 
|---|
| 1192 | self.it.skip_current_dir(); | 
|---|
| 1193 | } | 
|---|
| 1194 | } | 
|---|
| 1195 |  | 
|---|