;;; em-glob.el --- extended file name globbing -*- lexical-binding:t -*- ;; Copyright (C) 1999-2024 Free Software Foundation, Inc. ;; Author: John Wiegley ;; This file is part of GNU Emacs. ;; GNU Emacs is free software: you can redistribute it and/or modify ;; it under the terms of the GNU General Public License as published by ;; the Free Software Foundation, either version 3 of the License, or ;; (at your option) any later version. ;; GNU Emacs is distributed in the hope that it will be useful, ;; but WITHOUT ANY WARRANTY; without even the implied warranty of ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ;; GNU General Public License for more details. ;; You should have received a copy of the GNU General Public License ;; along with GNU Emacs. If not, see . ;;; Commentary: ;; The globbing code used by Eshell closely follows the syntax used by ;; zsh. Basically, here is a summary of examples: ;; ;; echo a* ; anything starting with 'a' ;; echo a#b ; zero or more 'a's, then 'b' ;; echo a##b ; one or more 'a's, then 'b' ;; echo a? ; a followed by any character ;; echo a*~ab ; 'a', then anything, but not 'ab' ;; echo c*~*~ ; all files beginning with 'c', except backups (*~) ;; ;; Recursive globbing is also supported: ;; ;; echo **/*.c ; all '.c' files at or under current directory ;; echo ***/*.c ; same as above, but traverse symbolic links ;; ;; Using argument predication, the recursive globbing syntax is ;; sufficient to replace the use of 'find | xargs ' in ;; most cases. For example, to change the readership of all files ;; belonging to 'johnw' in the '/tmp' directory or lower, use: ;; ;; chmod go-r /tmp/**/*(u'johnw') ;; ;; The glob above matches all of the files beneath '/tmp' that are ;; owned by the user 'johnw'. See [Value modifiers and predicates], ;; for more information about argument predication. ;;; Code: (require 'esh-arg) (require 'esh-module) (require 'esh-util) ;;;###autoload (progn (defgroup eshell-glob nil "This module provides extended globbing syntax, similar what is used by zsh for filename generation." :tag "Extended filename globbing" :group 'eshell-module)) ;;; User Variables: (defcustom eshell-glob-load-hook nil "A list of functions to run when `eshell-glob' is loaded." :version "24.1" ; removed eshell-glob-initialize :type 'hook :group 'eshell-glob) (defcustom eshell-glob-splice-results nil "If non-nil, the results of glob patterns will be spliced in-place. When splicing, the resulting command is as though the user typed each result individually. Otherwise, the glob results a single argument as a list." :version "30.1" :type 'boolean :group 'eshell-glob) (defcustom eshell-glob-include-dot-files nil "If non-nil, glob patterns will match files beginning with a dot." :type 'boolean :group 'eshell-glob) (defcustom eshell-glob-include-dot-dot t "If non-nil, glob patterns that match dots will match . and .." :type 'boolean :group 'eshell-glob) (defcustom eshell-glob-case-insensitive (not (not (eshell-under-windows-p))) "If non-nil, glob pattern matching will ignore case." :type 'boolean :group 'eshell-glob) (defcustom eshell-glob-show-progress nil "If non-nil, display progress messages during a recursive glob. This option slows down recursive glob processing by quite a bit." :type 'boolean :group 'eshell-glob) (defcustom eshell-error-if-no-glob nil "If non-nil, it is an error for a glob pattern not to match. This mimics the behavior of zsh if non-nil, but bash if nil." :type 'boolean :group 'eshell-glob) (defcustom eshell-glob-chars-list '(?\] ?\[ ?* ?? ?~ ?\( ?\) ?| ?# ?^) "List of additional characters used in extended globbing." :type '(repeat character) :group 'eshell-glob) (defcustom eshell-glob-translate-alist '((?\] . "]") (?\[ . "[") (?^ . "^") (?? . ".") (?* . ".*") (?~ . "~") (?\( . "\\(") (?\) . "\\)") (?\| . "\\|") (?# . (lambda (str pos) (if (and (< (1+ pos) (length str)) (memq (aref str (1+ pos)) '(?* ?# ?+ ??))) (cons (if (eq (aref str (1+ pos)) ??) "?" (if (eq (aref str (1+ pos)) ?*) "*" "+")) (+ pos 2)) (cons "*" (1+ pos)))))) "An alist for translation of extended globbing characters." :type '(alist :key-type character :value-type (choice string function)) :group 'eshell-glob) ;;; Functions: (defun eshell-glob-initialize () ;Called from `eshell-mode' via intern-soft! "Initialize the extended globbing code." ;; it's important that `eshell-glob-chars-list' come first (when (boundp 'eshell-special-chars-outside-quoting) (setq-local eshell-special-chars-outside-quoting (append eshell-glob-chars-list eshell-special-chars-outside-quoting))) (add-hook 'eshell-parse-argument-hook 'eshell-parse-glob-chars t t) (add-hook 'eshell-pre-rewrite-command-hook 'eshell-no-command-globbing nil t)) (defun eshell-no-command-globbing (terms) "Don't glob the command argument. Reflect this by modifying TERMS." (ignore (pcase (car terms) ((or `(eshell-extended-glob ,term) `(eshell-splice-args (eshell-extended-glob ,term))) (setcar terms term))))) (defun eshell-add-glob-modifier () "Add `eshell-extended-glob' to the argument modifier list." (when eshell-glob-splice-results (add-hook 'eshell-current-modifiers #'eshell-splice-args 99)) (add-hook 'eshell-current-modifiers #'eshell-extended-glob)) (defun eshell-parse-glob-chars () "Parse a globbing delimiter. The character is not advanced for ordinary globbing characters, so that other function may have a chance to override the globbing interpretation." (when (memq (char-after) eshell-glob-chars-list) (if (not (memq (char-after) '(?\( ?\[))) (ignore (eshell-add-glob-modifier)) (let ((here (point))) (forward-char) (let* ((delim (char-before)) (end (eshell-find-delimiter delim (if (eq delim ?\[) ?\] ?\))))) (if (not end) (throw 'eshell-incomplete (char-to-string delim)) (if (and (eshell-using-module 'eshell-pred) (eshell-arg-delimiter (1+ end))) (ignore (goto-char here)) (eshell-add-glob-modifier) (prog1 (buffer-substring-no-properties (1- (point)) (1+ end)) (goto-char (1+ end)))))))))) (defvar eshell-glob-chars-regexp nil) (defvar eshell-glob-matches) (defvar message-shown) (defvar eshell-glob-recursive-alist '(("**/" . recurse) ("***/" . recurse-symlink))) (defun eshell-glob-regexp (pattern) "Convert glob-pattern PATTERN to a regular expression. The basic syntax is: glob regexp meaning ---- ------ ------- ? . matches any single character * .* matches any group of characters (or none) # * matches zero or more occurrences of preceding ## + matches one or more occurrences of preceding (x) \\(x\\) makes `x' a regular expression group | \\| boolean OR within an expression group [a-b] [a-b] matches a character or range [^a] [^a] excludes a character or range If any characters in PATTERN have the text property `escaped' set to true, then these characters will match themselves in the resulting regular expression." (let ((matched-in-pattern 0) ; How much of PATTERN handled regexp) (while (string-match (or eshell-glob-chars-regexp (setq-local eshell-glob-chars-regexp (format "[%s]+" (apply 'string eshell-glob-chars-list)))) pattern matched-in-pattern) (let* ((op-begin (match-beginning 0)) (op-char (aref pattern op-begin))) (setq regexp (concat regexp (regexp-quote (substring pattern matched-in-pattern op-begin)))) (if (get-text-property op-begin 'escaped pattern) (setq regexp (concat regexp (regexp-quote (char-to-string op-char))) matched-in-pattern (1+ op-begin)) (let ((xlat (assq op-char eshell-glob-translate-alist))) (if (not xlat) (error "Unrecognized globbing character `%c'" op-char) (if (stringp (cdr xlat)) (setq regexp (concat regexp (cdr xlat)) matched-in-pattern (1+ op-begin)) (let ((result (funcall (cdr xlat) pattern op-begin))) (setq regexp (concat regexp (car result)) matched-in-pattern (cdr result))))))))) (concat "\\`" regexp (regexp-quote (substring pattern matched-in-pattern)) "\\'"))) (defun eshell-glob-convert-1 (glob &optional last) "Convert a GLOB matching a single element of a file name to regexps. If LAST is non-nil, this glob is the last element of a file name. The result is a pair of regexps, the first for file names to include, and the second for ones to exclude." (let ((len (length glob)) (index 1) (incl glob) excl) ;; We can't use `directory-file-name' because it strips away text ;; properties in the string. (let ((last (1- (length incl)))) (when (eq (aref incl last) ?/) (setq incl (substring incl 0 last)))) ;; Split the glob if it contains a negation like x~y. (while (and (eq incl glob) (setq index (string-search "~" glob index))) (if (or (get-text-property index 'escaped glob) (or (= (1+ index) len))) (setq index (1+ index)) (setq incl (substring glob 0 index) excl (substring glob (1+ index))))) (setq incl (eshell-glob-regexp incl) excl (and excl (eshell-glob-regexp excl))) ;; Exclude dot files if requested. (if (or eshell-glob-include-dot-files (eq (aref glob 0) ?.)) (unless (or eshell-glob-include-dot-dot (not last)) (setq excl (if excl (concat "\\(\\`\\.\\.?\\'\\|" excl "\\)") "\\`\\.\\.?\\'"))) (setq excl (if excl (concat "\\(\\`\\.\\|" excl "\\)") "\\`\\."))) (cons incl excl))) (defun eshell-glob-convert (glob) "Convert an Eshell glob-pattern GLOB to regexps. The result is a list of three elements: 1. The base directory to search in. 2. A list containing elements of the following forms: * Regexp pairs as generated by `eshell-glob-convert-1'. * `recurse', indicating that searches should recurse into subdirectories. * `recurse-symlink', like `recurse', but also following symlinks. 3. A boolean indicating whether to match directories only." (let ((globs (eshell-split-path glob)) (isdir (eq (aref glob (1- (length glob))) ?/)) start-dir result last-saw-recursion) (if (and (cdr globs) (file-name-absolute-p (car globs))) (setq start-dir (car globs) globs (cdr globs)) (setq start-dir ".")) (while globs (if-let ((recurse (cdr (assoc (car globs) eshell-glob-recursive-alist)))) (if last-saw-recursion (setcar result recurse) (push recurse result) (setq last-saw-recursion t)) (push (eshell-glob-convert-1 (car globs) (null (cdr globs))) result) (setq last-saw-recursion nil)) (setq globs (cdr globs))) (list (file-name-as-directory start-dir) (nreverse result) isdir))) (defun eshell-extended-glob (glob) "Return a list of files matched by GLOB. If no files match, signal an error (if `eshell-error-if-no-glob' is non-nil), or otherwise return GLOB itself. This function almost fully supports zsh style filename generation syntax. Things that are not supported are: ^foo for matching everything but foo (foo~bar) tilde within a parenthesis group foo<1-10> numeric ranges foo~x(a|b) (a|b) will be interpreted as a predicate/modifier list Mainly they are not supported because file matching is done with Emacs regular expressions, and these cannot support the above constructs." (let ((globs (eshell-glob-convert glob)) eshell-glob-matches message-shown) (unwind-protect (apply #'eshell-glob-entries globs) (if message-shown (message nil))) (or (and eshell-glob-matches (sort eshell-glob-matches #'string<)) (if eshell-error-if-no-glob (error "No matches found: %s" glob) (if eshell-glob-splice-results (list glob) glob))))) ;; FIXME does this really need to abuse eshell-glob-matches, message-shown? (defun eshell-glob-entries (path globs only-dirs) "Match the entries in PATH against GLOBS. GLOBS is a list of globs as converted by `eshell-glob-convert', which see. If ONLY-DIRS is non-nil, only match directories; otherwise, match directories and files." (let* ((entries (ignore-errors (file-name-all-completions "" path))) (case-fold-search eshell-glob-case-insensitive) glob glob-remainder recurse-p) (if (rassq (car globs) eshell-glob-recursive-alist) (setq recurse-p (car globs) glob (or (cadr globs) (eshell-glob-convert-1 "*" t)) glob-remainder (cddr globs)) (setq glob (car globs) glob-remainder (cdr globs))) (when (and recurse-p eshell-glob-show-progress) (message "Building file list...%d so far: %s" (length eshell-glob-matches) path) (setq message-shown t)) (when (equal path "./") (setq path "")) (let ((incl (car glob)) (excl (cdr glob)) dirs rdirs) (dolist (name entries) (let* ((len (length name)) (isdir (eq (aref name (1- len)) ?/)) pathname) (when (let ((fname (directory-file-name name))) (and (not (and excl (string-match excl fname))) (string-match incl fname))) (if glob-remainder (when isdir (push (concat path name) dirs)) (when (or (not only-dirs) (and isdir (not (and (eq recurse-p 'recurse) (file-symlink-p (directory-file-name (concat path name))))))) (push (concat path name) eshell-glob-matches)))) (when (and recurse-p isdir (not (member name '("./" "../"))) (setq pathname (concat path name)) (not (and (eq recurse-p 'recurse) (file-symlink-p (directory-file-name pathname))))) (push pathname rdirs)))) (dolist (dir (nreverse dirs)) (eshell-glob-entries dir glob-remainder only-dirs)) (dolist (rdir (nreverse rdirs)) (eshell-glob-entries rdir globs only-dirs))))) (provide 'em-glob) ;; Local Variables: ;; generated-autoload-file: "esh-groups.el" ;; End: ;;; em-glob.el ends here