diff options
| author | Richard M. Stallman | 1993-11-23 19:32:27 +0000 |
|---|---|---|
| committer | Richard M. Stallman | 1993-11-23 19:32:27 +0000 |
| commit | 089c3fb3e632782886c898fa1977f2394003733c (patch) | |
| tree | d3a79935ca0c8fdf8291c5eb0f7dc4ba0b72ed07 | |
| parent | 4e08e741828628c22300799357c35736be201838 (diff) | |
| download | emacs-089c3fb3e632782886c898fa1977f2394003733c.tar.gz emacs-089c3fb3e632782886c898fa1977f2394003733c.zip | |
Initial revision
| -rw-r--r-- | lisp/regi.el | 259 |
1 files changed, 259 insertions, 0 deletions
diff --git a/lisp/regi.el b/lisp/regi.el new file mode 100644 index 00000000000..9e29c6e2eb5 --- /dev/null +++ b/lisp/regi.el | |||
| @@ -0,0 +1,259 @@ | |||
| 1 | ;;; regi.el --- REGular expression Interpreting engine | ||
| 2 | |||
| 3 | ;; Author: 1993 Barry A. Warsaw, Century Computing, Inc. <bwarsaw@cen.com> | ||
| 4 | ;; Maintainer: bwarsaw@cen.com | ||
| 5 | ;; Created: 24-Feb-1993 | ||
| 6 | ;; Version: 1.8 | ||
| 7 | ;; Last Modified: 1993/06/01 21:33:00 | ||
| 8 | ;; Keywords: regular expression regexp matching text | ||
| 9 | |||
| 10 | ;; Copyright (C) 1993 Barry A. Warsaw | ||
| 11 | |||
| 12 | ;; This file is not yet part of GNU Emacs. | ||
| 13 | ;; | ||
| 14 | ;; This program is free software; you can redistribute it and/or modify | ||
| 15 | ;; it under the terms of the GNU General Public License as published by | ||
| 16 | ;; the Free Software Foundation; either version 2 of the License, or | ||
| 17 | ;; (at your option) any later version. | ||
| 18 | ;; | ||
| 19 | ;; This program is distributed in the hope that it will be useful, | ||
| 20 | ;; but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
| 21 | ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | ||
| 22 | ;; GNU General Public License for more details. | ||
| 23 | ;; | ||
| 24 | ;; You should have received a copy of the GNU General Public License | ||
| 25 | ;; along with this program; if not, write to the Free Software | ||
| 26 | ;; Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. | ||
| 27 | |||
| 28 | ;; LCD Archive Entry | ||
| 29 | ;; regi|Barry A. Warsaw|bwarsaw@cen.com | ||
| 30 | ;; |REGular expression Interpreting engine | ||
| 31 | ;; |1993/06/01 21:33:00|1.8| | ||
| 32 | |||
| 33 | ;;; Code: | ||
| 34 | |||
| 35 | |||
| 36 | (defun regi-pos (&optional position col-p) | ||
| 37 | "Return the character position at various buffer positions. | ||
| 38 | Optional POSITION can be one of the following symbols: | ||
| 39 | |||
| 40 | `bol' == beginning of line | ||
| 41 | `boi' == beginning of indentation | ||
| 42 | `eol' == end of line [default] | ||
| 43 | `bonl' == beginning of next line | ||
| 44 | `bopl' == beginning of previous line | ||
| 45 | |||
| 46 | Optional COL-P non-nil returns `current-column' instead of character position." | ||
| 47 | (save-excursion | ||
| 48 | (cond | ||
| 49 | ((eq position 'bol) (beginning-of-line)) | ||
| 50 | ((eq position 'boi) (back-to-indentation)) | ||
| 51 | ((eq position 'bonl) (forward-line 1)) | ||
| 52 | ((eq position 'bopl) (forward-line -1)) | ||
| 53 | (t (end-of-line))) | ||
| 54 | (if col-p (current-column) (point)))) | ||
| 55 | |||
| 56 | (defun regi-mapcar (predlist func &optional negate-p case-fold-search-p) | ||
| 57 | "Build a regi frame where each element of PREDLIST appears exactly once. | ||
| 58 | The frame contains elements where each member of PREDLIST is | ||
| 59 | associated with FUNC, and optionally NEGATE-P and CASE-FOLD-SEARCH-P." | ||
| 60 | (let (frame tail) | ||
| 61 | (if (or negate-p case-fold-search-p) | ||
| 62 | (setq tail (list negate-p))) | ||
| 63 | (if case-fold-search-p | ||
| 64 | (setq tail (append tail (list case-fold-search-p)))) | ||
| 65 | (while predlist | ||
| 66 | (let ((element (list (car predlist) func))) | ||
| 67 | (if tail | ||
| 68 | (setq element (append element tail))) | ||
| 69 | (setq frame (append frame (list element)) | ||
| 70 | predlist (cdr predlist)) | ||
| 71 | )) | ||
| 72 | frame)) | ||
| 73 | |||
| 74 | |||
| 75 | (defun regi-interpret (frame &optional start end) | ||
| 76 | "Interpret the regi frame FRAME. | ||
| 77 | If optional START and END are supplied, they indicate the region of | ||
| 78 | interest, and the buffer is narrowed to the beginning of the line | ||
| 79 | containing START, and beginning of the line after the line containing | ||
| 80 | END. Otherwise, point and mark are not set and processing continues | ||
| 81 | until your FUNC returns the `abort' symbol (see below). Beware! Not | ||
| 82 | supplying a START or END could put you in an infinite loop. | ||
| 83 | |||
| 84 | A regi frame is a list of entries of the form: | ||
| 85 | |||
| 86 | (PRED FUNC [NEGATE-P [CASE-FOLD-SEARCH]]) | ||
| 87 | |||
| 88 | PRED is a predicate against which each line in the region is tested, | ||
| 89 | and if a match occurs, FUNC is `eval'd. Point is then moved to the | ||
| 90 | beginning of the next line, the frame is reset and checking continues. | ||
| 91 | If a match doesn't occur, the next entry is checked against the | ||
| 92 | current line until all entries in the frame are checked. At this | ||
| 93 | point, if no match occurred, the frame is reset and point is moved to | ||
| 94 | the next line. Checking continues until every line in the region is | ||
| 95 | checked. Optional NEGATE-P inverts the result of PRED before FUNC is | ||
| 96 | called and `case-fold-search' is bound to the optional value of | ||
| 97 | CASE-FOLD-SEARCH for the PRED check. | ||
| 98 | |||
| 99 | PRED can be a string, variable, function or one of the following | ||
| 100 | symbols: t, nil, `begin', `end', and `every'. If PRED is a string, or | ||
| 101 | a variable or list that evaluates to a string, it is interpreted as a | ||
| 102 | regular expression and is matched against the current line (from the | ||
| 103 | beginning) using `looking-at'. If PRED does not evaluate to a string, | ||
| 104 | it is interpreted as a binary value (nil or non-nil). | ||
| 105 | |||
| 106 | PRED can also be one of the following symbols: | ||
| 107 | |||
| 108 | t -- always produces a true outcome | ||
| 109 | `begin' -- always executes before anything else | ||
| 110 | `end' -- always executes after everything else | ||
| 111 | `every' -- execute after frame is matched on a line | ||
| 112 | |||
| 113 | Note that NEGATE-P and CASE-FOLD-SEARCH are meaningless if PRED is one | ||
| 114 | of these special symbols. Only the first occurance of each symbol in | ||
| 115 | a frame entry is used, the rest are ignored. | ||
| 116 | |||
| 117 | Your FUNC can return values which control regi processing. If a list | ||
| 118 | is returned from your function, it can contain any combination of the | ||
| 119 | following elements: | ||
| 120 | |||
| 121 | the symbol `continue' | ||
| 122 | Tells regi to continue processing frame-entries after a match, | ||
| 123 | instead of resetting to the first entry and advancing to the next | ||
| 124 | line, as is the default behavior. When returning this symbol, | ||
| 125 | you must take care not to enter an infinite loop. | ||
| 126 | |||
| 127 | the symbol `abort' | ||
| 128 | Tells regi to terminate processing this frame. any end | ||
| 129 | frame-entry is still processed. | ||
| 130 | |||
| 131 | the list `(frame . NEWFRAME)' | ||
| 132 | Tells regi to use NEWFRAME as its current frame. In other words, | ||
| 133 | your FUNC can modify the executing regi frame on the fly. | ||
| 134 | |||
| 135 | the list `(step . STEP)' | ||
| 136 | Tells regi to move STEP number of lines forward during normal | ||
| 137 | processing. By default, regi moves forward 1 line. STEP can be | ||
| 138 | negative, but be careful of infinite loops. | ||
| 139 | |||
| 140 | You should usually take care to explicitly return nil from your | ||
| 141 | function if no action is to take place. Your FUNC will always be | ||
| 142 | `eval'ed. The following variables will be temporarily bound to some | ||
| 143 | useful information: | ||
| 144 | |||
| 145 | `curline' | ||
| 146 | the current line in the buffer, as a string | ||
| 147 | |||
| 148 | `curframe' | ||
| 149 | the full, current frame being executed | ||
| 150 | |||
| 151 | `curentry' | ||
| 152 | the current frame entry being executed." | ||
| 153 | |||
| 154 | (save-excursion | ||
| 155 | (save-restriction | ||
| 156 | (let (begin-tag end-tag every-tag current-frame working-frame donep) | ||
| 157 | |||
| 158 | ;; set up the narrowed region | ||
| 159 | (and start | ||
| 160 | end | ||
| 161 | (let* ((tstart start) | ||
| 162 | (start (min start end)) | ||
| 163 | (end (max start end))) | ||
| 164 | (narrow-to-region | ||
| 165 | (progn (goto-char end) (regi-pos 'bonl)) | ||
| 166 | (progn (goto-char start) (regi-pos 'bol))))) | ||
| 167 | |||
| 168 | ;; lets find the special tags and remove them from the working | ||
| 169 | ;; frame. note that only the last special tag is used. | ||
| 170 | (mapcar | ||
| 171 | (function | ||
| 172 | (lambda (entry) | ||
| 173 | (let ((pred (car entry)) | ||
| 174 | (func (car (cdr entry)))) | ||
| 175 | (cond | ||
| 176 | ((eq pred 'begin) (setq begin-tag func)) | ||
| 177 | ((eq pred 'end) (setq end-tag func)) | ||
| 178 | ((eq pred 'every) (setq every-tag func)) | ||
| 179 | (t | ||
| 180 | (setq working-frame (append working-frame (list entry)))) | ||
| 181 | ) ; end-cond | ||
| 182 | ))) | ||
| 183 | frame) ; end-mapcar | ||
| 184 | |||
| 185 | ;; execute the begin entry | ||
| 186 | (eval begin-tag) | ||
| 187 | |||
| 188 | ;; now process the frame | ||
| 189 | (setq current-frame working-frame) | ||
| 190 | (while (not (or donep (eobp))) | ||
| 191 | (let* ((entry (car current-frame)) | ||
| 192 | (pred (nth 0 entry)) | ||
| 193 | (func (nth 1 entry)) | ||
| 194 | (negate-p (nth 2 entry)) | ||
| 195 | (case-fold-search (nth 3 entry)) | ||
| 196 | match-p) | ||
| 197 | (catch 'regi-throw-top | ||
| 198 | (cond | ||
| 199 | ;; we are finished processing the frame for this line | ||
| 200 | ((not current-frame) | ||
| 201 | (setq current-frame working-frame) ;reset frame | ||
| 202 | (forward-line 1) | ||
| 203 | (throw 'regi-throw-top t)) | ||
| 204 | ;; see if predicate evaluates to a string | ||
| 205 | ((stringp (setq match-p (eval pred))) | ||
| 206 | (setq match-p (looking-at match-p))) | ||
| 207 | ) ; end-cond | ||
| 208 | |||
| 209 | ;; now that we've done the initial matching, check for | ||
| 210 | ;; negation of match | ||
| 211 | (and negate-p | ||
| 212 | (setq match-p (not match-p))) | ||
| 213 | |||
| 214 | ;; if the line matched, package up the argument list and | ||
| 215 | ;; funcall the FUNC | ||
| 216 | (if match-p | ||
| 217 | (let* ((curline (buffer-substring | ||
| 218 | (regi-pos 'bol) | ||
| 219 | (regi-pos 'eol))) | ||
| 220 | (curframe current-frame) | ||
| 221 | (curentry entry) | ||
| 222 | (result (eval func)) | ||
| 223 | (step (or (cdr (assq 'step result)) 1)) | ||
| 224 | ) | ||
| 225 | ;; changing frame on the fly? | ||
| 226 | (if (assq 'frame result) | ||
| 227 | (setq working-frame (cdr (assq 'frame result)))) | ||
| 228 | |||
| 229 | ;; continue processing current frame? | ||
| 230 | (if (memq 'continue result) | ||
| 231 | (setq current-frame (cdr current-frame)) | ||
| 232 | (forward-line step) | ||
| 233 | (setq current-frame working-frame)) | ||
| 234 | |||
| 235 | ;; abort current frame? | ||
| 236 | (if (memq 'abort result) | ||
| 237 | (progn | ||
| 238 | (setq donep t) | ||
| 239 | (throw 'regi-throw-top t))) | ||
| 240 | ) ; end-let | ||
| 241 | |||
| 242 | ;; else if no match occurred, then process the next | ||
| 243 | ;; frame-entry on the current line | ||
| 244 | (setq current-frame (cdr current-frame)) | ||
| 245 | |||
| 246 | ) ; end-if match-p | ||
| 247 | ) ; end catch | ||
| 248 | ) ; end let | ||
| 249 | |||
| 250 | ;; after every cycle, evaluate every-tag | ||
| 251 | (eval every-tag) | ||
| 252 | ) ; end-while | ||
| 253 | |||
| 254 | ;; now process the end entry | ||
| 255 | (eval end-tag))))) | ||
| 256 | |||
| 257 | |||
| 258 | (provide 'regi) | ||
| 259 | ;;; regi.el ends here | ||