X-Git-Url: https://git.distorted.org.uk/~mdw/sod/blobdiff_plain/e0808c472145fc81e52898bc9ac289e10c4f4f41..e046c3f65a8f7241889fb9b6005aac21e2aad1a8:/src/lexer-impl.lisp diff --git a/src/lexer-impl.lisp b/src/lexer-impl.lisp index ffc8446..48109b1 100644 --- a/src/lexer-impl.lisp +++ b/src/lexer-impl.lisp @@ -44,7 +44,7 @@ Usable in `format''s ~/.../ command." (declare (ignore colonp atsignp)) - (cond ((null char) (write-string "" stream)) + (cond ((null char) (write-string "" stream)) ((and (graphic-char-p char) (char/= char #\space)) (format stream "`~C'" char)) (t (format stream "<~(~:C~)>" char)))) @@ -59,17 +59,22 @@ (return (values token-types nil consumedp))) (scanner-step scanner))) -(defun parse-error-recover (scanner parser recover) +(defun parse-error-recover (scanner parser recover + &key ignore-unconsumed force-progress) "This is the implementation of the `error' parser." (multiple-value-bind (result win consumedp) (funcall parser) - (cond ((or win (and (not consumedp) (scanner-at-eof-p scanner))) - ;; If we succeeded then there's nothing for us to do here. On the - ;; other hand, if we failed, didn't consume any tokens, and we're - ;; at end-of-file, then there's not much hope of making onward - ;; progress, so in this case we propagate the failure rather than - ;; trying to recover. And we assume that the continuation will - ;; somehow arrange to report the problem, and avoid inundating the - ;; user with error reports. + (cond ((or win + (and (not consumedp) + (or ignore-unconsumed + (scanner-at-eof-p scanner)))) + ;; If we succeeded, or if we didn't consume any tokens and the + ;; caller's OK with that, then there's nothing for us to do here. + ;; On the other hand, if we failed, didn't consume any tokens, and + ;; we're at end-of-file, then there's not much hope of making + ;; onward progress, so in this case we propagate the failure + ;; rather than trying to recover. And we assume that the + ;; continuation will somehow arrange to report the problem, and + ;; avoid inundating the user with error reports. (values result win consumedp)) (t ;; Now we have to do some kind of sensible error recovery. The @@ -80,8 +85,8 @@ ;; current token. Finally, if we are at EOF then our best bet is ;; simply to propagate the current failure back to the caller, but ;; we handled that case above. - (syntax-error scanner result :continuep t) - (unless consumedp (scanner-step scanner)) + (syntax-error scanner result) + (when (and force-progress (not consumedp)) (scanner-step scanner)) (funcall recover))))) ;;;-------------------------------------------------------------------------- @@ -96,7 +101,18 @@ (parse (many (acc init (+ (* acc radix) it) :min min) (label (list :digit radix) (filter (lambda (ch) - (digit-char-p ch radix)))))))) + (digit-char-p ch radix))))))) + (start-floc () + ;; This is a little nasty. We scan the first token during + ;; instance initialization, as a result of `shared-initialize' + ;; on `token-scanner'. Unfortunately, this happens before + ;; we've had a chance to initialize our own `filename' slot. + ;; This means that we can't use the SCANNER as a file + ;; location, however tempting it might be. So we have this + ;; hack. + (make-file-location (scanner-filename char-scanner) + (scanner-line scanner) + (scanner-column scanner)))) ;; Skip initial junk, and remember the place. (loop @@ -105,7 +121,7 @@ (cond-parse (:consumedp cp :expected exp) ((satisfies whitespace-char-p) (parse :whitespace)) ((scan-comment char-scanner)) - (t (if cp (lexer-error char-scanner exp cp) (return))))) + (t (if cp (lexer-error char-scanner exp) (return))))) ;; Now parse something. (cond-parse (:consumedp cp :expected exp) @@ -123,13 +139,23 @@ (progn (write-char it out) out) :final (get-output-stream-string out)) (or (and #\\ :any) (not quote)))) - (nil (char quote))) + (nil (or (char quote) + (seq (:eof) + (lexer-error char-scanner (list quote)) + (info-with-location + (start-floc) "Literal started here"))))) (ecase quote (#\" contents) (#\' (case (length contents) (1 (char contents 0)) - (0 (cerror* "Empty character literal") #\?) - (t (cerror* "Too many characters in literal") + (0 (cerror*-with-location (start-floc) + "Lexical error: ~ + empty character literal") + #\?) + (t (cerror*-with-location (start-floc) + "Lexical error: ~ + too many characters ~ + in literal") (char contents 0)))))) (values (etypecase it (character :char) @@ -164,7 +190,7 @@ ;; must make progress on every call. (t (assert cp) - (lexer-error char-scanner exp cp) + (lexer-error char-scanner exp) (scanner-token scanner))))))) ;;;----- That's all, folks --------------------------------------------------