src/lexer-*.lisp: Add option to `error' to ignore non-consuming failure.
[sod] / src / module-parse.lisp
CommitLineData
bf090e02
MW
1;;; -*-lisp-*-
2;;;
3;;; Top-level parser for module syntax
4;;;
5;;; (c) 2010 Straylight/Edgeware
6;;;
7
8;;;----- Licensing notice ---------------------------------------------------
9;;;
e0808c47 10;;; This file is part of the Sensible Object Design, an object system for C.
bf090e02
MW
11;;;
12;;; SOD is free software; you can redistribute it and/or modify
13;;; it under the terms of the GNU General Public License as published by
14;;; the Free Software Foundation; either version 2 of the License, or
15;;; (at your option) any later version.
16;;;
17;;; SOD is distributed in the hope that it will be useful,
18;;; but WITHOUT ANY WARRANTY; without even the implied warranty of
19;;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
20;;; GNU General Public License for more details.
21;;;
22;;; You should have received a copy of the GNU General Public License
23;;; along with SOD; if not, write to the Free Software Foundation,
24;;; Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
25
26(in-package #:sod)
27
28;;;--------------------------------------------------------------------------
29;;; Toplevel syntax.
30
bf090e02
MW
31;;; Type names.
32
048d0b2d
MW
(define-pluggable-parser module typename (scanner pset)
  ;; typename-item ::= `typename' id ( `,' id )* `;'
  ;;
  ;; Each identifier which isn't already a key in `*module-type-map*' is
  ;; added to the current module as a `type-item'; an identifier which is
  ;; already there is reported through `cerror*' instead.
  (declare (ignore pset))
  (with-parser-context (token-scanner-context :scanner scanner)
    (parse (and "typename"
                (skip-many (:min 1)
                  (seq ((type-name :id))
                    (cond ((gethash type-name *module-type-map*)
                           (cerror* "Type `~A' already defined" type-name))
                          (t
                           (add-to-module *module*
                                          (make-instance 'type-item
                                                         :name type-name)))))
                  #\,)
                #\;))))
47
48;;; Fragments.
49
048d0b2d
MW
(define-pluggable-parser module code (scanner pset)
  ;; code-item ::= `code' id `:' id [constraints] `{' c-fragment `}'
  ;;
  ;; constraints ::= `[' constraint-list `]'
  ;; constraint ::= id+
  ;;
  ;; The two identifiers (the `reason' and the `name') and every identifier
  ;; in the constraints are upcased and interned as keywords.  The result
  ;; is a `code-fragment-item' added to the current module.
  (declare (ignore pset))
  (with-parser-context (token-scanner-context :scanner scanner)
    (flet ((id-as-keyword ()
             ;; Parse one identifier token and answer the keyword whose
             ;; name is the upcased identifier.
             (parse (seq ((ident :id))
                      (intern (string-upcase ident) :keyword)))))
      (parse (seq ("code"
                   (reason (id-as-keyword))
                   #\:
                   (name (id-as-keyword))
                   ;; Optional: a comma-separated list of nonempty
                   ;; keyword lists, enclosed in square brackets.
                   (constraints
                    (? (seq (#\[
                             (clauses (list (:min 1)
                                        (list (:min 1) (id-as-keyword))
                                        #\,))
                             #\])
                         clauses)))
                   (fragment (parse-delimited-fragment scanner #\{ #\})))
               (add-to-module *module*
                              (make-instance 'code-fragment-item
                                             :reason reason
                                             :name name
                                             :constraints constraints
                                             :fragment fragment)))))))
bf090e02
MW
76
77;;; External files.
78
9ec578d9
MW
79(export 'read-module)
(defun read-module (pathname &key (truename nil truep) location)
  "Read the file named by PATHNAME, parse it as a module, and return it.

   This is the main entry point for parsing module files.  PATHNAME is
   first merged against a default file type of `SOD' (in common case).  If
   you already know the file's TRUENAME (e.g., because `probe-file' handed
   it to you) then pass it in and the lookup won't be repeated; otherwise
   it's found using `truename' on the merged pathname.

   The LOCATION is the thing which asked for the module to be imported --
   usually a `file-location' object, though it might be anything other
   than `t' which can be printed in the event of circular imports."

  (let* ((pathname (merge-pathnames pathname
                                    (make-pathname :type "SOD"
                                                   :case :common)))
         (truename (if truep truename (truename pathname))))
    (define-module (pathname :location location :truename truename)
      (with-open-file (input pathname :direction :input)
        ;; Parse with a private copy of the readtable, and stack a token
        ;; scanner on top of a character scanner reading from the file.
        (let* ((*readtable* (copy-readtable))
               (chars (make-instance 'charbuf-scanner :stream input))
               (scanner (make-instance 'sod-token-scanner
                                       :char-scanner chars)))
          (with-default-error-location (scanner)
            (with-parser-context (token-scanner-context :scanner scanner)
              ;; A module is a sequence of items, each one a property set
              ;; followed by whatever the `module' pluggable parsers
              ;; accept; properties nobody looked at are checked after
              ;; each item.
              (parse (skip-many ()
                       (seq ((pset (parse-property-set scanner))
                             (nil (error ()
                                    (plug module scanner pset))))
                         (check-unused-properties pset)))))))))))
108
(define-pluggable-parser module test (scanner pset)
  ;; demo-item ::= `demo' string `;'
  ;;
  ;; Simply prints the string, `~S'-style, on standard output.
  (declare (ignore pset))
  (with-parser-context (token-scanner-context :scanner scanner)
    (parse (seq ("demo" (text :string) #\;)
             (format *standard-output* ";; DEMO ~S~%" text)))))
115
048d0b2d
MW
(define-pluggable-parser module file (scanner pset)
  ;; file-item ::= `import' string `;'
  ;;             | `load' string `;'
  ;;
  ;; In both cases the string is merged against a default file type (`SOD'
  ;; for imports, `LISP' for loads) and handed to `find-file', which is
  ;; given a function to call with the file's pathname and truename.
  (declare (ignore pset))
  (flet ((locate (name type what thunk)
           ;; Hand NAME, defaulted to file type TYPE, to `find-file',
           ;; along with the description WHAT and the function THUNK.
           (find-file scanner
                      (merge-pathnames name
                                       (make-pathname :type type
                                                      :case :common))
                      what
                      thunk))

         (import-module (path true)
           ;; Read the module at PATH; if we get one back, import it and
           ;; note it as a dependency of the current module.  A
           ;; `file-error' is reported through `cerror*'.
           (handler-case
               (let ((module (read-module path :truename true)))
                 (when module
                   (module-import module)
                   (pushnew module (module-dependencies *module*))))
             (file-error (condition)
               (cerror* "Error reading module ~S: ~A" path condition))))

         (load-lisp (path true)
           ;; Quietly `load' the Lisp file whose truename is TRUE; any
           ;; `error' is reported through `cerror*', quoting PATH.
           (handler-case
               (load true :verbose nil :print nil)
             (error (condition)
               (cerror* "Error loading Lisp file ~S: ~A"
                        path condition)))))

    (with-parser-context (token-scanner-context :scanner scanner)
      (parse (or (seq ("import" (name :string) #\;)
                   (locate name "SOD" "module" #'import-module))
                 (seq ("load" (name :string) #\;)
                   (locate name "LISP" "Lisp file" #'load-lisp)))))))
150
151;;; Lisp escape.
152
(define-pluggable-parser module lisp (scanner pset)
  ;; lisp-item ::= `lisp' s-expression `;'
  ;;
  ;; NOTE(review): the form read from the module file is passed straight
  ;; to `eval', so module files must come from a trusted source.
  (declare (ignore pset))
  (flet ((read-escaped-form ()
           ;; A hand-written parser step, returning the usual three values
           ;; (result, success flag, consumed flag).  If the current token
           ;; isn't the identifier `lisp' then fail without consuming
           ;; anything.  Otherwise, read one form using the Lisp reader
           ;; from a stream made over the scanner, and step the scanner
           ;; onwards.
           (unless (and (eql (token-type scanner) :id)
                        (string= (token-value scanner) "lisp"))
             (return-from read-escaped-form
               (values '((:id "lisp")) nil nil)))
           (let ((form (read (make-scanner-stream scanner) t)))
             (scanner-step scanner)
             (values form t t))))
    (with-parser-context (token-scanner-context :scanner scanner)
      (parse (seq ((form (read-escaped-form))
                   #\;)
               (eval form))))))
166
167;;;--------------------------------------------------------------------------
168;;; Class declarations.
169
7f2917d2
MW
170(export 'class-item)
171
(defun parse-class-body (scanner pset name supers)
  ;; class-body ::= `{' class-item* `}'
  ;;
  ;; class-item ::= property-set raw-class-item
  ;;
  ;; Register NAME as a class type, make the class from NAME, the classes
  ;; named by SUPERS, and PSET, and then parse the items between the
  ;; braces.  Once the closing brace has been dealt with, the class is
  ;; finalized and added to the current module.
  (with-parser-context (token-scanner-context :scanner scanner)
    (make-class-type name)
    (let* ((class (make-sod-class name (mapcar #'find-sod-class supers)
                                  pset scanner))
           (class-nick (sod-class-nickname class)))

      (labels ((parse-maybe-dotted-declarator (base-type)
                 ;; Parse a declarator or dotted-declarator, i.e., one
                 ;; whose centre is
                 ;;
                 ;; maybe-dotted-identifier ::= [id `.'] id
                 ;;
                 ;; The centre of a plain declarator comes back as a
                 ;; string; that of a dotted one comes back as a cons of
                 ;; the two identifiers.
                 (parse-declarator
                  scanner base-type
                  :kernel (parser ()
                            (seq ((head :id)
                                  (tail (? (seq (#\. (leaf :id)) leaf))))
                              (cond ((null tail) head)
                                    (t (cons head tail)))))))

               (parse-message-item (sub-pset type name)
                 ;; message-item ::=
                 ;;     declspec+ declarator -!- (method-body | `;')
                 ;;
                 ;; A message which takes a varargs list can't have a
                 ;; method-body here, because there'd be no name for the
                 ;; `va_list' parameter.
                 (let ((message (make-sod-message class name type
                                                  sub-pset scanner)))
                   (cond ((varargs-message-p message)
                          (parse #\;))
                         (t
                          (parse (or #\;
                                     (parse-method-item sub-pset type
                                                        class-nick
                                                        name)))))))

               (parse-method-item (sub-pset type sub-nick name)
                 ;; method-item ::=
                 ;;     declspec+ dotted-declarator -!- method-body
                 ;;
                 ;; method-body ::= `{' c-fragment `}' | `extern' `;'
                 ;;
                 ;; An `extern' method gets a body of `nil'.
                 (parse (seq ((body (or (seq ("extern" #\;) nil)
                                        (parse-delimited-fragment
                                         scanner #\{ #\}))))
                          (make-sod-method class sub-nick name type
                                           body sub-pset scanner))))

               (parse-initializer ()
                 ;; initializer ::= `=' c-fragment
                 ;;               | `=' `{' c-fragment `}'
                 ;;
                 ;; Return (VALUE-KIND . VALUE-FORM), ready for passing to
                 ;; a `sod-initializer' constructor.

                 ;; The awkward part is that both layers of the parsing
                 ;; machinery are involved.  The character scanner has
                 ;; already gone past the lookahead token (which is `=' if
                 ;; there's anything for us to do).
                 (let ((chars (token-scanner-char-scanner scanner)))

                   ;; Move the character scanner over any whitespace.
                   ;; This consumption goes unrecorded, which is a bit
                   ;; naughty, but nobody will actually mind.
                   (loop while (and (not (scanner-at-eof-p chars))
                                    (whitespace-char-p
                                     (scanner-current-char chars)))
                         do (scanner-step chars))

                   ;; Now work out what kind of initializer, if any, we
                   ;; have.
                   (cond ((not (eql (token-type scanner) #\=))
                          ;; No `=', so no initializer: fail without
                          ;; consuming.
                          (values '(#\=) nil nil))

                         ((and (not (scanner-at-eof-p chars))
                               (char= (scanner-current-char chars) #\{))
                          ;; The `=' is followed by a brace: consume the
                          ;; `=' ourselves and read a compound initializer
                          ;; between the braces.
                          (parse (seq (#\=
                                       (text (parse-delimited-fragment
                                              scanner #\{ #\})))
                                   (cons :compound text))))

                         (t
                          ;; No brace: the fragment runs from the `=' up
                          ;; to, but not including, the `,' or `;' which
                          ;; ends it.
                          (parse (seq ((text (parse-delimited-fragment
                                              scanner #\= '(#\; #\,)
                                              :keep-end t)))
                                   (cons :simple text)))))))

               (parse-slot-item (sub-pset base-type type name)
                 ;; slot-item ::=
                 ;;     declspec+ declarator -!- [initializer]
                 ;;     [`,' init-declarator-list] `;'
                 ;;
                 ;; init-declarator-list ::=
                 ;;     declarator [initializer] [`,' init-declarator-list]
                 (flet ((add-slot (slot-name slot-type init)
                          ;; Make the slot and, if INIT isn't nil, an
                          ;; instance initializer for it too.
                          (make-sod-slot class slot-name slot-type
                                         sub-pset scanner)
                          (when init
                            (make-sod-instance-initializer
                             class class-nick slot-name
                             (car init) (cdr init)
                             sub-pset scanner))))
                   (parse (and (seq ((init (? (parse-initializer))))
                                 (add-slot name type init))
                               (skip-many ()
                                 (seq (#\,
                                       (decl (parse-declarator scanner
                                                               base-type))
                                       (init (? (parse-initializer))))
                                   ;; The declarator is (TYPE . NAME).
                                   (add-slot (cdr decl) (car decl) init)))
                               #\;))))

               (parse-initializer-item (sub-pset constructor)
                 ;; initializer-item ::=
                 ;;     [`class'] -!- slot-initializer-list `;'
                 ;;
                 ;; slot-initializer ::= id `.' id initializer
                 ;;
                 ;; CONSTRUCTOR is called once for each slot-initializer.
                 (parse (and (skip-many ()
                               (seq ((slot-nick :id) #\. (slot-name :id)
                                     (init (parse-initializer)))
                                 (funcall constructor class
                                          slot-nick slot-name
                                          (car init) (cdr init)
                                          sub-pset scanner))
                               #\,)
                             #\;)))

               (class-item-dispatch (sub-pset base-type type name)
                 ;; Logically part of `parse-raw-class-item', split out to
                 ;; keep the indentation under control.  We're at
                 ;;
                 ;; raw-class-item ::=
                 ;;     declspec+ (declarator | dotted-declarator) -!- ...
                 ;;   | other-items
                 ;;
                 ;; A function type with a dotted name is a method; with a
                 ;; plain name it's a message.  Anything else is a slot,
                 ;; and a dotted name there is an error: complain and
                 ;; carry on with just the second part of the name.
                 (cond ((typep type 'c-function-type)
                        (if (consp name)
                            (parse-method-item sub-pset type
                                               (car name) (cdr name))
                            (parse-message-item sub-pset type name)))
                       (t
                        (let ((slot-name
                               (cond ((consp name)
                                      (cerror*-with-location
                                       scanner
                                       "Method declarations must have function type.")
                                      (cdr name))
                                     (t name))))
                          (parse-slot-item sub-pset base-type
                                           type slot-name)))))

               (parse-raw-class-item (sub-pset)
                 ;; raw-class-item ::=
                 ;;     message-item
                 ;;   | method-item
                 ;;   | slot-item
                 ;;   | initializer-item
                 ;;
                 ;; The `class-item' pluggable parsers get first refusal.
                 ;; Most of the built-in items start with declspecs and a
                 ;; (possibly dotted) declarator, so parse those here and
                 ;; dispatch on the outcome.
                 (parse (or (plug class-item scanner class sub-pset)
                            (peek
                             (seq ((base (parse-c-type scanner))
                                   (decl (parse-maybe-dotted-declarator
                                          base))
                                   (nil (class-item-dispatch sub-pset
                                                             base
                                                             (car decl)
                                                             (cdr decl))))))
                            (and "class"
                                 (parse-initializer-item
                                  sub-pset
                                  #'make-sod-class-initializer))
                            (parse-initializer-item
                             sub-pset
                             #'make-sod-instance-initializer)))))

        ;; The body proper: an open brace, any number of items each
        ;; preceded by its property set, and a close brace.
        (parse (seq (#\{
                     (nil (skip-many ()
                            (seq ((sub-pset (parse-property-set scanner))
                                  (nil (parse-raw-class-item sub-pset)))
                              (check-unused-properties sub-pset))))
                     (nil (error () #\})))
                 (finalize-sod-class class)
                 (add-to-module *module* class)))))))
370
(define-pluggable-parser module class (scanner pset)
  ;; class-item ::= `class' id [`:' id-list] class-body
  ;;              | `class' id `;'
  ;;
  ;; The second form only registers the name as a class type; the first
  ;; hands the name, the (possibly absent) list of superclass names, and
  ;; the property set on to `parse-class-body'.
  (with-parser-context (token-scanner-context :scanner scanner)
    (parse (seq ("class"
                 (class-id :id)
                 (nil (or (seq (#\;)
                            (make-class-type class-id))
                          (seq ((parents (? (seq (#\:
                                                  (names (list ()
                                                           :id #\,)))
                                              names)))
                                (nil (parse-class-body scanner pset
                                                       class-id
                                                       parents)))))))))))
384
bf090e02 385;;;----- That's all, folks --------------------------------------------------