src/: Write `NULL' for a null pointer, rather than plain `0'.
[sod] / src / codegen-proto.lisp
1 ;;; -*-lisp-*-
2 ;;;
3 ;;; Code generation protocol
4 ;;;
5 ;;; (c) 2009 Straylight/Edgeware
6 ;;;
7
8 ;;;----- Licensing notice ---------------------------------------------------
9 ;;;
10 ;;; This file is part of the Sensible Object Design, an object system for C.
11 ;;;
12 ;;; SOD is free software; you can redistribute it and/or modify
13 ;;; it under the terms of the GNU General Public License as published by
14 ;;; the Free Software Foundation; either version 2 of the License, or
15 ;;; (at your option) any later version.
16 ;;;
17 ;;; SOD is distributed in the hope that it will be useful,
18 ;;; but WITHOUT ANY WARRANTY; without even the implied warranty of
19 ;;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
20 ;;; GNU General Public License for more details.
21 ;;;
22 ;;; You should have received a copy of the GNU General Public License
23 ;;; along with SOD; if not, write to the Free Software Foundation,
24 ;;; Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
25
26 (cl:in-package #:sod)
27
28 ;;;--------------------------------------------------------------------------
29 ;;; Temporary names.
30
31 ;; Protocol.
32
(export 'format-temporary-name)
(defgeneric format-temporary-name (var stream)
  (:documentation
   "Print the name of the temporary variable VAR on STREAM."))
37
(export 'var-in-use-p)
(defgeneric var-in-use-p (var)
  (:documentation
   "Return true if VAR is currently in use.  See `with-temporary-var'.")
  (:method (var)
    "Fallback for anything without a more specific method: always in use."
    (declare (ignore var))
    t))
(defgeneric (setf var-in-use-p) (value var)
  (:documentation
   "Set the in-use state of VAR to VALUE.  See `with-temporary-var'."))
49
50 ;; Root class.
51
(export '(temporary-name temp-tag))
(defclass temporary-name ()
  ;; The tag is supplied at construction time with `:tag' and is read back
  ;; with `temp-tag'; there is no writer.
  ((tag :initarg :tag
        :reader temp-tag))
  (:documentation
   "Common superclass for the names of temporary variables and arguments."))
57
58 ;; Important temporary names.
59
;; Only `*sod-ap*' and `*sod-master-ap*' are exported; the two `tmp' names
;; stay internal to the package.
(export '(*sod-ap* *sod-master-ap*))

(defparameter *sod-ap*
  (make-instance 'temporary-name :tag "sod__ap"))

(defparameter *sod-master-ap*
  (make-instance 'temporary-name :tag "sod__master_ap"))

(defparameter *sod-tmp-ap*
  (make-instance 'temporary-name :tag "sod__tmp_ap"))

(defparameter *sod-tmp-val*
  (make-instance 'temporary-name :tag "sod__t"))
69
(export '*null-pointer*)
(defparameter *null-pointer* "NULL"
  "The text used to write a null pointer.")
72
73 ;;;--------------------------------------------------------------------------
74 ;;; Instructions.
75
76 ;; Classes.
77
(export 'inst)
(defclass inst ()
  ()
  (:documentation
   "The root class of all instructions.

   An `instruction' is any object worth handing to a code generator:
   statements and expressions alike are represented as trees of instructions.
   New instruction types are most conveniently introduced with the `definst'
   macro.

   The one protocol that matters for an instruction is output: print it with
   `print-object' while `*print-escape*' is nil.

   The class has no slots and no behaviour of its own; it exists as a marker
   which instruction subclasses inherit from."))
93
(export 'inst-metric)
(defgeneric inst-metric (inst)
  (:documentation
   "Return a `metric': a rough measure of how complicated INST is.

   An arbitrary object has metric 1, and so does nil.  A non-empty list has
   the sum of its elements' metrics.  Classes made by `definst' (q.v.) get a
   generated method returning one plus the sum of their children's metrics.

   The definition is deliberately loose: it is only meant to give code
   generators a cheap basis for choosing between inlining and calling.")
  (:method ((inst t))
    ;; Anything we know nothing about counts as a single node.
    (declare (ignore inst))
    1)
  (:method ((inst null))
    ;; `null' is more specific than `list', so nil lands here and counts 1.
    (declare (ignore inst))
    1)
  (:method ((inst list))
    ;; A list of children: add up the metric of each element.
    (loop for child in inst
          sum (inst-metric child))))
114
115 ;; Instruction definition.
116
(export 'definst)
(defmacro definst (code (streamvar &key export) args &body body)
  "Define an instruction type and describe how to output it.

   An `inst' can represent any structured piece of output syntax: a
   statement, expression or declaration, for example.  This macro defines the
   following things:

     * A class `CODE-inst' to represent the instruction.

     * Instance slots named after the ARGS, with matching keyword initargs,
       and `inst-ARG' readers.  An entry of ARGS which is a list contributes
       its first element as the slot name; a symbol whose name begins with
       `&' (a lambda-list keyword) contributes no slot.

     * A constructor `make-CODE-inst' which accepts the ARGS (as an ordinary
       BVL) as arguments and returns a fresh instance.

     * An `inst-metric' method which returns one plus the sum of the metrics
       of the slot values.

     * A print method, which prints a diagnostic dump if `*print-escape*' is
       set, or invokes the BODY (with STREAMVAR bound to the output stream)
       otherwise.  The BODY is expected to produce target code at this
       point.  The BODY is evaluated within a block named CODE, and can
       refer to the slots by name.

   If EXPORT is non-nil, then export the `CODE-inst' and `make-CODE-inst'
   symbols, and the names of the `inst-ARG' readers.

   The expansion evaluates to the symbol CODE."

  (let* ((inst-var (gensym "INST"))
         (class-name (symbolicate code '-inst))
         (constructor-name (symbolicate 'make- code '-inst))
         ;; Pick the variable names out of the lambda list: a list entry
         ;; names its variable in the car, and `&'-prefixed symbols are
         ;; lambda-list keywords rather than variables.
         (slots (mapcan (lambda (arg)
                          (if (listp arg) (list (car arg))
                              (let ((name (symbol-name arg)))
                                (if (and (plusp (length name))
                                         (char/= (char name 0) #\&))
                                    (list arg)
                                    nil))))
                        args))
         ;; Initargs are keywords with the same names as the slots.
         (keys (mapcar (lambda (arg) (intern (symbol-name arg) :keyword))
                       slots)))
    `(progn
       (defclass ,class-name (inst)
         ,(mapcar (lambda (slot key)
                    `(,slot :initarg ,key
                            :reader ,(symbolicate 'inst- slot)))
                  slots keys))
       (defun ,constructor-name (,@args)
         (make-instance ',class-name ,@(mappend #'list keys slots)))
       (defmethod inst-metric ((,inst-var ,class-name))
         (with-slots (,@slots) ,inst-var
           (+ 1 ,@(mapcar (lambda (slot) `(inst-metric ,slot)) slots))))
       (defmethod print-object ((,inst-var ,class-name) ,streamvar)
         (with-slots (,@slots) ,inst-var
           (if *print-escape*
               (print-unreadable-object (,inst-var ,streamvar :type t)
                 ;; Write to the caller's stream variable.  A literal
                 ;; `stream' here would only work when STREAMVAR happens to
                 ;; be spelled `stream'.
                 (format ,streamvar "~@<~@{~S ~@_~S~^ ~_~}~:>"
                         ,@(mappend #'list keys slots)))
               (block ,code ,@body))))
       ,@(and export `((export '(,class-name ,constructor-name
                                 ,@(mapcar (lambda (slot)
                                             (symbolicate 'inst- slot))
                                           slots)))))
       ',code)))
177
178 ;; Formatting utilities.
179
(defun format-compound-statement* (stream child morep thunk)
  "Underlying function for `format-compound-statement'.

   THUNK is called with STREAM to print the introductory material, and then
   CHILD is printed.  If CHILD is a `block-inst', it follows the introduction
   on the same line, separated by a space.  Otherwise it is printed within a
   logical block, indented by two, after a conditional newline.

   MOREP says whether more material follows the child: nil means nothing
   follows; `:space' asks for a space and a conditional newline after a
   non-block child; any other true value asks for a mandatory newline after
   a non-block child.  After a `block-inst' child, any true MOREP writes a
   single space."
  (cond ((typep child 'block-inst)
         (funcall thunk stream)
         (write-char #\space stream)
         (princ child stream)
         (when morep (write-char #\space stream)))
        (t
         (pprint-logical-block (stream nil)
           (funcall thunk stream)
           (write-char #\space stream)
           (pprint-indent :block 2 stream)
           (pprint-newline :linear stream)
           (princ child stream)
           (pprint-indent :block 0 stream)
           ;; Treat MOREP as a generalized boolean, as the block branch
           ;; above does: only `:space' is special, and every other true
           ;; value (not just the symbol `t') forces a line break.
           (cond ((eq morep :space)
                  (write-char #\space stream)
                  (pprint-newline :linear stream))
                 (morep
                  (pprint-newline :mandatory stream)))))))
201
(export 'format-compound-statement)
(defmacro format-compound-statement
    ((stream child &optional morep) &body body)
  "Write a compound statement to STREAM.

   BODY prints the statement's introductory material; it is wrapped in a
   function of one argument named STREAM and handed, together with STREAM,
   CHILD and MOREP, to `format-compound-statement*'.  The CHILD is laid out
   according to whether it's a `block-inst'.  A true MOREP makes allowance
   for further material following the child."
  (list 'format-compound-statement* stream child morep
        (list* 'lambda (list stream) body)))
212
213 ;; Important instruction classes.
214
215 ;; HACK: Some of the slot names we'd like to use are external symbols in our
216 ;; package or the `common-lisp' package. Use gensyms for these slot names to
217 ;; prevent them from leaking.
218
(definst var (stream :export t) (name #1=#:type &optional init)
  ;; Print the type and NAME together via `pprint-c-type', then the
  ;; initializer (only when one was given), then the closing semicolon.
  (pprint-c-type #1# stream name)
  (unless (null init)
    (format stream " = ~A" init))
  (write-char #\; stream))
224
(definst function (stream :export t) (name #1=#:type body)
  ;; Everything goes inside one logical block: the `static' keyword, the
  ;; type and NAME via `pprint-c-type', and then the BODY, preceded by one
  ;; mandatory newline and followed by two.
  (pprint-logical-block (stream nil)
    (write-string "static " stream)
    (pprint-c-type #1# stream name)
    (format stream "~:@_~A~:@_~:@_" body)))
230
231 ;; Expression statements.
;; `expr': an expression followed by a semicolon.
(definst expr (stream :export t) (#1=#:expr)
  (format stream "~A;" #1#))

;; `set': plain assignment of the expression to VAR.
(definst set (stream :export t) (var #1=#:expr)
  (format stream "~@<~A = ~@_~2I~A;~:>" var #1#))

;; `update': compound assignment; OP is printed immediately before the `='.
(definst update (stream :export t) (var op #1=#:expr)
  (format stream "~@<~A ~A= ~@_~2I~A;~:>" var op #1#))
238
239 ;; Special kinds of expressions.
(definst call (stream :export t) (#1=#:func &rest args)
  ;; The function, then the ARGS in parentheses, separated by commas with a
  ;; conditional newline after each comma.
  (format stream "~A(~@<~{~A~^, ~_~}~:>)" #1# args))
242
243 ;; Simple statements.
;; `return': the parenthesized value is printed only if the expression is
;; non-nil.
(definst return (stream :export t) (#1=#:expr)
  (format stream "return~@[ (~A)~];" #1#))

;; `break' and `continue' have no operands.
(definst break (stream :export t) ()
  (format stream "break;"))

(definst continue (stream :export t) ()
  (format stream "continue;"))
250
251 ;; Compound statements.
252
(definst block (stream :export t) (decls body)
  ;; Braces around an indented logical block.  If DECLS is non-nil, each
  ;; declaration is printed on its own line, followed by one extra newline;
  ;; then the BODY items are printed, separated by newlines.
  (format stream
          "{~:@_~@<  ~2I~@[~{~A~:@_~}~:@_~]~{~A~^~:@_~}~:>~:@_}"
          decls
          body))
256
(definst if (stream :export t) (#1=#:cond conseq &optional alt)
  ;; Print `if (COND)' and the consequent.  The third argument tells
  ;; `format-compound-statement' whether more output follows the child; pass
  ;; a plain `t' or nil rather than the ALT object itself, so that a
  ;; non-block consequent is properly separated from the `else'.
  (format-compound-statement (stream conseq (and alt t))
    (format stream "if (~A)" #1#))
  ;; The `else' part is printed only when an alternative was supplied.
  (when alt
    (format-compound-statement (stream alt)
      (write-string "else" stream))))
263
(definst while (stream :export t) (#1=#:cond body)
  ;; The loop header is the introductory material; BODY is the child, and
  ;; nothing follows it.
  (format-compound-statement (stream body)
    (format stream "while (~A)" #1#)))
267
(definst do-while (stream :export t) (body #1=#:cond)
  ;; `do' introduces the BODY; the `:space' flag asks for a separator after
  ;; the body so that the trailing `while' clause can follow it.
  (format-compound-statement (stream body :space)
    (write-string "do" stream))
  (format stream "while (~A);" #1#))
272
273 ;;;--------------------------------------------------------------------------
274 ;;; Code generation.
275
276 ;; Accessors.
277
(export 'codegen-functions)
(defgeneric codegen-functions (codegen)
  (:documentation
   "Answer CODEGEN's list of completed functions, as `function-inst's."))
282
(export 'ensure-var)
(defgeneric ensure-var (codegen name type &optional init)
  (:documentation
   "Add a variable to the list kept by CODEGEN.

   NAME is the variable's name: it should be comparable using `equal' and
   should print as an identifier.  TYPE is the variable's type.  INIT, if
   present and non-nil, is an expression `inst' giving the variable its
   initial value."))
292
(export '(emit-inst emit-insts))
(defgeneric emit-inst (codegen inst)
  (:documentation
   "Append INST to CODEGEN's list of instructions."))
(defgeneric emit-insts (codegen insts)
  (:documentation
   "Append each of the list INSTS to CODEGEN's list of instructions.")
  (:method (codegen insts)
    ;; Default: hand the instructions to `emit-inst' one at a time, in order.
    (loop for inst in insts
          do (emit-inst codegen inst))))
302
(export '(emit-decl emit-decls))
(defgeneric emit-decl (codegen inst)
  (:documentation
   "Add INST to the end of CODEGEN's list of declarations."))
(defgeneric emit-decls (codegen insts)
  (:documentation
   "Add a list of INSTS to the end of CODEGEN's list of declarations.")
  (:method (codegen insts)
    ;; Default, mirroring `emit-insts': pass the declarations to `emit-decl'
    ;; one at a time, in order.  More specific methods take precedence.
    (dolist (inst insts) (emit-decl codegen inst))))
310
(export 'codegen-push)
(defgeneric codegen-push (codegen)
  (:documentation
   "Save CODEGEN's current code generation state on a stack.

   The state is made up of the variables and instructions accumulated so
   far."))
317
(export 'codegen-pop)
(defgeneric codegen-pop (codegen)
  (:documentation
   "Restore a saved state from CODEGEN's stack.

   The variables and the instructions accumulated since the state was saved
   are returned as two lists, as separate values."))
325
(export 'codegen-add-function)
(defgeneric codegen-add-function (codegen function)
  (:documentation
   "Add FUNCTION to the list of functions kept by CODEGEN.

   No particular type is demanded of FUNCTION: anything will do, so long as
   you're content to find it in the list returned by `codegen-functions'."))
333
(export 'temporary-var)
(defgeneric temporary-var (codegen type)
  (:documentation
   "Answer the name of a temporary variable of the given TYPE.

   The variable is marked in-use when it is handed out.  Once you're done
   with it, you should clear the in-use flag yourself -- or, better, let
   `with-temporary-var' do the cleanup for you."))
343
(export 'codegen-build-function)
(defun codegen-build-function (codegen name type vars insts)
  "Construct a function and add it to the list kept by CODEGEN.

   VARS and INSTS are wrapped up as a `block-inst', which becomes the body of
   a `function-inst' with the given NAME and TYPE.  The value is the NAME."
  (let* ((body (make-block-inst vars insts))
         (function (make-function-inst name type body)))
    (codegen-add-function codegen function)
    name))
353
(export 'codegen-pop-block)
(defgeneric codegen-pop-block (codegen)
  (:documentation
   "Wrap up the completed code in CODEGEN as a block (`block-inst').")
  (:method (codegen)
    ;; Pop the saved state; the two values it returns become the block's
    ;; declarations and body.
    (multiple-value-bind (decls body) (codegen-pop codegen)
      (make-block-inst decls body))))
361
(export 'codegen-pop-function)
(defgeneric codegen-pop-function (codegen name type)
  (:documentation
   "Wrap up the completed code in CODEGEN as a function.

   Any object will do as the NAME.  The TYPE should be a function type object
   which includes argument names.  The NAME is returned.")
  (:method (codegen name type)
    ;; Pop the saved state and let `codegen-build-function' do the rest.
    (multiple-value-bind (decls body) (codegen-pop codegen)
      (codegen-build-function codegen name type decls body))))
372
(export 'with-temporary-var)
(defmacro with-temporary-var ((codegen var type) &body body)
  "Run BODY with VAR bound to the name of a temporary variable of TYPE.

   The variable is obtained from `temporary-var', and so is marked in-use for
   the duration of BODY.  When BODY finishes, whether normally or by a
   non-local exit, the variable is marked as not in use."
  ;; Split leading declarations from the forms, so that the declarations can
  ;; sit directly inside the `let'.
  (multiple-value-bind (doc decls forms) (parse-body body :docp nil)
    (declare (ignore doc))
    `(let ((,var (temporary-var ,codegen ,type)))
       ,@decls
       (unwind-protect
            (progn ,@forms)
         (setf (var-in-use-p ,var) nil)))))
386
387 ;;;--------------------------------------------------------------------------
388 ;;; Code generation idioms.
389
(export 'deliver-expr)
(defun deliver-expr (codegen target expr)
  "Emit code which delivers the value of EXPR to the TARGET.

   The TARGET is one of the following.

     * `:void': discard the value.  The expression is still evaluated.

     * `:void-return': discard the value (as for `:void'), and then force a
       `return' from the current function.

     * `:return': return the value from the current function.

     * A variable name: store the value in that variable.

   For the `:return', `:void' and `:void-return' targets, EXPR may be nil,
   meaning that there is nothing to compute.  A variable-name target must be
   given an expression."

  (flet ((emit (inst) (emit-inst codegen inst)))
    (cond ((eq target :return)
           (emit (make-return-inst expr)))
          ((eq target :void)
           (when expr (emit (make-expr-inst expr))))
          ((eq target :void-return)
           ;; Evaluate for effect if there is anything to evaluate, and then
           ;; return without a value.
           (when expr (emit (make-expr-inst expr)))
           (emit (make-return-inst nil)))
          (t
           ;; Anything else is taken to be a variable name.
           (emit (make-set-inst target expr))))))
419
(export 'convert-stmts)
(defun convert-stmts (codegen target type func)
  "Call FUNC to deliver a value to TARGET, whatever kind of target that is.

   FUNC is a function of one argument, a non-`:return' target; it generates
   statements which deliver a value (see `deliver-expr') of the given TYPE to
   that target.  Typically the code it generates looks like

        setup instructions...
        (deliver-expr CODEGEN TARGET (compute value...))
        cleanup instructions...

   where the generated program cannot work properly without the cleanup
   instructions.

   `convert-stmts' lifts the restriction to non-`:return' targets.  For a
   `:return' target, it invents a temporary variable, has FUNC deliver to
   that, and afterwards delivers the variable to the real target.  For
   `:void-return', it has FUNC deliver to `:void' and then emits a `return'
   with no value.  Any other target is handed to FUNC as it is."

  (cond ((eq target :return)
         (with-temporary-var (codegen var type)
           (funcall func var)
           (deliver-expr codegen target var)))
        ((eq target :void-return)
         (funcall func :void)
         (emit-inst codegen (make-return-inst nil)))
        (t
         (funcall func target))))
448
(export 'deliver-call)
(defun deliver-call (codegen target func &rest args)
  "Emit code which calls FUNC on ARGS and delivers the result to TARGET."
  (let ((call (apply #'make-call-inst func args)))
    (deliver-expr codegen target call)))
453
454 ;;;----- That's all, folks --------------------------------------------------