Major effort to plug slot-name leaks.
[sod] / src / codegen-proto.lisp
CommitLineData
1f1d88f5
MW
1;;; -*-lisp-*-
2;;;
dea4d055 3;;; Code generation protocol
1f1d88f5
MW
4;;;
5;;; (c) 2009 Straylight/Edgeware
6;;;
7
8;;;----- Licensing notice ---------------------------------------------------
9;;;
dea4d055 10;;; This file is part of the Sensible Object Design, an object system for C.
1f1d88f5
MW
11;;;
12;;; SOD is free software; you can redistribute it and/or modify
13;;; it under the terms of the GNU General Public License as published by
14;;; the Free Software Foundation; either version 2 of the License, or
15;;; (at your option) any later version.
16;;;
17;;; SOD is distributed in the hope that it will be useful,
18;;; but WITHOUT ANY WARRANTY; without even the implied warranty of
19;;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
20;;; GNU General Public License for more details.
21;;;
22;;; You should have received a copy of the GNU General Public License
23;;; along with SOD; if not, write to the Free Software Foundation,
24;;; Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
25
26(cl:in-package #:sod)
27
28;;;--------------------------------------------------------------------------
29;;; Temporary names.
30
dea4d055
MW
31;; Protocol.
32
;; Output protocol for temporary names.
(export 'format-temporary-name)
(defgeneric format-temporary-name (var stream)
  (:documentation
   "Print the name of the temporary variable VAR on STREAM."))
1f1d88f5 37
dea4d055
MW
;; In-use flag protocol: a reader with a catch-all default, and a writer.
(export 'var-in-use-p)
(defgeneric var-in-use-p (var)
  (:documentation
   "Return true if VAR is currently in use.  See `with-temporary-var'.")
  (:method ((var t))
    "Anything which isn't a temporary variable is permanently in use."
    ;; A specialized parameter counts as referenced, so no `ignore'
    ;; declaration is needed here.
    t))
(defgeneric (setf var-in-use-p) (value var)
  (:documentation
   "Set VAR's in-use flag to VALUE.  See `with-temporary-var'."))
1f1d88f5 49
dea4d055 50;; Root class.
1f1d88f5 51
(export '(temporary-name temp-tag))
(defclass temporary-name ()
  (;; The tag supplied via `:tag' at construction; read back with `temp-tag'.
   (tag :initarg :tag
        :reader temp-tag))
  (:documentation
   "Root class for the names of temporary variables and arguments."))
1f1d88f5 57
dea4d055 58;; Important variables.
1f1d88f5
MW
59
(defparameter *temporary-index* 0
  "Counter used when generating temporary names.

   It is reset to zero automatically before the output functions are invoked
   to write a file, so that the same input always produces the same output
   file.")
66
;; Registered via `define-clear-the-decks': put the temporary-name counter
;; back to zero.
(define-clear-the-decks reset-codegen-index
  (setq *temporary-index* 0))
1f1d88f5 69
dea4d055 70;; Important temporary names.
1f1d88f5 71
;; Well-known names: each is a `temporary-name' carrying a fixed tag.  Only
;; the first two are exported.
(export '(*sod-ap* *sod-master-ap*))
(defparameter *sod-ap* (make-instance 'temporary-name :tag "sod__ap"))
(defparameter *sod-master-ap*
  (make-instance 'temporary-name :tag "sod__master_ap"))
(defparameter *sod-tmp-ap* (make-instance 'temporary-name :tag "sod__tmp_ap"))
1f1d88f5
MW
79
80;;;--------------------------------------------------------------------------
81;;; Instructions.
82
dea4d055
MW
83;; Classes.
84
(export 'inst)
(defclass inst ()
  ()
  (:documentation
   "Base class for instructions.

   An `instruction' is anything which might usefully be strung into a code
   generator: statements and expressions alike are represented as trees of
   instructions.  New instruction types are conveniently defined using the
   `definst' macro.

   The only important protocol for instructions is output, which is done by
   calling `print-object' with `*print-escape*' nil.

   The class itself does very little: it serves as a handy marker for
   instruction subclasses."))
100
(export 'inst-metric)
(defgeneric inst-metric (inst)
  (:documentation
   "Return a `metric' describing how complicated INST is.

   By default an inst node has metric 1; `inst' subclasses made by `definst'
   (q.v.) get an automatically generated method which returns one plus the
   sum of the metrics of the node's children.

   This is not meant to be a rigorous definition: it exists so that code
   generators can make simple decisions about whether to inline code or
   call it.")
  ;; Specialized parameters count as referenced, so the methods below need
  ;; no `ignore' declarations.
  (:method ((inst t))
    ;; Anything without a more specific method.
    1)
  (:method ((inst null))
    ;; The empty list; more specific than the `list' method.
    1)
  (:method ((inst list))
    ;; A non-empty list costs the total of its elements.
    (loop for child in inst
          sum (inst-metric child))))
1f1d88f5 121
dea4d055
MW
122;; Instruction definition.
123
(export 'definst)
(defmacro definst (code (streamvar &key export) args &body body)
  "Define an instruction type and describe how to output it.

   An `inst' can represent any structured piece of output syntax: a
   statement, expression or declaration, for example.  This macro defines the
   following things:

     * A class `CODE-inst' to represent the instruction.

     * Instance slots named after the ARGS, with matching keyword initargs,
       and `inst-ARG' readers.

     * A constructor `make-CODE-inst' which accepts the ARGS (in order, not
       with keywords) as arguments and returns a fresh instance.

     * An `inst-metric' method returning one plus the sum of the metrics of
       the slot values.

     * A print method, which prints a diagnostic dump if `*print-escape*' is
       set, or invokes the BODY (with STREAMVAR bound to the output stream,
       and the ARGS bound to the corresponding slots) otherwise.  The BODY
       is expected to produce target code at this point.

   If EXPORT is non-nil, then export the `CODE-inst' and `make-CODE-inst'
   symbols, together with all of the `inst-ARG' reader names.

   The expansion evaluates to the symbol CODE."

  (let* ((inst-var (gensym "INST"))
         (class-name (symbolicate code '-inst))
         (constructor-name (symbolicate 'make- code '-inst))
         ;; ARGS may be uninterned symbols (used to avoid leaking slot
         ;; names), so keywords and reader names are derived from their
         ;; names rather than from the symbols themselves.
         (keys (mapcar (lambda (arg) (intern (symbol-name arg) :keyword))
                       args))
         (readers (mapcar (lambda (arg) (symbolicate 'inst- arg)) args)))
    `(progn
       (defclass ,class-name (inst)
         ,(mapcar (lambda (arg key reader)
                    `(,arg :initarg ,key :reader ,reader))
                  args keys readers))
       (defun ,constructor-name (,@args)
         (make-instance ',class-name ,@(mappend #'list keys args)))
       (defmethod inst-metric ((,inst-var ,class-name))
         (with-slots (,@args) ,inst-var
           (+ 1 ,@(mapcar (lambda (arg) `(inst-metric ,arg)) args))))
       (defmethod print-object ((,inst-var ,class-name) ,streamvar)
         (with-slots (,@args) ,inst-var
           (if *print-escape*
               (print-unreadable-object (,inst-var ,streamvar :type t)
                 ;; Write to the caller's STREAMVAR: a literal `stream'
                 ;; here would only work if the caller happened to choose
                 ;; that name.
                 (format ,streamvar "~@<~@{~S ~@_~S~^ ~_~}~:>"
                         ,@(mappend #'list keys args)))
               (progn ,@body))))
       ,@(and export
              `((export '(,class-name ,constructor-name ,@readers))))
       ',code)))
1f1d88f5 175
dea4d055
MW
176;; Important instruction classes.
177
4b8e5c03
MW
178;; HACK: use a gensym for the `expr' and `type' slots to avoid leaking the
179;; slot names, since the symbol `expr' is exported from our package and
180;; `type' belongs to the `common-lisp' package.
181
;; NOTE(review): this text was recovered from a rendering which may have
;; collapsed runs of whitespace; confirm the spacing inside the format
;; strings below against the repository before relying on it.

;; Variable declaration, with optional initializer.
(definst var (stream :export t) (name #1=#:type init)
  (pprint-c-type #1# stream name)
  (when init
    (format stream " = ~A" init))
  (write-char #\; stream))

;; Plain assignment.
(definst set (stream :export t) (var #1=#:expr)
  (format stream "~@<~A = ~@_~2I~A;~:>" var #1#))

;; Compound assignment: OP is printed immediately before the `='.
(definst update (stream :export t) (var op #1=#:expr)
  (format stream "~@<~A ~A= ~@_~2I~A;~:>" var op #1#))

;; Return statement; the parenthesized value is omitted when it is nil.
(definst return (stream :export t) (#1=#:expr)
  (format stream "return~@[ (~A)~];" #1#))

;; Loop control statements.
(definst break (stream :export t) ()
  (write-string "break;" stream))
(definst continue (stream :export t) ()
  (write-string "continue;" stream))

;; Expression statement.
(definst expr (stream :export t) (#1=#:expr)
  (format stream "~A;" #1#))

;; Braced block: declarations (if any) followed by the body.
(definst block (stream :export t) (decls body)
  (format stream "{~:@_~@< ~2I~@[~{~A~:@_~}~:@_~]~{~A~^~:@_~}~:>~:@_}"
          decls body))

;; Static function definition: the typed name, then the body.
(definst function (stream :export t) (name #1=#:type body)
  (pprint-logical-block (stream nil)
    (princ "static " stream)
    (pprint-c-type #1# stream name)
    (format stream "~:@_~A~:@_~:@_" body)))
207
208;; Formatting utilities.
209
(defun format-compound-statement* (stream child morep thunk)
  "Underlying function for `format-compound-statement'.

   THUNK is called with STREAM to print the introductory material; CHILD is
   then printed after a space.  MOREP says whether further output follows
   the child."
  (if (typep child 'block-inst)
      ;; A block stays on the same line as its introduction.
      (progn
        (funcall thunk stream)
        (write-char #\space stream)
        (princ child stream)
        (when morep (write-char #\space stream)))
      ;; Anything else may be broken onto a following line, indented by two
      ;; columns relative to the introduction.
      (pprint-logical-block (stream nil)
        (funcall thunk stream)
        (write-char #\space stream)
        (pprint-indent :block 2 stream)
        (pprint-newline :linear stream)
        (princ child stream)
        (pprint-indent :block 0 stream)
        (cond ((eq morep :space)
               (write-char #\space stream)
               (pprint-newline :linear stream))
              ((eq morep t)
               (pprint-newline :mandatory stream))))))
231
(export 'format-compound-statement)
(defmacro format-compound-statement
    ((stream child &optional morep) &body body)
  "Format a compound statement to STREAM.

   BODY prints the introductory material; it is wrapped in a function of
   STREAM and handed to `format-compound-statement*'.  The CHILD is then
   formatted appropriately according to whether it is a `block-inst'.  If
   MOREP is true, allowance is made for more material following the child."
  `(format-compound-statement* ,stream ,child ,morep
                               (lambda (,stream)
                                 ,@body)))
242
243;;;--------------------------------------------------------------------------
dea4d055 244;;; Code generation.
1f1d88f5 245
dea4d055 246;; Accessors.
1f1d88f5 247
dea4d055
MW
(export 'codegen-functions)
(defgeneric codegen-functions (codegen)
  (:documentation
   "Return CODEGEN's list of completed functions, as `function-inst's."))
1f1d88f5 252
(export 'ensure-var)
(defgeneric ensure-var (codegen name type &optional init)
  (:documentation
   "Add a variable to CODEGEN's list.

   NAME is the variable's name: it should be comparable using `equal', and
   should print as an identifier.  TYPE is the variable's type.  INIT, if
   present and non-nil, is an expression `inst' which provides the
   variable's initial value."))
1f1d88f5 262
dea4d055
MW
(export '(emit-inst emit-insts))
(defgeneric emit-inst (codegen inst)
  (:documentation
   "Append INST to CODEGEN's list of instructions."))
(defgeneric emit-insts (codegen insts)
  (:documentation
   "Append each of the list INSTS, in order, to CODEGEN's instructions.")
  (:method (codegen insts)
    ;; Default: emit the instructions one at a time.
    (loop for inst in insts
          do (emit-inst codegen inst))))
1f1d88f5 272
3f4ac959
MW
(export '(emit-decl emit-decls))
(defgeneric emit-decl (codegen inst)
  (:documentation
   "Add INST to the end of CODEGEN's list of declarations."))
(defgeneric emit-decls (codegen insts)
  (:documentation
   "Add a list of INSTS to the end of CODEGEN's list of declarations.")
  (:method (codegen insts)
    ;; Default, matching `emit-insts': add the declarations one at a time.
    ;; Methods specialized on a particular CODEGEN class still take
    ;; precedence over this one.
    (dolist (inst insts) (emit-decl codegen inst))))
280
(export 'codegen-push)
(defgeneric codegen-push (codegen)
  (:documentation
   "Push CODEGEN's current code generation state onto a stack.

   The state comprises the variables and instructions accumulated so far."))
1f1d88f5 287
(export 'codegen-pop)
(defgeneric codegen-pop (codegen)
  (:documentation
   "Pop a saved state off CODEGEN's stack.

   Returns two values, both lists: the newly accumulated variables, and the
   newly accumulated instructions."))
1f1d88f5 295
(export 'codegen-add-function)
(defgeneric codegen-add-function (codegen function)
  (:documentation
   "Add FUNCTION to CODEGEN's list of functions.

   No check is made on FUNCTION: it can be any kind of object that you're
   willing to find in the list returned by `codegen-functions'."))
dea4d055
MW
303
(export 'temporary-var)
(defgeneric temporary-var (codegen type)
  (:documentation
   "Return the name of a temporary variable of the given TYPE.

   The variable is returned marked in-use.  Clear the in-use flag explicitly
   once you've finished with the variable -- or, better, use
   `with-temporary-var', which does the cleanup automatically."))
1f1d88f5 313
(export 'codegen-build-function)
(defun codegen-build-function (codegen name type vars insts)
  "Build a function and add it to CODEGEN's list.

   VARS and INSTS are wrapped up as a `block-inst', which becomes the body
   of a `function-inst' with the given NAME and TYPE.  Returns NAME."
  (let* ((body (make-block-inst vars insts))
         (fn (make-function-inst name type body)))
    (codegen-add-function codegen fn)
    name))
323
dea4d055
MW
(export 'codegen-pop-block)
(defgeneric codegen-pop-block (codegen)
  (:documentation
   "Make a block (`block-inst') out of the completed code in CODEGEN.")
  (:method (codegen)
    ;; Default: pop the saved state and wrap its variables and instructions
    ;; up as a block.
    (multiple-value-bind (decls body) (codegen-pop codegen)
      (make-block-inst decls body))))
331
(export 'codegen-pop-function)
(defgeneric codegen-pop-function (codegen name type)
  (:documentation
   "Make a function out of the completed code in CODEGEN.

   NAME may be any object you like; TYPE should be a function type object
   which includes argument names.  Returns NAME.")
  (:method (codegen name type)
    ;; Default: pop the saved state and pass its variables and instructions
    ;; to `codegen-build-function'.
    (multiple-value-bind (decls body) (codegen-pop codegen)
      (codegen-build-function codegen name type decls body))))
342
(export 'with-temporary-var)
(defmacro with-temporary-var ((codegen var type) &body body)
  "Evaluate BODY with VAR bound to the name of a temporary variable.

   The name is obtained by calling `temporary-var' on CODEGEN and TYPE.
   When BODY finishes -- normally or by a non-local exit -- the variable's
   in-use flag is cleared so that it is available for re-use."
  `(let ((,var (temporary-var ,codegen ,type)))
     (unwind-protect
          (progn
            ,@body)
       ;; Cleanup form: always release the variable.
       (setf (var-in-use-p ,var) nil))))
353
354;;;--------------------------------------------------------------------------
355;;; Code generation idioms.
356
(export 'deliver-expr)
(defun deliver-expr (codegen target expr)
  "Emit code to deliver the value of EXPR to the TARGET.

   TARGET may be any of the following.

     * `:void': the value is discarded, but the expression is still
       evaluated.

     * `:void-return': the value is discarded (as for `:void'), and a
       `return' from the current function is forced after computing it.

     * `:return': the value is returned from the current function.

     * A variable name: the value is stored in that variable.

   For `:return', `:void' and `:void-return' targets, EXPR may be nil,
   meaning that no computation needs to be performed.  Variable-name
   targets require an expression."

  (flet ((emit (inst) (emit-inst codegen inst)))
    (cond ((eq target :return)
           (emit (make-return-inst expr)))
          ((eq target :void)
           (when expr (emit (make-expr-inst expr))))
          ((eq target :void-return)
           (when expr (emit (make-expr-inst expr)))
           (emit (make-return-inst nil)))
          (t
           ;; Anything else is taken to be a variable name.
           (emit (make-set-inst target expr))))))
386
(export 'convert-stmts)
(defun convert-stmts (codegen target type func)
  "Invoke FUNC to deliver a value to a non-`:return' target.

   FUNC is a function of one argument, a non-`:return' target; it generates
   statements which deliver a value (see `deliver-expr') of the specified
   TYPE to that target.  In general, the generated code will have the form

     setup instructions...
     (deliver-expr CODEGEN TARGET (compute value...))
     cleanup instructions...

   where the cleanup instructions are essential to the proper working of the
   generated program.

   `convert-stmts' calls FUNC to generate the code, and arranges for the
   value to be delivered correctly to TARGET whatever TARGET is -- i.e., it
   lifts the restriction to non-`:return' targets.  It does this by
   inventing a new temporary variable."

  (cond ((eq target :return)
         ;; Have FUNC store into a temporary, then return the temporary.
         (with-temporary-var (codegen var type)
           (funcall func var)
           (deliver-expr codegen :return var)))
        ((eq target :void-return)
         ;; Have FUNC discard the value, then emit a bare return.
         (funcall func :void)
         (emit-inst codegen (make-return-inst nil)))
        (t
         (funcall func target))))
415
416;;;----- That's all, folks --------------------------------------------------