doc/clang.tex: Missing return type in `format-qualifiers' synopsis.
[sod] / doc / clang.tex
1 %%% -*-latex-*-
2 %%%
3 %%% C language utilities
4 %%%
5 %%% (c) 2015 Straylight/Edgeware
6 %%%
7
8 %%%----- Licensing notice ---------------------------------------------------
9 %%%
10 %%% This file is part of the Sensible Object Design, an object system for C.
11 %%%
12 %%% SOD is free software; you can redistribute it and/or modify
13 %%% it under the terms of the GNU General Public License as published by
14 %%% the Free Software Foundation; either version 2 of the License, or
15 %%% (at your option) any later version.
16 %%%
17 %%% SOD is distributed in the hope that it will be useful,
18 %%% but WITHOUT ANY WARRANTY; without even the implied warranty of
19 %%% MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
20 %%% GNU General Public License for more details.
21 %%%
22 %%% You should have received a copy of the GNU General Public License
23 %%% along with SOD; if not, write to the Free Software Foundation,
24 %%% Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
25
26 \chapter{C language utilities} \label{ch:clang}
27
28 %%%--------------------------------------------------------------------------
29 \section{C type representation} \label{sec:clang.c-types}
30
31 \subsection{Overview} \label{sec:clang.c-types.over}
32
33 The Sod translator represents C types in a fairly simple and direct way.
34 However, because it spends a fair amount of its time dealing with C types, it
35 provides a number of useful operations and macros.
36
37 The class hierarchy is shown in~\xref{fig:codegen.c-types.classes}.
38
39 \begin{figure} \centering
40 \parbox{10pt}{\begin{tabbing}
41 @|c-type| \\ \ind
42 @|qualifiable-c-type| \\ \ind
43 @|simple-c-type| \\ \ind
44 @|c-class-type| \- \\
45 @|tagged-c-type| \\ \ind
46 @|c-struct-type| \\
47 @|c-union-type| \\
48 @|c-enum-type| \- \\
49 @|c-pointer-type| \- \\
50 @|c-array-type| \\
51 @|c-function-type|
52 \end{tabbing}}
53 \caption{Classes representing C types}
54 \label{fig:codegen.c-types.classes}
55 \end{figure}
56
57 C type objects are immutable unless otherwise specified.
58
59 \subsubsection{Constructing C type objects}
60 There is a constructor function for each non-abstract class of C type object.
61 Note, however, that constructor functions need not generate a fresh type
62 object if a previously existing type object is suitable. In this case, we
63 say that the objects are \emph{interned}. Some constructor functions are
64 specified to return interned objects: programs may rely on receiving the same
65 (@|eq|) type object for similar (possibly merely @|equal|) arguments. Where
66 not specified, clients may still not rely on receiving fresh objects.
67
68 A convenient S-expression notation is provided by the @|c-type| macro. Use
69 of this macro is merely an abbreviation for corresponding use of the various
70 constructor functions, and therefore interns type objects in the same manner.
71 The syntax accepted by the macro can be extended in order to support new
72 classes: see @|defctype|, @|c-type-alias| and @|define-c-type-syntax|.
73
74 The descriptions of each of the various classes include descriptions of the
75 initargs which may be passed to @|make-instance| when constructing a new
76 instance of the class. However, the constructor functions and S-expression
77 syntax are strongly recommended over direct use of @|make-instance|.
78
79 \subsubsection{Printing}
80 There are two protocols for printing C types. Unfortunately they have
81 similar names.
82 \begin{itemize}
83 \item The @|print-c-type| function prints a C type value using the
84 S-expression notation. It is mainly useful for diagnostic purposes.
85 \item The @|pprint-c-type| function prints a C type as a C-syntax
86 declaration.
87 \end{itemize}
88 Neither generic function defines a default primary method; subclasses of
89 @|c-type| must define their own methods in order to print correctly.
90
91
92 \subsection{The C type root class} \label{sec:clang.c-types.root}
93
94 \begin{describe}{cls}{c-type ()}
95 The class @|c-type| marks the root of the built-in C type hierarchy.
96
97 Users may define subclasses of @|c-type|. All non-abstract subclasses must
98 have a primary method defined on @|pprint-c-type|; unless instances of the
99 subclass are interned, a method on @|c-type-equal-p| is also required.
100
101 The class @|c-type| is abstract.
102 \end{describe}
103
104
105 \subsection{C type S-expression notation} \label{sec:clang.c-types.sexp}
106
107 The S-expression representation of a type is described syntactically as a
108 type specifier. Type specifiers fit into two syntactic categories.
109 \begin{itemize}
110 \item A \emph{symbolic type specifier} consists of a symbol. It has a
111 single, fixed meaning: if @<name> is a symbolic type specifier, then each
112 use of @<name> in a type specifier evaluates to the same (@|eq|) type
113 object, until the @<name> is redefined.
114 \item A \emph{type operator} is a symbol; the corresponding specifier is a
115 list whose @|car| is the operator. The remaining items in the list are
116 arguments to the type operator.
117 \end{itemize}
118
119 \begin{describe}{mac}{c-type @<type-spec> @> @<c-type>}
120 Evaluates to a C type object, as described by the type specifier
121 @<type-spec>.
122 \end{describe}
123
124 \begin{describe}{mac}
125 {defctype @{ @<name> @! (@<name> @<nickname>^*) @} @<type-spec>
126 @> @<names>}
127 Defines a new symbolic type specifier @<name>; if a list of @<name>s is
128 given, then all are defined in the same way. The type constructed by using
129 any of the @<name>s is as described by the type specifier @<type-spec>.
130
131 The resulting type object is constructed once, at the time that the macro
132 expansion is evaluated; the same (@|eq|) value is used each time any
133 @<name> is used in a type specifier.
134 \end{describe}
135
136 \begin{describe}{mac}{c-type-alias @<original> @<alias>^* @> @<aliases>}
137 Defines each @<alias> as being a type operator identical in behaviour to
138 @<original>. If @<original> is later redefined then the behaviour of the
139 @<alias>es changes too.
140 \end{describe}
141
142 \begin{describe}{mac}
143 {define-c-type-syntax @<name> @<lambda-list> \\ \ind
144 @[[ @<declaration>^* @! @<doc-string> @]] \\
145 @<form>^* \-
146 \nlret @<name>}
147 Defines the symbol @<name> as a new type operator. When a list of the form
148 @|(@<name> @<argument>^*)| is used as a type specifier, the @<argument>s
149 are bound to fresh variables according to @<lambda-list> (a destructuring
150 lambda-list) and the @<form>s evaluated in order in the resulting lexical
151 environment as an implicit @|progn|. The value should be a Lisp form which
152 will evaluate to the type specified by the arguments.
153
154 The @<form>s may call @|expand-c-type-spec| in order to recursively expand
155 type specifiers among its arguments.
156 \end{describe}
157
158 \begin{describe}{fun}{expand-c-type-spec @<type-spec> @> @<form>}
159 Returns the Lisp form that @|(c-type @<type-spec>)| would expand into.
160 \end{describe}
161
162 \begin{describe}{gf}
163 {print-c-type @<stream> @<type> \&optional @<colon> @<atsign>}
164 Print the C type object @<type> to @<stream> in S-expression form. The
165 @<colon> and @<atsign> arguments may be interpreted in any way which seems
166 appropriate: they are provided so that @|print-c-type| may be called via
167 @|format|'s @|\char`\~/\dots/| command; they are not set when
168 @|print-c-type| is called by Sod functions.
169
170 There should be a method defined for every C type class; there is no
171 default method.
172 \end{describe}
173
174
175 \subsection{Comparing C types} \label{sec:clang.c-types.cmp}
176
177 It is necessary to compare C types for equality, for example when checking
178 argument lists for methods. This is done by @|c-type-equal-p|.
179
180 \begin{describe}{gf}
181 {c-type-equal-p @<c-type>_1 @<c-type>_2 @> @<generalized-boolean>}
182 The generic function @|c-type-equal-p| compares two C types @<c-type>_1 and
183 @<c-type>_2 for equality; it returns true if the two types are equal and
184 false if they are not.
185
186 Two types are equal if they are structurally similar, where this property
187 is defined by methods for each individual class; see the descriptions of
188 the classes for the details.
189
190 The generic function @|c-type-equal-p| uses the @|and| method combination.
191
192 \begin{describe}{meth}{c-type-equal-p @<c-type>_1 @<c-type>_2}
193 A default primary method for @|c-type-equal-p| is defined. It simply
194 returns @|nil|. This way, methods can specialize on both arguments
195 without fear that a call will fail because no methods are applicable.
196 \end{describe}
197 \begin{describe}{ar-meth}{c-type-equal-p @<c-type>_1 @<c-type>_2}
198 A default around-method for @|c-type-equal-p| is defined. It returns
199 true if @<c-type>_1 and @<c-type>_2 are @|eql|; otherwise it delegates to
200 the primary methods. Since several common kinds of C types are interned,
201 this is a common case worth optimizing.
202 \end{describe}
203 \end{describe}
204
205
206 \subsection{Outputting C types} \label{sec:clang.c-types.output}
207
208 \begin{describe}{gf}{pprint-c-type @<c-type> @<stream> @<kernel>}
209 The generic function @|pprint-c-type| pretty-prints to @<stream> a C-syntax
210 declaration of an object or function of type @<c-type>. The result is
211 written to @<stream>.
212
213 A C declaration has two parts: a sequence of \emph{declaration specifiers}
214 and a \emph{declarator}. The declarator syntax involves parentheses and
215 operators, in order to reflect the operators applicable to the declared
216 variable. For example, the name of a pointer variable is preceded by @`*';
217 the name of an array is followed by dimensions enclosed in @`['\dots @`]'.
218
219 The @<kernel> argument must be a function designator (though see the
220 standard around-method); it is invoked as
221 \begin{quote} \codeface
222 (funcall @<kernel> @<stream> @<priority> @<spacep>)
223 \end{quote}
224 It should write to @<stream> -- which may not be the same stream originally
225 passed into the generic function -- the `kernel' of the declarator, i.e.,
226 the part to which prefix and/or postfix operators are attached to form the
227 full declarator.
228
229 The methods on @|pprint-c-type| specialized for compound types work by
230 recursively calling @|pprint-c-type| on the subtype, passing down a closure
231 which prints the necessary additional declarator operators before calling
232 the original @<kernel> function. The additional arguments @<priority> and
233 @<spacep> support this implementation technique.
234
235 The @<priority> argument describes the surrounding operator context. It is
236 zero if no type operators are directly attached to the kernel (i.e., there
237 are no operators at all, or the kernel is enclosed in parentheses), one if
238 a prefix operator is directly attached, or two if a postfix operator is
239 directly attached. If the @<kernel> function intends to provide its own
240 additional declarator operators, it should check the @<priority> in order
241 to determine whether parentheses are necessary. See also the
242 @|maybe-in-parens| macro (page~\pageref{mac:maybe-in-parens}).
243
244 The @<spacep> argument indicates whether a space needs to be printed in
245 order to separate the declarator from the declaration specifiers. A kernel
246 which contains an identifier should insert a space before the identifier
247 when @<spacep> is non-nil. An `empty' kernel, as found in an abstract
248 declarator (one that specifies no name), looks more pleasing without a
249 trailing space. See also the @|c-type-space| function
250 (page~\pageref{fun:c-type-space}).
251
252 Every concrete subclass of @|c-type| is expected to provide a primary
253 method on this function. There is no default primary method.
254
255 \begin{describe}{ar-meth}{pprint-c-type @<c-type> @<stream> @<kernel>}
256 A default around method is defined on @|pprint-c-type| which `canonifies'
257 non-function @<kernel> arguments. In particular:
258 \begin{itemize}
259 \item if @<kernel> is nil, then @|pprint-c-type| is called recursively
260 with a @<kernel> function that does nothing; and
261 \item if @<kernel> is any other kind of object, then @|pprint-c-type| is
262 called recursively with a @<kernel> function that prints the object as
263 if by @|princ|, preceded if necessary by space using @|c-type-space|.
264 \end{itemize}
265 \end{describe}
266 \end{describe}
267
268 \begin{describe}{fun}{c-type-space @<stream>}
269 Writes a space and other pretty-printing instructions to @<stream> in order
270 visually to separate a declarator from the preceding declaration
271 specifiers. The precise details are subject to change.
272 \end{describe}
273
274 \begin{describe}{mac}
275 {maybe-in-parens (@<stream-var> @<guard-form>)
276 @<declaration>^*
277 @<form>^*}
278 The @<guard-form> is evaluated, and then the @<form>s are evaluated in
279 sequence within a pretty-printer logical block writing to the stream named
280 by the symbol @<stream-var>. If the @<guard-form> evaluates to nil, then
281 the logical block has empty prefix and suffix strings; if it evaluates to a
282 non-nil value, then the logical block has prefix and suffix @`(' and @`)'
283 respectively.
284
285 Note that this may cause @<stream> to be bound to a different stream object
286 within the @<form>s.
287 \end{describe}
288
289
290 \subsection{Type qualifiers and qualifiable types}
291 \label{sec:clang.ctypes.qual}
292
293 \begin{describe}{cls}{qualifiable-c-type (c-type) \&key :qualifiers}
294 The class @|qualifiable-c-type| describes C types which can bear
295 `qualifiers' (\Cplusplus\ calls them `cv-qualifiers'): @|const|,
296 @|restrict| and @|volatile|.
297
298 The @<qualifiers> are a list of keyword symbols @|:const|, @|:restrict| and
299 @|:volatile|. There is no built-in limitation to these particular
300 qualifiers; others keywords may be used, though this isn't recommended.
301
302 Two qualifiable types are equal only if they have \emph{matching
303 qualifiers}: i.e., every qualifier attached to one is also attached to the
304 other: order is not significant, and neither is multiplicity.
305
306 The class @|qualifiable-c-type| is abstract.
307 \end{describe}
308
309 \begin{describe}{gf}{c-type-qualifiers @<c-type> @> @<list>}
310 Returns the qualifiers of the @|qualifiable-c-type| instance @<c-type> as
311 an immutable list.
312 \end{describe}
313
314 \begin{describe}{fun}{qualify-type @<c-type> @<qualifiers> @> @<c-type>}
315 The argument @<c-type> must be an instance of @|qualifiable-c-type|,
316 currently bearing no qualifiers, and @<qualifiers> a list of qualifier
317 keywords. The result is a C type object like @<c-type> except that it
318 bears the given @<qualifiers>.
319
320 The @<c-type> is not modified. If @<c-type> is interned, then the returned
321 type will be interned.
322 \end{describe}
323
324 \begin{describe}{fun}{format-qualifiers @<qualifiers> @> @<string>}
325 Returns a string containing the qualifiers listed in @<qualifiers> in C
326 syntax, with a space after each. In particular, if @<qualifiers> is
327 non-null then the final character of the returned string will be a space.
328 \end{describe}
329
330
331 \subsection{Leaf types} \label{sec:clang.c-types.leaf}
332
333 A \emph{leaf type} is a type which is not defined in terms of another type.
334 In Sod, the leaf types are
335 \begin{itemize}
336 \item \emph{simple types}, including builtin types like @|int| and @|char|,
337 as well as type names introduced by @|typename|, because Sod isn't
338 interested in what the type name means, merely that it names a type; and
339 \item \emph{tagged types}, i.e., enum, struct and union types which are named
340 by a keyword identifying the kind of type, and a \emph{tag}.
341 \end{itemize}
342
343 \begin{describe}{cls}{simple-c-type (qualifiable-c-type)
344 \&key :qualifiers :name}
345 The class of `simple types'; an instance denotes the type @<qualifiers>
346 @<name>.
347
348 A simple type object maintains a \emph{name}, which is a string whose
349 contents are the C name for the type. The initarg @|:name| may be used to
350 provide this name when calling @|make-instance|.
351
352 Two simple type objects are equal if and only if they have @|string=| names
353 and matching qualifiers.
354
355 A number of symbolic type specifiers for builtin types are predefined as
356 shown in \xref{tab:codegen.c-types.simple}. These are all defined as if by
357 @|define-simple-c-type|, so can be used to construct qualified types.
358 \end{describe}
359
360 \begin{table}
361 \begin{tabular}[C]{ll} \hlx*{hv}
362 \thd{C type} & \thd{Specifiers} \\ \hlx{vhv}
363 @|void| & @|void| \\ \hlx{v}
364 @|_Bool| & @|bool| \\ \hlx{v}
365 @|char| & @|char| \\ \hlx{}
366 @|wchar_t| & @|wchar-t| \\ \hlx{v}
367 @|signed char| & @|signed-char|, @|schar| \\ \hlx{}
368 @|unsigned char| & @|unsigned-char|, @|uchar| \\ \hlx{v}
369 @|short| & @|short|, @|signed-short|, @|short-int|,
370 @|signed-short-int| @|sshort| \\ \hlx{}
371 @|unsigned short| & @|unsigned-short|, @|unsigned-short-int|,
372 @|ushort| \\ \hlx{v}
373 @|int| & @|int|, @|signed|, @|signed-int|,
374 @|sint| \\ \hlx{}
375 @|unsigned int| & @|unsigned|, @|unsigned-int|, @|uint| \\ \hlx{v}
376 @|long| & @|long|, @|signed-long|, @|long-int|,
377 @|signed-long-int|, @|slong| \\ \hlx{}
378 @|unsigned long| & @|unsigned-long|, @|unsigned-long-int|,
379 @|ulong| \\ \hlx{v}
380 @|long long| & @|long-long|, @|signed-long-long|,
381 @|long-long-int|, \\ \hlx{}
382 & \qquad @|signed-long-long-int|,
383 @|llong|, @|sllong| \\ \hlx{v}
384 @|unsigned long long|
385 & @|unsigned-long-long|, @|unsigned-long-long-int|,
386 @|ullong| \\ \hlx{v}
387 @|size_t| & @|size-t| \\ \hlx{}
388 @|ptrdiff_t| & @|ptrdiff-t| \\ \hlx{v}
389 @|float| & @|float| \\ \hlx{}
390 @|double| & @|double| \\ \hlx{}
391 @|long double| & @|long-double| \\ \hlx{v}
392 @|float _Imaginary| & @|float-imaginary| \\ \hlx{}
393 @|double _Imaginary|& @|double-imaginary| \\ \hlx{}
394 @|long double _Imaginary|
395 & @|long-double-imaginary| \\ \hlx{v}
396 @|float _Complex| & @|float-complex| \\ \hlx{}
397 @|double _Complex| & @|double-complex| \\ \hlx{}
398 @|long double _Complex|
399 & @|long-double-complex| \\ \hlx{v}
400 @|va_list| & @|va-list| \\ \hlx*{vh}
401 \end{tabular}
402 \caption{Builtin symbolic type specifiers for simple C types}
403 \label{tab:codegen.c-types.simple}
404 \end{table}
405
406 \begin{describe}{fun}
407 {make-simple-type @<name> \&optional @<qualifiers> @> @<c-type>}
408 Return the (unique interned) simple C type object for the C type whose name
409 is @<name> (a string) and which has the given @<qualifiers> (a list of
410 keywords).
411 \end{describe}
412
413 \begin{describe}{gf}{c-type-name @<c-type> @> @<string>}
414 Returns the name of a @|simple-c-type| instance @<c-type> as an immutable
415 string.
416 \end{describe}
417
418 \begin{describe}{mac}
419 {define-simple-c-type @{ @<name> @! (@<name>^*) @} @<string> @> @<name>}
420 Define type specifiers for a new simple C type. Each symbol @<name> is
421 defined as a symbolic type specifier for the (unique interned) simple C
422 type whose name is the value of @<string>. Further, each @<name> is
423 defined to be a type operator: the type specifier @|(@<name>
424 @<qualifier>^*)| evaluates to the (unique interned) simple C type whose
425 name is @<string> and which has the @<qualifiers> (which are evaluated).
426 \end{describe}
427
428 \begin{describe}{cls}{tagged-c-type (qualifiable-c-type)
429 \&key :qualifiers :tag}
430 Provides common behaviour for C tagged types. A @<tag> is a string
431 containing a C identifier.
432
433 Two tagged types are equal if and only if they have the same class, their
434 @<tag>s are @|string=|, and they have matching qualifiers. (User-defined
435 subclasses may have additional methods on @|c-type-equal-p| which impose
436 further restrictions.)
437 \end{describe}
438 \begin{boxy}[Bug]
439 Sod maintains distinct namespaces for the three kinds of tagged types. In
440 C, there is only one namespace for tags which is shared between enums,
441 structs and unions.
442 \end{boxy}
443
444 \begin{describe}{gf}{c-tagged-type-kind @<c-type> @> @<keyword>}
445 Returns a keyword classifying the tagged @<c-type>: one of @|:enum|,
446 @|:struct| or @|:union|. User-defined subclasses of @|tagged-c-type|
447 should return their own classification symbols. It is intended that
448 @|(string-downcase (c-tagged-type-kind @<c-type>))| be valid C
449 syntax.\footnote{%
450 Alas, C doesn't provide a syntactic category for these keywords;
451 \Cplusplus\ calls them a @<class-key>.} %
452 There is a method defined for each of the built-in tagged type classes
453 @|c-struct-type|, @|c-union-type| and @|c-enum-type|.
454 \end{describe}
455
456 \begin{describe}{gf}{kind-c-tagged-type @<keyword> @> @<symbol>}
457 This is not quite the inverse of @|c-tagged-type-kind|. Given a keyword
458 naming a kind of tagged type, return the name of the corresponding C
459 type class as a symbol.
460 \end{describe}
461
462 \begin{describe}{cls}{c-enum-type (tagged-c-type) \&key :qualifiers :tag}
463 Represents a C enumerated type. An instance denotes the C type @|enum|
464 @<tag>. See the direct superclass @|tagged-c-type| for details.
465
466 The type specifier @|(enum @<tag> @<qualifier>^*)| returns the (unique
467 interned) enumerated type with the given @<tag> and @<qualifier>s (all
468 evaluated).
469 \end{describe}
470 \begin{describe}{fun}
471 {make-enum-type @<tag> \&optional @<qualifiers> @> @<c-enum-type>}
472 Return the (unique interned) C type object for the enumerated C type whose
473 tag is @<tag> (a string) and which has the given @<qualifiers> (a list of
474 keywords).
475 \end{describe}
476
477 \begin{describe}{cls}{c-struct-type (tagged-c-type) \&key :qualifiers :tag}
478 Represents a C structured type. An instance denotes the C type @|struct|
479 @<tag>. See the direct superclass @|tagged-c-type| for details.
480
481 The type specifier @|(struct @<tag> @<qualifier>^*)| returns the (unique
482 interned) structured type with the given @<tag> and @<qualifier>s (all
483 evaluated).
484 \end{describe}
485 \begin{describe}{fun}
486 {make-struct-type @<tag> \&optional @<qualifiers> @> @<c-struct-type>}
487 Return the (unique interned) C type object for the structured C type whose
488 tag is @<tag> (a string) and which has the given @<qualifiers> (a list of
489 keywords).
490 \end{describe}
491
492 \begin{describe}{cls}{c-union-type (tagged-c-type) \&key :qualifiers :tag}
493 Represents a C union type. An instance denotes the C type @|union|
494 @<tag>. See the direct superclass @|tagged-c-type|
495 for details.
496
497 The type specifier @|(union @<tag> @<qualifier>^*)| returns the (unique
498 interned) union type with the given @<tag> and @<qualifier>s (all
499 evaluated).
500 \end{describe}
501 \begin{describe}{fun}
502 {make-union-type @<tag> \&optional @<qualifiers> @> @<c-union-type>}
503 Return the (unique interned) C type object for the union C type whose tag
504 is @<tag> (a string) and which has the given @<qualifiers> (a list of
505 keywords).
506 \end{describe}
507
508
509 \subsection{Compound C types} \label{sec:code.c-types.compound}
510
511 Some C types are \emph{compound types}: they're defined in terms of existing
512 types. The classes which represent compound types implement a common
513 protocol.
514
515 \begin{describe}{gf}{c-type-subtype @<c-type> @> @<subtype>}
516 Returns the underlying type of a compound type @<c-type>. Precisely what
517 this means depends on the class of @<c-type>.
518 \end{describe}
519
520
521 \subsection{Pointer types} \label{sec:clang.c-types.pointer}
522
523 Pointers compound types. The subtype of a pointer type is the type it points
524 to.
525
526 \begin{describe}{cls}
527 {c-pointer-type (qualifiable-c-type) \&key :qualifiers :subtype}
528 Represents a C pointer type. An instance denotes the C type @<subtype>
529 @|*|@<qualifiers>.
530
531 The @<subtype> may be any C type. Two pointer types are equal if and only
532 if their subtypes are equal and they have matching qualifiers.
533
534 The type specifier @|(* @<type-spec> @<qualifier>^*)| returns a type
535 qualified pointer-to-@<subtype>, where @<subtype> is the type specified by
536 @<type-spec> and the @<qualifier>s are qualifier keywords (which are
537 evaluated). The synonyms @|ptr| and @|pointer| may be used in place of the
538 star @`*'.
539
540 The symbol @|string| is a type specifier for the type pointer to
541 characters; the symbol @|const-string| is a type specifier for the type
542 pointer to constant characters.
543 \end{describe}
544
545 \begin{describe}{fun}
546 {make-pointer-type @<c-type> \&optional @<qualifiers>
547 @> @<c-pointer-type>}
548 Return an object describing the type qualified pointer to @<subtype>.
549 If @<subtype> is interned, then the returned pointer type object is
550 interned also.
551 \end{describe}
552
553
554 \subsection{Array types} \label{sec:clang.c-types.array}
555
556 Arrays implement the compound-type protocol. The subtype of an array type is
557 the array element type.
558
559 \begin{describe}{cls}{c-array-type (c-type) \&key :subtype :dimensions}
560 Represents a multidimensional C array type. The @<dimensions> are a list
561 of dimension specifiers $d_0$, $d_1$, \ldots, $d_{n-1}$; an instance then
562 denotes the C type @<subtype> @|[$d_0$][$d_1$]$\ldots$[$d_{n-1}$]|. An
563 individual dimension specifier is either a string containing a C integral
564 constant expression, or nil which is equivalent to an empty string. Only
565 the first (outermost) dimension $d_0$ should be empty.
566
567 C doesn't actually have multidimensional arrays as a primitive notion;
568 rather, it permits an array (with known extent) to be the element type of
569 an array, which achieves an equivalent effect. C arrays are stored in
570 row-major order: i.e., if we write down the indices of the elements of an
571 array in order of ascending address, the rightmost index varies fastest;
572 hence, the type constructed is more accurately an array of $d_0$ arrays of
573 $d_1$ of \ldots\ arrays of $d_{n-1}$ elements of type @<subtype>. We shall
574 continue to abuse terminology and refer to multidimensional arrays.
575
576 The type specifier @|([] @<type-spec> @<dimension>^*)| constructs a
577 multidimensional array with the given @<dimension>s whose elements have the
578 type specified by @<type-spec>. If no dimensions are given then a
579 single-dimensional array with unspecified extent. The synonyms @|array|
580 and @|vector| may be used in place of the brackets @`[]'.
581 \end{describe}
582
583 \begin{describe}{fun}
584 {make-array-type @<subtype> @<dimensions> @> @<c-array-type>}
585 Return an object describing the type of arrays with given @<dimensions> and
586 with element type @<subtype> (an instance of @|c-type|). The @<dimensions>
587 argument is a list whose elements are strings or nil; see the description
588 of the class @|c-array-type| above for details.
589 \end{describe}
590
591 \begin{describe}{gf}{c-array-dimensions @<c-type> @> @<list>}
592 Returns the dimensions of @<c-type>, an array type, as an immutable list.
593 \end{describe}
594
595
596 \subsection{Function types} \label{sec:clang.c-types.fun}
597
598 Function types implement the compound-type protocol. The subtype of a
599 function type is the type of the function's return value.
600
601 \begin{describe}{cls}{argument}
602 Represents an ordinary function argument.
603 \end{describe}
604
605 \begin{describe}{fun}{argumentp @<value> @> @<generalized-boolean>}
606 Decide whether @<value> is an @<argument> object: if so, return non-nil; if
607 not return nil.
608 \end{describe}
609
610 \begin{describe}{fun}{make-argument @<name> @<c-type> @> @<argument>}
611 Construct and a return a new @<argument> object. The argument has type
612 @<c-type>, which must be a @|c-type| object, and is named @<name>.
613
614 The @<name> may be nil to indicate that the argument has no name: in this
615 case the argument will be formatted as an abstract declarator, which is not
616 suitable for function definitions. If @<name> is not nil, then the
617 @<name>'s print representation, with @|*print-escape*| nil, is used as the
618 argument name.
619 \end{describe}
620
621 \begin{describe*}
622 {\dhead{fun}{argument-name @<argument> @> @<name>}
623 \dhead{fun}{argument-type @<argument> @> @<c-type>}}
624 Accessor functions for @|argument| objects. They return the name (for
625 @|argument-name|) or type (for @|argument-type|) from the object, as passed
626 to @|make-argument|.
627 \end{describe*}
628
629 \begin{describe}{gf}
630 {commentify-argument-name @<name> @> @<commentified-name>}
631 Convert the argument name @<name> so that it's suitable to declare the
632 function in a header file.
633
634 Robust header files shouldn't include literal argument names in
635 declarations of functions or function types, since this restricts the
636 including file from defining such names as macros. This generic function
637 is used to convert names into a safe form.
638
639 \begin{describe}{meth}{commentify-argument-name (@<name> null) @> nil}
640 Returns nil: if the argument name is already omitted, it's safe for use
641 in a header file.
642 \end{describe}
643 \begin{describe}{meth}{commentify-argument-name (@<name> t) @> @<string>}
644 Returns the print form of @<name> wrapped in a C comment, as
645 @`/*@<name>*/'.
646 \end{describe}
647 \end{describe}
648
649 \begin{describe}{fun}
650 {commentify-argument-names @<arguments> @> @<commentified-arguments>}
651 Convert the @<arguments> list so that it's suitable for use in a header
652 file.
653
654 The @<arguments> list should be a list whose items are @|argument| objects
655 or the keyword @|:ellipsis|. The return value is a list constructed as
656 follows. For each @|argument| object in the input list, there is a
657 corresponding @|argument| object in the returned list, with the same type,
658 and whose name is the result of @|commentify-argument-name| applied to the
659 input argument name; an @|:ellipsis| in the input list is passed through
660 unchanged.
661 \end{describe}
662
663 \begin{describe}{cls}{c-function-type (c-type) \&key :subtype :arguments}
664 Represents C function types. An instance denotes the type of a C
665 function which accepts the @<arguments> and returns @<subtype>.
666
667 The @<arguments> are a possibly empty list. All but the last element of
668 the list must be @|argument| objects; the final element may instead be the
669 keyword @|:ellipsis|, which denotes a variable argument list.
670
671 An @<arguments> list consisting of a single argument with type @|void| is
672 converted into an empty list. On output as C code, an empty argument list
673 is written as @|void|. It is not possible to represent a pre-ANSI C
674 function without prototypes.
675
676 Two function types are considered to be the same if their return types are
677 the same, and their argument lists consist of arguments with the same type,
678 in the same order, and either both or neither argument list ends with
679 @|:ellipsis|; argument names are not compared.
680
681 The type specifier @|(fun @<return-type> @{ (@<arg-name> @<arg-type>) @}^*
682 @[:ellipsis @! . @<form> @])| constructs a function type. The function has
683 the subtype @<return-type>. The remaining items in the type-specifier list
684 are used to construct the argument list. The argument items are a possibly
685 improper list, beginning with zero or more \emph{explicit arguments}:
686 two-item @<arg-name>/@<arg-type> lists. For each such list, an @|argument|
687 object is constructed with the given name (evaluated) and type. Following
688 the explicit arguments, there may be
689 \begin{itemize}
690 \item nothing, in which case the function's argument list consists only of
691 the explicit arguments;
692 \item the keyword @|:ellipsis|, as the final item in the type-specifier
693 list, indicating a variable argument list may follow the explicit
694 arguments; or
695 \item a possibly-improper list tail, beginning with an atom either as a
696 list item or as the final list cdr, indicating that the entire list tail
697 is Lisp expression which is to be evaluated to compute the remaining
698 arguments.
699 \end{itemize}
700 A tail expression may return a list of @|argument| objects, optionally
701 followed by an @|:ellipsis|.
702
703 For example,
704 \begin{prog}
705 (c-type (fun \=(lisp (c-type-subtype other-func)) \+ \\
706 ("first" int) . (c-function-arguments other-func))
707 \end{prog}
708 evaluates to a function type like @|other-func|, only with an additional
709 argument of type @|int| added to the front of its argument list. This
710 could also have been written
711 \begin{prog}
712 (let (\=(args (c-function-arguments other-func)) \+ \\
713 (ret (c-type-subtype other-func))) \- \\ \ind
714 (c-type (fun \=(lisp ret) ("first" int) . args)
715 \end{prog}
716 \end{describe}
717
718 \begin{describe}{fun}
719 {make-function-type @<subtype> @<arguments> @> @<c-function-type>}
720 Construct and return a new function type, returning @<subtype> and
721 accepting the @<arguments>.
722 \end{describe}
723
724 \begin{describe}{gf}
725 {c-function-arguments @<c-function-type> @> @<arguments>}
726 Return the arguments list of the @<c-function-type>.
727 \end{describe}
728
729 \begin{describe}{fun}
730 {commentify-function-type @<c-function-type> @> @<commentified-c-type>}
731 Return a commentified version of the @<c-function-type>.
732
733 The returned type has the same subtype as the given type, and the argument
734 list of the returned type is the result of applying
735 @|commentify-argument-names| to the argument list of the given type.
736 \end{describe}
737
738
739 \subsection{Parsing C types} \label{sec:clang.c-types.parsing}
740
741 \begin{describe}{fun}
742 {parse-c-type @<scanner>
743 @> @<result> @<success-flag> @<consumed-flag>}
744 \end{describe}
745
746 \begin{describe}{fun}
747 {parse-declarator @<scanner> @<base-type> \&key :kernel :abstractp
748 \nlret @<result> @<success-flag> @<consumed-flag>}
749 \end{describe}
750
751
752 \subsection{Class types} \label{sec:clang.c-types.class}
753
754 \begin{describe}{cls}
755 {c-class-type (simple-c-type) \&key :class :tag :qualifiers :name}
756 \end{describe}
757
758 \begin{describe*}
759 {\dhead{gf}{c-type-class @<class-type> @> @<class>}
760 \dhead{gf}{setf (c-type-class @<class-type>) @<class>}}
761 \end{describe*}
762
763 \begin{describe}{fun}{find-class-type @<name> @> @<class-type-or-nil>}
764 \end{describe}
765
766 \begin{describe}{fun}
767 {make-class-type @<name> \&optional @<qualifiers> @> @<class-type>}
768 \end{describe}
769
770 \begin{describe}{fun}
771 {make-class-type @<name> \&optional @<qualifiers> @> @<class-type>}
772 \end{describe}
773
774 \begin{describe}{fun}{find-sod-class @<name> @> @<class>}
775 \end{describe}
776
777 \begin{describe}{fun}{record-sod-class @<class>}
778 \end{describe}
779
780 %%%--------------------------------------------------------------------------
781 \section{Generating C code} \label{sec:clang.codegen}
782
783 This section deals with Sod's facilities for constructing and manipulating C
784 expressions, declarations, instructions and definitions.
785
786
787 \subsection{Temporary names} \label{sec:clang.codegen.temporaries}
788
789 Many C-level objects, especially ones with external linkage or inclusion in a
790 header file, are assigned names which are simple strings, perhaps fixed ones,
791 perhaps constructed. Other objects don't need meaningful names, and
792 suitably unique constructed names would be tedious and most likely rather
793 opaque. Therefore Sod has an ability to construct \emph{temporary names}.
794
795 These aren't temporary in the sense that they name C objects which have
796 limited lifetimes at runtime. Rather, the idea is that the names be
797 significant only to small pieces of Lisp code, which will soon forget about
798 them.
799
800 \subsubsection{The temporary name protocol}
801 Temporary names are represented by objects which implement a simple protocol.
802
803 \begin{describe}{gf}{format-temporary-name @<var> @<stream>}
804 \end{describe}
805
806 \begin{describe*}
807 {\dhead{gf}{var-in-use-p @<var> @> @<generalized-boolean>}
808 \dhead[setf var-in-use-p]
809 {gf}{setf (var-in-use-p @<var>) @<generalized-boolean>}}
810 \end{describe*}
811
812 \subsubsection{Temporary name objects}
813
814 \begin{describe}{cls}{temporary-name () \&key :tag}
815 A temporary name object. This is the root of a small collection of
816 subclasses, but is also usable on its own.
817 \end{describe}
818
819 \begin{describe}{meth}
820 {commentify-argument-name (@<name> temporary-name) @> nil}
821 \end{describe}
822
823 \begin{table}
824 \begin{tabular}[C]{*2{>{\codeface}l}} \hlx*{hv}
825 \thd{\textbf{Class}} & \thd{\textbf{Name format}} \\ \hlx{vhv}
826 temporary-name & @<tag> \\
827 temporary-argument & sod__a@<tag> \\
828 temporary-function & sod__f@<tag> \\
829 temporary-variable & sod__v@<tag> \\ \hlx*{vh}
830 \end{tabular}
831 \caption{Temporary name formats}
832 \label{tab:codegen.codegen.temps-format}
833 \end{table}
834
835 \begin{describe}{cls}{temporary-argument (temporary-name) \&key :tag}
836 \end{describe}
837
838 \begin{describe}{cls}{temporary-function (temporary-name) \&key :tag}
839 \end{describe}
840
841 \begin{describe}{fun}{temporary-function @> @<name>}
842 \end{describe}
843
844 \begin{describe}{cls}
845 {temporary-variable (temporary-name) \&key :tag :in-use-p}
846 \end{describe}
847
848 \subsubsection{Well-known `temporary' names}
849
850 \begin{table}
851 \begin{tabular}[C]{*2{>{\codeface}l}} \hlx*{hv}
852 \thd{\textbf{Variable}} & \thd{\textbf{Name format}} \\ \hlx{vhv}
853 {}*sod-ap* & sod__ap \\
854 {}*sod-master-ap* & sod__master_ap \\
855 {}*sod-tmp-ap* & sod__tmp_ap \\ \hlx*{vh}
856 \end{tabular}
857 \caption{Well-known temporary names}
858 \label{tab:codegen.codegen.well-known-temps}
859 \end{table}
860
861
862 \subsection{Instructions} \label{sec:clang.codegen.insts}
863
864 \begin{describe}{cls}{inst () \&key}
865 \end{describe}
866
867 \begin{describe}{gf}{inst-metric @<inst>}
868 \end{describe}
869
870 \begin{describe}{mac}
871 {definst @<code> (@<streamvar> \&key @<export>) (@<arg>^*) \\ \ind
872 @[[ @<declaration>^* @! @<doc-string> @]] \\
873 @<form>^* \-
874 \nlret @<code>}
875 \end{describe}
876
877 \begin{describe}{mac}
878 {format-compound-statement
879 (@<stream> @<child> \&optional @<morep>) \\ \ind
880 @<declaration>^* \\
881 @<form>^*}
882 \end{describe}
883
884 \begin{table}
885 \begin{tabular}[C]{ll>{\codeface}l} \hlx*{hv}
886 \thd{Class name} &
887 \thd{Arguments} &
888 \thd{Output format} \\ \hlx{vhv}
889 @|var| & @<name> @<type> @<init> & @<type> @<name> @[= @<init>@];
890 \\ \hlx{v}
891 @|set| & @<var> @<expr> & @<var> = @<expr>; \\ \hlx{v}
892 @|update| & @<var> @<op> @<expr> & @<var> @<op>= @<expr>;
893 \\ \hlx{v}
894 @|return| & @<expr> & return @[@<expr>@];
895 \\ \hlx{v}
896 @|break| & --- & break; \\ \hlx{v}
897 @|continue| & --- & continue; \\ \hlx{v}
898 @|expr| & @<expr> & @<expr>; \\ \hlx{v}
899 @|call| & @<func> @<args> & @<func>(@<arg>_1,
900 $\ldots$,
901 @<arg>_n) \\ \hlx{v}
902 @|va-start| & @<ap> @<arg> & va_start(@<ap>, @<arg>);
903 \\ \hlx{v}
904 @|va-copy| & @<to> @<from> & va_copy(@<to>, @<from>);
905 \\ \hlx{v}
906 @|va-end| & @<ap> & va_end(@<ap>); \\ \hlx{vhv}
907 @|block| & @<decls> @<body> & \{ @[@<decls>@] @<body> \}
908 \\ \hlx{v}
909 @|if| & @<cond> @<conseq> @<alt> & if (@<cond>) @<conseq>
910 @[else @<alt>@] \\ \hlx{v}
911 @|while| & @<cond> @<body> & while (@<cond>) @<body>
912 \\ \hlx{v}
913 @|do-while| & @<body> @<cond> & do @<body> while (@<cond>);
914 \\ \hlx{v}
915 @|function| & @<name> @<type> @<body> &
916 @<type>_0 @<name>(@<type>_1 @<arg>_1, $\ldots$,
917 @<type>_n @<arg>_n @[, \dots@])
918 @<body> \\ \hlx*{vh}
919 \end{tabular}
920 \caption{Instruction classes}
921 \label{tab:codegen.codegen.insts}
922 \end{table}
923
924
925 \subsection{Code generation} \label{sec:clang.codegen.codegen}
926
927 \begin{describe}{gf}{codegen-functions @<codegen> @> @<list>}
928 \end{describe}
929
930 \begin{describe}{gf}
931 {ensure-var @<codegen> @<name> @<type> \&optional @<init>}
932 \end{describe}
933
934 \begin{describe}{gf}{emit-inst @<codegen> @<inst>}
935 \end{describe}
936
937 \begin{describe}{gf}{emit-insts @<codegen> @<insts>}
938 \end{describe}
939
940 \begin{describe}{gf}{emit-decl @<codegen> @<decl>}
941 \end{describe}
942
943 \begin{describe}{gf}{emit-declss @<codegen> @<decls>}
944 \end{describe}
945
946 \begin{describe}{gf}{codegen-push @<codegen>}
947 \end{describe}
948
949 \begin{describe}{gf}{codegen-pop @<codegen> @> @<decls> @<insts>}
950 \end{describe}
951
952 \begin{describe}{gf}{codegen-pop-block @<codegen> @> @<block-inst>}
953 \end{describe}
954
955 \begin{describe}{gf}
956 {codegen-pop-function @<codegen> @<name> @<type> @> @<name>}
957 \end{describe}
958
959 \begin{describe}{gf}{codegen-add-function @<codegen> @<function>}
960 \end{describe}
961
962 \begin{describe}{fun}
963 {codegen-build-function @<codegen> @<name> @<type> @<vars> @<insts>
964 @> @<name>}
965 \end{describe}
966
967 \begin{describe}{gf}{temporary-var @<codegen> @<type> @> @<name>}
968 \end{describe}
969
970 \begin{describe}{mac}
971 {with-temporary-var (@<codegen> @<var> @<type>) \\ \ind
972 @<declaration>^* \\
973 @<form>^* \-
974 \nlret @<value>^*}
975 \end{describe}
976
977 \begin{describe}{fun}{deliver-expr @<codegen> @<target> @<expr>}
978 \end{describe}
979
980 \begin{describe}{fun}{convert-stmts @<codegen> @<target> @<type> @<func>}
981 \end{describe}
982
983 \begin{describe}{cls}{codegen () \&key :vars :insts (:temp-index 0)}
984 \end{describe}
985
986 %%%--------------------------------------------------------------------------
987 \section{Literal C code fragments} \label{sec:clang.fragment}
988
989 \begin{describe}{cls}{c-fragment () \&key :location :text}
990 \end{describe}
991
992 \begin{describe}{gf}{c-fragment-text @<fragment> @> @<string>}
993 \end{describe}
994
995 \begin{describe}{fun}
996 {scan-c-fragment @<scanner> @<end-chars>
997 @> @<result> @<success-flag> @<consumed-flag>}
998 \end{describe}
999
1000 \begin{describe}{fun}
1001 {parse-delimited-fragment @<scanner> @<begin> @<end> \&key :keep-end
1002 \nlret @<result> @<success-flag> @<consumed-flag>}
1003 \end{describe}
1004
1005 %%%----- That's all, folks --------------------------------------------------
1006
1007 %%% Local variables:
1008 %%% mode: LaTeX
1009 %%% TeX-master: "sod.tex"
1010 %%% TeX-PDF-mode: t
1011 %%% End: