mdw@git.distorted.org.uk Git - sod/blob - doc/clang.tex

   1 %%% -*-latex-*-
   2 %%%
   3 %%% C language utilities
   4 %%%
   5 %%% (c) 2015 Straylight/Edgeware
   6 %%%
   7
   8 %%%----- Licensing notice ---------------------------------------------------
   9 %%%
  10 %%% This file is part of the Sensible Object Design, an object system for C.
  11 %%%
  12 %%% SOD is free software; you can redistribute it and/or modify
  13 %%% it under the terms of the GNU General Public License as published by
  14 %%% the Free Software Foundation; either version 2 of the License, or
  15 %%% (at your option) any later version.
  16 %%%
  17 %%% SOD is distributed in the hope that it will be useful,
  18 %%% but WITHOUT ANY WARRANTY; without even the implied warranty of
  19 %%% MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  20 %%% GNU General Public License for more details.
  21 %%%
  22 %%% You should have received a copy of the GNU General Public License
  23 %%% along with SOD; if not, write to the Free Software Foundation,
  24 %%% Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
  25
  26 \chapter{C language utilities} \label{ch:clang}
  27
  28 %%%--------------------------------------------------------------------------
  29 \section{C type representation} \label{sec:clang.c-types}
  30
  31 \subsection{Overview} \label{sec:clang.c-types.over}
  32
  33 The Sod translator represents C types in a fairly simple and direct way.
  34 However, because it spends a fair amount of its time dealing with C types, it
  35 provides a number of useful operations and macros.
  36
  37 The class hierarchy is shown in~\xref{fig:codegen.c-types.classes}.
  38
  39 \begin{figure} \centering
  40   \parbox{10pt}{\begin{tabbing}
  41     @|c-type| \\ \ind
  42       @|qualifiable-c-type| \\ \ind
  43         @|simple-c-type| \\ \ind
  44           @|c-class-type| \- \\
  45         @|tagged-c-type| \\ \ind
  46           @|c-struct-type| \\
  47           @|c-union-type| \\
  48           @|c-enum-type| \- \\
  49         @|c-pointer-type| \- \\
  50       @|c-array-type| \\
  51       @|c-function-type|
  52   \end{tabbing}}
  53   \caption{Classes representing C types}
  54 \label{fig:codegen.c-types.classes}
  55 \end{figure}
  56
  57 C type objects are immutable unless otherwise specified.
  58
  59 \subsubsection{Constructing C type objects}
  60 There is a constructor function for each non-abstract class of C type object.
  61 Note, however, that constructor functions need not generate a fresh type
  62 object if a previously existing type object is suitable.  In this case, we
  63 say that the objects are \emph{interned}.  Some constructor functions are
  64 specified to return interned objects: programs may rely on receiving the same
  65 (@|eq|) type object for similar (possibly merely @|equal|) arguments.  Where
  66 not specified, clients may still not rely on receiving fresh objects.
  67
  68 A convenient S-expression notation is provided by the @|c-type| macro.  Use
  69 of this macro is merely an abbreviation for corresponding use of the various
  70 constructor functions, and therefore interns type objects in the same manner.
  71 The syntax accepted by the macro can be extended in order to support new
  72 classes: see @|defctype|, @|c-type-alias| and @|define-c-type-syntax|.
  73
  74 The descriptions of each of the various classes include descriptions of the
  75 initargs which may be passed to @|make-instance| when constructing a new
  76 instance of the class.  However, the constructor functions and S-expression
  77 syntax are strongly recommended over direct use of @|make-instance|.
  78
  79 \subsubsection{Printing}
  80 There are two protocols for printing C types.  Unfortunately they have
  81 similar names.
  82 \begin{itemize}
  83 \item The @|print-c-type| function prints a C type value using the
  84   S-expression notation.  It is mainly useful for diagnostic purposes.
  85 \item The @|pprint-c-type| function prints a C type as a C-syntax
  86   declaration.
  87 \end{itemize}
  88 Neither generic function defines a default primary method; subclasses of
  89 @|c-type| must define their own methods in order to print correctly.
  90
  91 \subsection{The C type root class} \label{sec:clang.c-types.root}
  92
  93 \begin{describe}{cls}{c-type ()}
  94   The class @|c-type| marks the root of the built-in C type hierarchy.
  95
  96   Users may define subclasses of @|c-type|.  All non-abstract subclasses must
  97   have a primary method defined on @|pprint-c-type|; unless instances of the
  98   subclass are interned, a method on @|c-type-equal-p| is also required.
  99
 100   The class @|c-type| is abstract.
 101 \end{describe}
 102
 103 \subsection{C type S-expression notation} \label{sec:clang.c-types.sexp}
 104
 105 The S-expression representation of a type is described syntactically as a
 106 type specifier.  Type specifiers fit into two syntactic categories.
 107 \begin{itemize}
 108 \item A \emph{symbolic type specifier} consists of a symbol.  It has a
 109   single, fixed meaning: if @<name> is a symbolic type specifier, then each
 110   use of @<name> in a type specifier evaluates to the same (@|eq|) type
 111   object, until the @<name> is redefined.
 112 \item A \emph{type operator} is a symbol; the corresponding specifier is a
 113   list whose @|car| is the operator.  The remaining items in the list are
 114   arguments to the type operator.
 115 \end{itemize}
 116
 117 \begin{describe}{mac}{c-type @<type-spec> @> @<c-type>}
 118   Evaluates to a C type object, as described by the type specifier
 119   @<type-spec>.
 120 \end{describe}
 121
 122 \begin{describe}{mac}
 123     {defctype @{ @<name> @! (@<name> @<nickname>^*) @} @<type-spec>
 124       @> @<names>}
 125   Defines a new symbolic type specifier @<name>; if a list of @<name>s is
 126   given, then all are defined in the same way.  The type constructed by using
 127   any of the @<name>s is as described by the type specifier @<type-spec>.
 128
 129   The resulting type object is constructed once, at the time that the macro
 130   expansion is evaluated; the same (@|eq|) value is used each time any
 131   @<name> is used in a type specifier.
 132 \end{describe}
 133
 134 \begin{describe}{mac}{c-type-alias @<original> @<alias>^* @> @<aliases>}
 135   Defines each @<alias> as being a type operator identical in behaviour to
 136   @<original>.  If @<original> is later redefined then the behaviour of the
 137   @<alias>es changes too.
 138 \end{describe}
 139
 140 \begin{describe}{mac}
 141     {define-c-type-syntax @<name> @<lambda-list> @<form>^* @> @<name>}
 142   Defines the symbol @<name> as a new type operator.  When a list of the form
 143   @|(@<name> @<argument>^*)| is used as a type specifier, the @<argument>s
 144   are bound to fresh variables according to @<lambda-list> (a destructuring
 145   lambda-list) and the @<form>s evaluated in order in the resulting lexical
 146   environment as an implicit @|progn|.  The value should be a Lisp form which
 147   will evaluate to the type specified by the arguments.
 148
 149   The @<form>s may call @|expand-c-type-spec| in order to recursively expand
 150   type specifiers among its arguments.
 151 \end{describe}
 152
 153 \begin{describe}{fun}{expand-c-type-spec @<type-spec> @> @<form>}
 154   Returns the Lisp form that @|(c-type @<type-spec>)| would expand into.
 155 \end{describe}
 156
 157 \begin{describe}{gf}
 158     {print-c-type @<stream> @<type> \&optional @<colon> @<atsign>}
 159   Print the C type object @<type> to @<stream> in S-expression form.  The
 160   @<colon> and @<atsign> arguments may be interpreted in any way which seems
 161   appropriate: they are provided so that @|print-c-type| may be called via
 162   @|format|'s @|\char`\~/\dots/| command; they are not set when
 163   @|print-c-type| is called by Sod functions.
 164
 165   There should be a method defined for every C type class; there is no
 166   default method.
 167 \end{describe}
 168
 169 \subsection{Comparing C types} \label{sec:clang.c-types.cmp}
 170
 171 It is necessary to compare C types for equality, for example when checking
 172 argument lists for methods.  This is done by @|c-type-equal-p|.
 173
 174 \begin{describe}{gf}
 175     {c-type-equal-p @<c-type>_1 @<c-type>_2 @> @<generalized-boolean>}
 176   The generic function @|c-type-equal-p| compares two C types @<c-type>_1 and
 177   @<c-type>_2 for equality; it returns true if the two types are equal and
 178   false if they are not.
 179
 180   Two types are equal if they are structurally similar, where this property
 181   is defined by methods for each individual class; see the descriptions of
 182   the classes for the details.
 183
 184   The generic function @|c-type-equal-p| uses the @|and| method combination.
 185
 186   \begin{describe}{meth}{c-type-equal-p @<c-type>_1 @<c-type>_2}
 187     A default primary method for @|c-type-equal-p| is defined.  It simply
 188     returns @|nil|.  This way, methods can specialize on both arguments
 189     without fear that a call will fail because no methods are applicable.
 190   \end{describe}
 191   \begin{describe}{ar-meth}{c-type-equal-p @<c-type>_1 @<c-type>_2}
 192     A default around-method for @|c-type-equal-p| is defined.  It returns
 193     true if @<c-type>_1 and @<c-type>_2 are @|eql|; otherwise it delegates to
 194     the primary methods.  Since several common kinds of C types are interned,
 195     this is a common case worth optimizing.
 196   \end{describe}
 197 \end{describe}
 198
 199 \subsection{Outputting C types} \label{sec:clang.c-types.output}
 200
 201 \begin{describe}{gf}{pprint-c-type @<c-type> @<stream> @<kernel>}
 202   The generic function @|pprint-c-type| pretty-prints to @<stream> a C-syntax
 203   declaration of an object or function of type @<c-type>.  The result is
 204   written to @<stream>.
 205
 206   A C declaration has two parts: a sequence of \emph{declaration specifiers}
 207   and a \emph{declarator}.  The declarator syntax involves parentheses and
 208   operators, in order to reflect the operators applicable to the declared
 209   variable.  For example, the name of a pointer variable is preceded by @`*';
 210   the name of an array is followed by dimensions enclosed in @`['\dots @`]'.
 211
 212   The @<kernel> argument must be a function designator (though see the
 213   standard around-method); it is invoked as
 214   \begin{quote} \codeface
 215     (funcall @<kernel> @<stream> @<priority> @<spacep>)
 216   \end{quote}
 217   It should write to @<stream> -- which may not be the same stream originally
 218   passed into the generic function -- the `kernel' of the declarator, i.e.,
 219   the part to which prefix and/or postfix operators are attached to form the
 220   full declarator.
 221
 222   The methods on @|pprint-c-type| specialized for compound types work by
 223   recursively calling @|pprint-c-type| on the subtype, passing down a closure
 224   which prints the necessary additional declarator operators before calling
 225   the original @<kernel> function.  The additional arguments @<priority> and
 226   @<spacep> support this implementation technique.
 227
 228   The @<priority> argument describes the surrounding operator context.  It is
 229   zero if no type operators are directly attached to the kernel (i.e., there
 230   are no operators at all, or the kernel is enclosed in parentheses), one if
 231   a prefix operator is directly attached, or two if a postfix operator is
 232   directly attached.  If the @<kernel> function intends to provide its own
 233   additional declarator operators, it should check the @<priority> in order
 234   to determine whether parentheses are necessary.  See also the
 235   @|maybe-in-parens| macro (page~\pageref{mac:maybe-in-parens}).
 236
 237   The @<spacep> argument indicates whether a space needs to be printed in
 238   order to separate the declarator from the declaration specifiers.  A kernel
 239   which contains an identifier should insert a space before the identifier
 240   when @<spacep> is non-nil.  An `empty' kernel, as found in an abstract
 241   declarator (one that specifies no name), looks more pleasing without a
 242   trailing space.  See also the @|c-type-space| function
 243   (page~\pageref{fun:c-type-space}).
 244
 245   Every concrete subclass of @|c-type| is expected to provide a primary
 246   method on this function.  There is no default primary method.
 247
 248   \begin{describe}{ar-meth}{pprint-c-type @<c-type> @<stream> @<kernel>}
 249     A default around method is defined on @|pprint-c-type| which `canonifies'
 250     non-function @<kernel> arguments.  In particular:
 251     \begin{itemize}
 252     \item if @<kernel> is nil, then @|pprint-c-type| is called recursively
 253       with a @<kernel> function that does nothing; and
 254     \item if @<kernel> is any other kind of object, then @|pprint-c-type| is
 255       called recursively with a @<kernel> function that prints the object as
 256       if by @|princ|, preceded if necessary by space using @|c-type-space|.
 257     \end{itemize}
 258   \end{describe}
 259 \end{describe}
 260
 261 \begin{describe}{fun}{c-type-space @<stream>}
 262   Writes a space and other pretty-printing instructions to @<stream> in order
 263   visually to separate a declarator from the preceding declaration
 264   specifiers.  The precise details are subject to change.
 265 \end{describe}
 266
 267 \begin{describe}{mac}
 268     {maybe-in-parens (@<stream-var> @<guard-form>) @<form>^*}
 269   The @<guard-form> is evaluated, and then the @<form>s are evaluated in
 270   sequence within a pretty-printer logical block writing to the stream named
 271   by the symbol @<stream-var>.  If the @<guard-form> evaluates to nil, then
 272   the logical block has empty prefix and suffix strings; if it evaluates to a
 273   non-nil value, then the logical block has prefix and suffix @`(' and @`)'
 274   respectively.
 275
 276   Note that this may cause @<stream-var> to be bound to a different stream
 277   object within the @<form>s.
 278 \end{describe}
 279
 280 \subsection{Type qualifiers and qualifiable types}
 281 \label{sec:clang.ctypes.qual}
 282
 283 \begin{describe}{cls}{qualifiable-c-type (c-type) \&key :qualifiers}
 284   The class @|qualifiable-c-type| describes C types which can bear
 285   `qualifiers' (\Cplusplus\ calls them `cv-qualifiers'): @|const|,
 286   @|restrict| and @|volatile|.
 287
 288   The @<qualifiers> are a list of keyword symbols @|:const|, @|:restrict| and
 289   @|:volatile|.  There is no built-in limitation to these particular
 290   qualifiers; other keywords may be used, though this isn't recommended.
 291
 292   Two qualifiable types are equal only if they have \emph{matching
 293     qualifiers}: i.e., every qualifier attached to one is also attached to
 294   the other: order is not significant, and neither is multiplicity.
 295
 296   The class @|qualifiable-c-type| is abstract.
 297 \end{describe}
 298
 299 \begin{describe}{gf}{c-type-qualifiers @<c-type> @> @<list>}
 300   Returns the qualifiers of the @|qualifiable-c-type| instance @<c-type> as
 301   an immutable list.
 302 \end{describe}
 303
 304 \begin{describe}{fun}{qualify-type @<c-type> @<qualifiers> @> @<c-type>}
 305   The argument @<c-type> must be an instance of @|qualifiable-c-type|,
 306   currently bearing no qualifiers, and @<qualifiers> a list of qualifier
 307   keywords.  The result is a C type object like @<c-type> except that it
 308   bears the given @<qualifiers>.
 309
 310   The @<c-type> is not modified.  If @<c-type> is interned, then the returned
 311   type will be interned.
 312 \end{describe}
 313
 314 \begin{describe}{fun}{format-qualifiers @<qualifiers>}
 315   Returns a string containing the qualifiers listed in @<qualifiers> in C
 316   syntax, with a space after each.  In particular, if @<qualifiers> is
 317   non-null then the final character of the returned string will be a space.
 318 \end{describe}
 319
 320 \subsection{Leaf types} \label{sec:clang.c-types.leaf}
 321
 322 A \emph{leaf type} is a type which is not defined in terms of another type.
 323 In Sod, the leaf types are
 324 \begin{itemize}
 325 \item \emph{simple types}, including builtin types like @|int| and @|char|,
 326   as well as type names introduced by @|typename|, because Sod isn't
 327   interested in what the type name means, merely that it names a type; and
 328 \item \emph{tagged types}, i.e., enum, struct and union types which are named
 329   by a keyword identifying the kind of type, and a \emph{tag}.
 330 \end{itemize}
 331
 332 \begin{describe}{cls}{simple-c-type (qualifiable-c-type)
 333     \&key :qualifiers :name}
 334   The class of `simple types'; an instance denotes the type @<qualifiers>
 335   @<name>.
 336
 337   A simple type object maintains a \emph{name}, which is a string whose
 338   contents are the C name for the type.  The initarg @|:name| may be used to
 339   provide this name when calling @|make-instance|.
 340
 341   Two simple type objects are equal if and only if they have @|string=| names
 342   and matching qualifiers.
 343
 344   A number of symbolic type specifiers for builtin types are predefined as
 345   shown in \xref{tab:codegen.c-types.simple}.  These are all defined as if by
 346   @|define-simple-c-type|, so can be used to construct qualified types.
 347 \end{describe}
 348
 349 \begin{table}
 350   \begin{tabular}[C]{ll}                                           \hlx*{hv}
 351     \thd{C type}        & \thd{Specifiers}                      \\ \hlx{vhv}
 352     @|void|             & @|void|                               \\ \hlx{v}
 353     @|char|             & @|char|                               \\ \hlx{v}
 354     @|unsigned char|    & @|unsigned-char|, @|uchar|            \\ \hlx{}
 355     @|signed char|      & @|signed-char|, @|schar|              \\ \hlx{v}
 356     @|short|            & @|short|, @|signed-short|, @|short-int|,
 357                           @|signed-short-int|, @|sshort|        \\ \hlx{}
 358     @|unsigned short|   & @|unsigned-short|, @|unsigned-short-int|,
 359                           @|ushort|                             \\ \hlx{v}
 360     @|int|              & @|int|, @|signed|, @|signed-int|,
 361                           @|sint|                               \\ \hlx{}
 362     @|unsigned int|     & @|unsigned|, @|unsigned-int|, @|uint| \\ \hlx{v}
 363     @|long|             & @|long|, @|signed-long|, @|long-int|,
 364                           @|signed-long-int|, @|slong|          \\ \hlx{}
 365     @|unsigned long|    & @|unsigned-long|, @|unsigned-long-int|,
 366                           @|ulong|                              \\ \hlx{v}
 367     @|long long|        & @|long-long|, @|signed-long-long|,
 368                           @|long-long-int|,                     \\
 369                         & \qquad @|signed-long-long-int|,
 370                           @|llong|, @|sllong|                   \\ \hlx{v}
 371     @|unsigned long long|
 372                         & @|unsigned-long-long|, @|unsigned-long-long-int|,
 373                           @|ullong|                             \\ \hlx{v}
 374     @|float|            & @|float|                              \\ \hlx{}
 375     @|double|           & @|double|                             \\ \hlx{v}
 376     @|va_list|          & @|va-list|                            \\ \hlx{v}
 377     @|size_t|           & @|size-t|                             \\ \hlx{v}
 378     @|ptrdiff_t|        & @|ptrdiff-t|                          \\ \hlx*{vh}
 379   \end{tabular}
 380   \caption{Builtin symbolic type specifiers for simple C types}
 381   \label{tab:codegen.c-types.simple}
 382 \end{table}
 383
 384 \begin{describe}{fun}
 385     {make-simple-type @<name> \&optional @<qualifiers> @> @<c-type>}
 386   Return the (unique interned) simple C type object for the C type whose name
 387   is @<name> (a string) and which has the given @<qualifiers> (a list of
 388   keywords).
 389 \end{describe}
 390
 391 \begin{describe}{gf}{c-type-name @<c-type> @> @<string>}
 392   Returns the name of a @|simple-c-type| instance @<c-type> as an immutable
 393   string.
 394 \end{describe}
 395
 396 \begin{describe}{mac}
 397     {define-simple-c-type @{ @<name> @! (@<name>^*) @} @<string> @> @<name>}
 398   Define type specifiers for a new simple C type.  Each symbol @<name> is
 399   defined as a symbolic type specifier for the (unique interned) simple C
 400   type whose name is the value of @<string>.  Further, each @<name> is
 401   defined to be a type operator: the type specifier @|(@<name>
 402   @<qualifier>^*)| evaluates to the (unique interned) simple C type whose
 403   name is @<string> and which has the @<qualifier>s (which are evaluated).
 404 \end{describe}
 405
 406 \begin{describe}{cls}{tagged-c-type (qualifiable-c-type)
 407     \&key :qualifiers :tag}
 408   Provides common behaviour for C tagged types.  A @<tag> is a string
 409   containing a C identifier.
 410
 411   Two tagged types are equal if and only if they have the same class, their
 412   @<tag>s are @|string=|, and they have matching qualifiers.  (User-defined
 413   subclasses may have additional methods on @|c-type-equal-p| which impose
 414   further restrictions.)
 415 \end{describe}
 416 \begin{boxy}[Bug]
 417   Sod maintains distinct namespaces for the three kinds of tagged types.  In
 418   C, there is only one namespace for tags which is shared between enums,
 419   structs and unions.
 420 \end{boxy}
 421
 422 \begin{describe}{gf}{c-tagged-type-kind @<c-type> @> @<keyword>}
 423   Returns a keyword classifying the tagged @<c-type>: one of @|:enum|,
 424   @|:struct| or @|:union|.  User-defined subclasses of @|tagged-c-type|
 425   should return their own classification symbols.  It is intended that
 426   @|(string-downcase (c-tagged-type-kind @<c-type>))| be valid C
 427   syntax.\footnote{%
 428     Alas, C doesn't provide a syntactic category for these keywords;
 429     \Cplusplus\ calls them a @<class-key>.} %
 430   There is a method defined for each of the built-in tagged type classes
 431   @|c-struct-type|, @|c-union-type| and @|c-enum-type|.
 432 \end{describe}
 433
 434 \begin{describe}{gf}{kind-c-tagged-type @<keyword> @> @<symbol>}
 435   This is not quite the inverse of @|c-tagged-type-kind|.  Given a keyword
 436   naming a kind of tagged type, return the name of the corresponding C
 437   type class as a symbol.
 438 \end{describe}
 439
 440 \begin{describe}{cls}{c-enum-type (tagged-c-type) \&key :qualifiers :tag}
 441   Represents a C enumerated type.  An instance denotes the C type @|enum|
 442   @<tag>.  See the direct superclass @|tagged-c-type| for details.
 443
 444   The type specifier @|(enum @<tag> @<qualifier>^*)| returns the (unique
 445   interned) enumerated type with the given @<tag> and @<qualifier>s (all
 446   evaluated).
 447 \end{describe}
 448 \begin{describe}{fun}
 449     {make-enum-type @<tag> \&optional @<qualifiers> @> @<c-enum-type>}
 450   Return the (unique interned) C type object for the enumerated C type whose
 451   tag is @<tag> (a string) and which has the given @<qualifiers> (a list of
 452   keywords).
 453 \end{describe}
 454
 455 \begin{describe}{cls}{c-struct-type (tagged-c-type) \&key :qualifiers :tag}
 456   Represents a C structured type.  An instance denotes the C type @|struct|
 457   @<tag>.  See the direct superclass @|tagged-c-type| for details.
 458
 459   The type specifier @|(struct @<tag> @<qualifier>^*)| returns the (unique
 460   interned) structured type with the given @<tag> and @<qualifier>s (all
 461   evaluated).
 462 \end{describe}
 463 \begin{describe}{fun}
 464     {make-struct-type @<tag> \&optional @<qualifiers> @> @<c-struct-type>}
 465   Return the (unique interned) C type object for the structured C type whose
 466   tag is @<tag> (a string) and which has the given @<qualifiers> (a list of
 467   keywords).
 468 \end{describe}
 469
 470 \begin{describe}{cls}{c-union-type (tagged-c-type) \&key :qualifiers :tag}
 471   Represents a C union type.  An instance denotes the C type @|union|
 472   @<tag>.  See the direct superclass @|tagged-c-type|
 473   for details.
 474
 475   The type specifier @|(union @<tag> @<qualifier>^*)| returns the (unique
 476   interned) union type with the given @<tag> and @<qualifier>s (all
 477   evaluated).
 478 \end{describe}
 479 \begin{describe}{fun}
 480     {make-union-type @<tag> \&optional @<qualifiers> @> @<c-union-type>}
 481   Return the (unique interned) C type object for the union C type whose tag
 482   is @<tag> (a string) and which has the given @<qualifiers> (a list of
 483   keywords).
 484 \end{describe}
 485
 486 \subsection{Compound C types} \label{sec:code.c-types.compound}
 487
 488 Some C types are \emph{compound types}: they're defined in terms of existing
 489 types.  The classes which represent compound types implement a common
 490 protocol.
 491
 492 \begin{describe}{gf}{c-type-subtype @<c-type> @> @<subtype>}
 493   Returns the underlying type of a compound type @<c-type>.  Precisely what
 494   this means depends on the class of @<c-type>.
 495 \end{describe}
 496
 497 \subsection{Pointer types} \label{sec:clang.c-types.pointer}
 498
 499 Pointers are compound types.  The subtype of a pointer type is the type it
 500 points to.
 501
 502 \begin{describe}{cls}
 503     {c-pointer-type (qualifiable-c-type) \&key :qualifiers :subtype}
 504   Represents a C pointer type.  An instance denotes the C type @<subtype>
 505   @|*|@<qualifiers>.
 506
 507   The @<subtype> may be any C type.  Two pointer types are equal if and only
 508   if their subtypes are equal and they have matching qualifiers.
 509
 510   The type specifier @|(* @<type-spec> @<qualifier>^*)| returns a type
 511   qualified pointer-to-@<subtype>, where @<subtype> is the type specified by
 512   @<type-spec> and the @<qualifier>s are qualifier keywords (which are
 513   evaluated).  The synonyms @|ptr| and @|pointer| may be used in place of the
 514   star @`*'.
 515
 516   The symbol @|string| is a type specifier for the type pointer to
 517   characters; the symbol @|const-string| is a type specifier for the type
 518   pointer to constant characters.
 519 \end{describe}
 520
 521 \begin{describe}{fun}
 522     {make-pointer-type @<subtype> \&optional @<qualifiers>
 523       @> @<c-pointer-type>}
 524   Return an object describing the type qualified pointer to @<subtype>.
 525   If @<subtype> is interned, then the returned pointer type object is
 526   interned also.
 527 \end{describe}
 528
 529 \subsection{Array types} \label{sec:clang.c-types.array}
 530
 531 Arrays implement the compound-type protocol.  The subtype of an array type is
 532 the array element type.
 533
 534 \begin{describe}{cls}{c-array-type (c-type) \&key :subtype :dimensions}
 535   Represents a multidimensional C array type.  The @<dimensions> are a list
 536   of dimension specifiers $d_0$, $d_1$, \ldots, $d_{n-1}$; an instance then
 537   denotes the C type @<subtype> @|[$d_0$][$d_1$]$\ldots$[$d_{n-1}$]|.  An
 538   individual dimension specifier is either a string containing a C integral
 539   constant expression, or nil which is equivalent to an empty string.  Only
 540   the first (outermost) dimension $d_0$ should be empty.
 541
 542   C doesn't actually have multidimensional arrays as a primitive notion;
 543   rather, it permits an array (with known extent) to be the element type of
 544   an array, which achieves an equivalent effect.  C arrays are stored in
 545   row-major order: i.e., if we write down the indices of the elements of an
 546   array in order of ascending address, the rightmost index varies fastest;
 547   hence, the type constructed is more accurately an array of $d_0$ arrays of
 548   $d_1$ of \ldots\ arrays of $d_{n-1}$ elements of type @<subtype>.  We shall
 549   continue to abuse terminology and refer to multidimensional arrays.
 550
 551   The type specifier @|([] @<type-spec> @<dimension>^*)| constructs a
 552   multidimensional array with the given @<dimension>s whose elements have the
 553   type specified by @<type-spec>.  If no dimensions are given then the result
 554   is a single-dimensional array with unspecified extent.  The synonyms
 555   @|array| and @|vector| may be used in place of the brackets @`[]'.
 556 \end{describe}
 557
 558 \begin{describe}{fun}
 559     {make-array-type @<subtype> @<dimensions> @> @<c-array-type>}
 560   Return an object describing the type of arrays with given @<dimensions> and
 561   with element type @<subtype> (an instance of @|c-type|).  The @<dimensions>
 562   argument is a list whose elements are strings or nil; see the description
 563   of the class @|c-array-type| above for details.
 564 \end{describe}
 565
 566 \begin{describe}{gf}{c-array-dimensions @<c-type> @> @<list>}
 567   Returns the dimensions of @<c-type>, an array type, as an immutable list.
 568 \end{describe}
 569
 570 \subsection{Function types} \label{sec:clang.c-types.fun}
 571
 572 Function types implement the compound-type protocol.  The subtype of a
 573 function type is the type of the function's return value.
 574
 575 \begin{describe}{cls}{argument}
 576   Represents an ordinary function argument.
 577 \end{describe}
 578
 579 \begin{describe}{fun}{argumentp @<value> @> @<generalized-boolean>}
 580   Decide whether @<value> is an @<argument> object: if so, return non-nil; if
 581   not return nil.
 582 \end{describe}
 583
 584 \begin{describe}{fun}{make-argument @<name> @<c-type> @> @<argument>}
 585   Construct and return a new @<argument> object.  The argument has type
 586   @<c-type>, which must be a @|c-type| object, and is named @<name>.
 587
 588   The @<name> may be nil to indicate that the argument has no name: in this
 589   case the argument will be formatted as an abstract declarator, which is not
 590   suitable for function definitions.  If @<name> is not nil, then the
 591   @<name>'s print representation, with @|*print-escape*| nil, is used as the
 592   argument name.
 593 \end{describe}
 594
 595 \begin{describe}{fun}{argument-name @<argument> @> @<name>}
 596   Return the name of the @<argument>, as it was supplied to @|make-argument|.
 597 \end{describe}
 598
 599 \begin{describe}{fun}{argument-type @<argument> @> @<c-type>}
 600   Return the type of the @<argument>, as it was supplied to @|make-argument|.
 601 \end{describe}
 602
 603 \begin{describe}{gf}
 604     {commentify-argument-name @<name> @> @<commentified-name>}
 605   Convert the argument name @<name> so that it's suitable to declare the
 606   function in a header file.
 607
 608   Robust header files shouldn't include literal argument names in
 609   declarations of functions or function types, since this restricts the
 610   including file from defining such names as macros.  This generic function
 611   is used to convert names into a safe form.
 612
 613   \begin{describe}{meth}{commentify-argument-name (@<name> null) @> nil}
 614     Returns nil: if the argument name is already omitted, it's safe for use
 615     in a header file.
 616   \end{describe}
 617   \begin{describe}{meth}{commentify-argument-name (@<name> t) @> @<string>}
 618     Returns the print form of @<name> wrapped in a C comment, as
 619     @`/*@<name>*/'.
 620   \end{describe}
 621 \end{describe}
 622
 623 \begin{describe}{fun}
 624     {commentify-argument-names @<arguments> @> @<commentified-arguments>}
 625   Convert the @<arguments> list so that it's suitable for use in a header
 626   file.
 627
 628   The @<arguments> list should be a list whose items are @|argument| objects
 629   or the keyword @|:ellipsis|.  The return value is a list constructed as
 630   follows.  For each @|argument| object in the input list, there is a
 631   corresponding @|argument| object in the returned list, with the same type,
 632   and whose name is the result of @|commentify-argument-name| applied to the
 633   input argument name; an @|:ellipsis| in the input list is passed through
 634   unchanged.
 635 \end{describe}
 636
 637 \begin{describe}{cls}{c-function-type (c-type) \&key :subtype :arguments}
 638   Represents C function types.  An instance denotes the type of a C
 639   function which accepts the @<arguments> and returns @<subtype>.
 640
 641   The @<arguments> are a possibly empty list.  All but the last element of
 642   the list must be @|argument| objects; the final element may instead be the
 643   keyword @|:ellipsis|, which denotes a variable argument list.
 644
 645   An @<arguments> list consisting of a single argument with type @|void| is
 646   converted into an empty list.  On output as C code, an empty argument list
 647   is written as @|void|.  It is not possible to represent a pre-ANSI C
 648   function without prototypes.
 649
 650   Two function types are considered to be the same if their return types are
 651   the same, and their argument lists consist of arguments with the same type,
 652   in the same order, and either both or neither argument list ends with
 653   @|:ellipsis|; argument names are not compared.
 654
 655   The type specifier @|(fun @<return-type> @{ (@<arg-name> @<arg-type>) @}^*
 656   @[:ellipsis @! . @<form> @])| constructs a function type.  The function has
 657   the subtype @<return-type>.  The remaining items in the type-specifier list
 658   are used to construct the argument list.  The argument items are a possibly
 659   improper list, beginning with zero or more \emph{explicit arguments}:
 660   two-item @<arg-name>/@<arg-type> lists.  For each such list, an @|argument|
 661   object is constructed with the given name (evaluated) and type.  Following
 662   the explicit arguments, there may be
 663   \begin{itemize}
 664   \item nothing, in which case the function's argument list consists only of
 665     the explicit arguments;
 666   \item the keyword @|:ellipsis|, as the final item in the type-specifier
 667     list, indicating a variable argument list may follow the explicit
 668     arguments; or
 669   \item a possibly-improper list tail, beginning with an atom either as a
 670     list item or as the final list cdr, indicating that the entire list tail
 671     is a Lisp expression which is to be evaluated to compute the remaining
 672     arguments.
 673   \end{itemize}
 674   A tail expression may return a list of @|argument| objects, optionally
 675   followed by an @|:ellipsis|.
 676
 677   For example,
 678   \begin{prog}
 679     (c-type (fun \=(lisp (c-type-subtype other-func)) \+ \\
 680                    ("first" int) . (c-function-arguments other-func)))
 681   \end{prog}
 682   evaluates to a function type like @|other-func|, only with an additional
 683   argument of type @|int| added to the front of its argument list.  This
 684   could also have been written
 685   \begin{prog}
 686     (let (\=(args (c-function-arguments other-func)) \+ \\
 687             (ret (c-type-subtype other-func))) \- \\ \ind
 688       (c-type (fun \=(lisp ret) ("first" int) . args)))
 689   \end{prog}
 690 \end{describe}
 691
 692 \begin{describe}{fun}
 693     {make-function-type @<subtype> @<arguments> @> @<c-function-type>}
 694   Construct and return a new function type, returning @<subtype> and
 695   accepting the @<arguments>.
 696 \end{describe}
 697
 698 \begin{describe}{gf}
 699     {c-function-arguments @<c-function-type> @> @<arguments>}
 700   Return the arguments list of the @<c-function-type>.
 701 \end{describe}
 702
 703 \begin{describe}{fun}
 704     {commentify-function-type @<c-function-type> @> @<commentified-c-type>}
 705   Return a commentified version of the @<c-function-type>.
 706
 707   The returned type has the same subtype as the given type, and the argument
 708   list of the returned type is the result of applying
 709   @|commentify-argument-names| to the argument list of the given type.
 710 \end{describe}
 711
 712 \subsection{Parsing C types} \label{sec:clang.c-types.parsing}
 713
 714 %%%--------------------------------------------------------------------------
 715 \section{Generating C code} \label{sec:clang.codegen}
 716
 717 This section deals with Sod's facilities for constructing and manipulating C
 718 expressions, declarations, instructions and definitions.
 719
 720 \subsection{Temporary names} \label{sec:clang.codegen.temporaries}
 721
 722 Many C-level objects, especially ones with external linkage or inclusion in a
 723 header file, are assigned names which are simple strings, perhaps fixed ones,
 724 perhaps constructed.  Other objects don't need meaningful names, and
 725 suitably unique constructed names would be tedious and most likely rather
 726 opaque.  Therefore Sod has an ability to construct \emph{temporary names}.
 727
 728 These aren't temporary in the sense that they name C objects which have
 729 limited lifetimes at runtime.  Rather, the idea is that the names be
 730 significant only to small pieces of Lisp code, which will soon forget about
 731 them.
 732
 733 \subsubsection{The temporary name protocol}
 734 Temporary names are represented by objects which implement a simple protocol.
 735
 736 \begin{describe}{gf}{format-temporary-name @<var> @<stream>}
 737 \end{describe}
 738
 739 \begin{describe*}
 740     {\dhead{gf}{var-in-use-p @<var> @> @<generalized-boolean>}
 741      \dhead[setf var-in-use-p]
 742        {gf}{setf (var-in-use-p @<var>) @<generalized-boolean>}}
 743 \end{describe*}
 744
 745 \subsubsection{Temporary name objects}
 746
 747 \begin{describe}{cls}{temporary-name () \&key :tag}
 748   A temporary name object.  This is the root of a small collection of
 749   subclasses, but is also usable on its own.
 750 \end{describe}
 751
 752 \begin{describe}{meth}
 753     {commentify-argument-name (@<name> temporary-name) @> nil}
 754 \end{describe}
 755
 756 \begin{table}
 757   \begin{tabular}[C]{*2{>{\codeface}l}}                            \hlx*{hv}
 758     \thd{\textbf{Class}} & \thd{\textbf{Name format}}           \\ \hlx{vhv}
 759     temporary-name              & @<tag>                        \\
 760     temporary-argument          & sod__a@<tag>                  \\
 761     temporary-function          & sod__f@<tag>                  \\
 762     temporary-variable          & sod__v@<tag>                  \\ \hlx*{vh}
 763   \end{tabular}
 764   \caption{Temporary name formats}
 765   \label{tab:codegen.codegen.temps-format}
 766 \end{table}
 767
 768 \begin{describe}{cls}{temporary-argument (temporary-name) \&key :tag}
 769 \end{describe}
 770
 771 \begin{describe}{cls}{temporary-function (temporary-name) \&key :tag}
 772 \end{describe}
 773
 774 \begin{describe}{fun}{temporary-function @> @<name>}
 775 \end{describe}
 776
 777 \begin{describe}{cls}
 778     {temporary-variable (temporary-name) \&key :tag :in-use-p}
 779 \end{describe}
 780
 781 \subsubsection{Well-known `temporary' names}
 782
 783 \begin{table}
 784   \begin{tabular}[C]{*2{>{\codeface}l}}                            \hlx*{hv}
 785     \thd{\textbf{Variable}} & \thd{\textbf{Name format}}        \\ \hlx{vhv}
 786     {}*sod-ap*                  & sod__ap                       \\
 787     {}*sod-master-ap*           & sod__master_ap                \\
 788     {}*sod-tmp-ap*              & sod__tmp_ap                   \\ \hlx*{vh}
 789   \end{tabular}
 790   \caption{Well-known temporary names}
 791   \label{tab:codegen.codegen.well-known-temps}
 792 \end{table}
 793
 794 \subsection{Instructions} \label{sec:clang.codegen.insts}
 795
 796 \begin{describe}{cls}{inst () \&key}
 797 \end{describe}
 798
 799 \begin{describe}{gf}{inst-metric @<inst>}
 800 \end{describe}
 801
 802 \begin{describe}{mac}
 803     {definst @<code> (@<streamvar> \&key @<export>) (@<arg>^*)
 804       @<body-form>^*}
 805 \end{describe}
 806
 807 \begin{describe}{mac}
 808     {format-compound-statement (@<stream> @<child> \&optional @<morep>)
 809       @<body-form>^*}
 810 \end{describe}
 811
 812 \begin{table}
 813   \begin{tabular}[C]{ll>{\codeface}l}                              \hlx*{hv}
 814     \thd{Class name} &
 815     \thd{Arguments} &
 816     \thd{Output format}                                         \\ \hlx{vhv}
 817     @|var|      & @<name> @<type> @<init>  & @<type> @<name> @[= @<init>@];
 818                                                                 \\ \hlx{v}
 819     @|set|      & @<var> @<expr>           & @<var> = @<expr>;  \\ \hlx{v}
 820     @|update|   & @<var> @<op> @<expr>     & @<var> @<op>= @<expr>;
 821                                                                 \\ \hlx{v}
 822     @|return|   & @<expr>                  & return @[@<expr>@];
 823                                                                 \\ \hlx{v}
 824     @|break|    & ---                      & break;             \\ \hlx{v}
 825     @|continue| & ---                      & continue;          \\ \hlx{v}
 826     @|expr|     & @<expr>                  & @<expr>;           \\ \hlx{v}
 827     @|call|     & @<func> @<args>          & @<func>(@<arg>_1,
 828                                                      $\ldots$,
 829                                                      @<arg>_n)  \\ \hlx{v}
 830     @|va-start| & @<ap> @<arg>             & va_start(@<ap>, @<arg>);
 831                                                                 \\ \hlx{v}
 832     @|va-copy|  & @<to> @<from>            & va_copy(@<to>, @<from>);
 833                                                                 \\ \hlx{v}
 834     @|va-end|   & @<ap>                    & va_end(@<ap>);     \\ \hlx{vhv}
 835     @|block|    & @<decls> @<body>         & \{ @[@<decls>@] @<body> \}
 836                                                                 \\ \hlx{v}
 837     @|if|       & @<cond> @<conseq> @<alt> & if (@<cond>) @<conseq>
 838                                              @[else @<alt>@]    \\ \hlx{v}
 839     @|while|    & @<cond> @<body>          & while (@<cond>) @<body>
 840                                                                 \\ \hlx{v}
 841     @|do-while| & @<body> @<cond>          & do @<body> while (@<cond>);
 842                                                                 \\ \hlx{v}
 843     @|function| & @<name> @<type> @<body>  &
 844       @<type>_0 @<name>(@<type>_1 @<arg>_1, $\ldots$,
 845                              @<type>_n @<arg>_n @[, \dots@])
 846         @<body>                                                 \\ \hlx*{vh}
 847   \end{tabular}
 848   \caption{Instruction classes}
 849   \label{tab:codegen.codegen.insts}
 850 \end{table}
 851
 852 \subsection{Code generation} \label{sec:clang.codegen.codegen}
 853
 854 \begin{describe}{gf}{codegen-functions @<codegen> @> @<list>}
 855 \end{describe}
 856
 857 \begin{describe}{gf}
 858     {ensure-var @<codegen> @<name> @<type> \&optional @<init>}
 859 \end{describe}
 860
 861 \begin{describe}{gf}{emit-inst @<codegen> @<inst>}
 862 \end{describe}
 863
 864 \begin{describe}{gf}{emit-insts @<codegen> @<insts>}
 865 \end{describe}
 866
 867 \begin{describe}{gf}{emit-decl @<codegen> @<decl>}
 868 \end{describe}
 869
 870 \begin{describe}{gf}{emit-decls @<codegen> @<decls>}
 871 \end{describe}
 872
 873 \begin{describe}{gf}{codegen-push @<codegen>}
 874 \end{describe}
 875
 876 \begin{describe}{gf}{codegen-pop @<codegen> @> @<decls> @<insts>}
 877 \end{describe}
 878
 879 \begin{describe}{gf}{codegen-pop-block @<codegen> @> @<block-inst>}
 880 \end{describe}
 881
 882 \begin{describe}{gf}
 883     {codegen-pop-function @<codegen> @<name> @<type> @> @<name>}
 884 \end{describe}
 885
 886 \begin{describe}{gf}{codegen-add-function @<codegen> @<function>}
 887 \end{describe}
 888
 889 \begin{describe}{fun}
 890     {codegen-build-function @<codegen> @<name> @<type> @<vars> @<insts>
 891       @> @<name>}
 892 \end{describe}
 893
 894 \begin{describe}{gf}{temporary-var @<codegen> @<type> @> @<name>}
 895 \end{describe}
 896
 897 \begin{describe}{mac}
 898     {with-temporary-var (@<codegen> @<var> @<type>) @<body-form>^*
 899       @> @<value>^*}
 900 \end{describe}
 901
 902 \begin{describe}{fun}{deliver-expr @<codegen> @<target> @<expr>}
 903 \end{describe}
 904
 905 \begin{describe}{fun}{convert-stmts @<codegen> @<target> @<type> @<func>}
 906 \end{describe}
 907
 908 \begin{describe}{cls}{codegen () \&key :vars :insts (:temp-index 0)}
 909 \end{describe}
 910
 911 %%%----- That's all, folks --------------------------------------------------
 912
 913 %%% Local variables:
 914 %%% mode: LaTeX
 915 %%% TeX-master: "sod.tex"
 916 %%% TeX-PDF-mode: t
 917 %%% End: