78087d66d9ad06fb24a71553a9cde73f16bd6e1f
[become] / src / mdwopt.h
1 /* -*-c-*-
2 *
3 * $Id: mdwopt.h,v 1.2 1997/08/04 10:24:24 mdw Exp $
4 *
5 * Options parsing, similar to GNU @getopt_long@
6 *
7 * (c) 1996 Mark Wooding
8 */
9
10 /*----- Licencing notice --------------------------------------------------*
11 *
12 * This file is part of many programs.
13 *
14 * `mdwopt' is free software; you can redistribute it and/or modify
15 * it under the terms of the GNU General Public License as published by
16 * the Free Software Foundation; either version 2 of the License, or
17 * (at your option) any later version.
18 *
19 * `mdwopt' is distributed in the hope that it will be useful,
20 * but WITHOUT ANY WARRANTY; without even the implied warranty of
21 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
22 * GNU General Public License for more details.
23 *
24 * You should have received a copy of the GNU General Public License
25 * along with `mdwopt'; if not, write to the Free Software Foundation,
26 * Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
27 */
28
29 /*----- Revision history --------------------------------------------------*
30 *
31 * $Log: mdwopt.h,v $
32 * Revision 1.2 1997/08/04 10:24:24 mdw
33 * Sources placed under CVS control.
34 *
35 * Revision 1.4 1997/07/29 21:11:49 mdw
36 * Fixed address of the FSF.
37 *
38 * Revision 1.3 1996/12/31 19:41:33 mdw
39 * Formatting changes.
40 *
41 * Revision 1.2 1996/11/23 00:47:25 mdw
42 * Added `MdwOpt' object from the `anagram' source code.
43 *
44 * Revision 1.1 1996/09/24 18:01:43 mdw
45 * Initial revision
46 *
47 */
48
49 #ifndef MDWOPT_H
50 #define MDWOPT_H
51
52 /*----- Options handling structures ---------------------------------------*/
53
54 #ifdef __cplusplus
55 extern "C" {
56 #endif
57
58 /* --- @mdwopt_data@ --- *
59 *
60 * Contains all the information needed by the @mdwopt@ routine to do its
61 * work.
62 */
63
64 typedef struct {
65 /* --- Public variables --- */
66
67 char *arg; /* Arg of current option, or 0 */
68 int opt; /* Value of current option */
69 int ind; /* 0 for init, index when done */
70 int err; /* Set nonzero for error messages */
71 char *prog; /* Program name (from @argv[0]@) */
72
73 /* --- Private variables --- *
74 *
75 * Don't play with these, please.
76 */
77
78 char *list; /* Current short options pointer */
79 int next; /* Next argument, unpermuted */
80 int order; /* Ordering of options, flags */
81 char *env; /* Where we are in the env var */
82 char *estart; /* Pointer to env var buffer */
83 }
84 mdwopt_data;
85
86 /*----- Global variables --------------------------------------------------*/
87
88 extern mdwopt_data mdwopt_global; /* The default global data */
89
90 /* --- For compatibility with older programs (and prettiness) --- *
91 *
92 * The macros here access the global structure defined above. I consider it
93 * to be perfectly acceptable to use these macros in new code, because it
94 * looks nicer than playing with @mdwopt_global@.
95 */
96
97 #define optarg (mdwopt_global.arg) /* Argument of current option */
98 #define optopt (mdwopt_global.opt) /* Code of current option */
99 #define opterr (mdwopt_global.err) /* Zero to report error messages */
100 #define optind (mdwopt_global.ind) /* Index of first non-option */
101 #define optprog (mdwopt_global.prog) /* Pointer to program name */
102
103 /*----- Type definitions --------------------------------------------------*/
104
105 /* --- Long options definition table --- */
106
107 struct option {
108 const char *name; /* Name of the long option */
109 int has_arg; /* Does it have an argument? */
110 int *flag; /* Address of flag variable */
111 int val; /* Value to store/return */
112 };
113
114 /* --- Old-style names for argument flags in long options table --- */
115
116 enum {
117 no_argument, /* No argument required */
118 required_argument, /* User must specify argument */
119 optional_argument /* Argument is optional */
120 };
121
122 /* --- New style flag names --- */
123
124 enum {
125 gFlag_argReq = 1, /* Required argument */
126 gFlag_argOpt = 2, /* Optional argument */
127 gFlag_switch = 4, /* OR val into flag, don't store */
128 gFlag_negate = 8, /* Allow long option to be negated */
129 gFlag__last_long_opt_flag = 0 /* Dummy value */
130 };
131
132 enum {
133 gFlag_noLongs = 1, /* Don't read long options */
134 gFlag_noShorts = 2, /* Don't read short options */
135 gFlag_numbers = 4, /* Read numeric options */
136 gFlag_negation = 8, /* Allow `%|+|%' for negations */
137 gFlag_envVar = 16, /* Parse options from env var */
138 gFlag_noProgName = 32, /* Don't set @optprog@ */
139 gFlag_negNumber = 64, /* Allow negated number options */
140 gFlag__last_mdwopt_flag = 0 /* Dummy value */
141 };
142
143 enum {
144 gFlag_negated = 256, /* Option flag was negated by user */
145 gFlag__last_return_flag = 0 /* Dummy value */
146 };
147
148 /*----- Main code ---------------------------------------------------------*/
149
150 /* --- @mdwopt@ --- *
151 *
152 * Arguments: @int argc@ = number of command line arguments
153 * @char * const *argv@ = pointer to command line arguments
154 * @const char *shortopt@ = pointer to short options information
155 * @const struct option *longopts@ = pointer to long opts info
156 * @int *longind@ = where to store matched longopt
157 * @mdwopt_data *data@ = persistent state for the parser
158 * @int flags@ = various useful flags
159 *
160 * Returns: Value of option found next, or an error character, or
161 * @EOF@ for the last thing.
162 *
163 * Use: Reads options. The routine should be more-or-less compatible
164 * with standard getopts, although it provides many more
165 * features even than the standard GNU implementation.
166 *
167 * The precise manner of options parsing is determined by
168 * various flag settings, which are described below. By setting
169 * flag values appropriately, you can achieve behaviour very
170 * similar to most other getopt routines.
171 *
172 *
173 * How options parsing appears to users
174 *
175 * A command line consists of a number of `words' (which may
176 * contain spaces, according to various shell quoting
177 * conventions). A word may be an option, an argument to an
178 * option, or a non-option. An option begins with a special
179 * character, usually `%|-|%', although `%|+|%' is also used
180 * sometimes. As special exceptions, the word containing only a
181 * `%|-|%' is considered to be a non-option, since it usually
182 * represents standard input or output as a filename, and the
183 * word containing a double-dash `%|--|%' is used to mark all
184 * following words as being non-options regardless of their
185 * initial character.
186 *
187 * Traditionally, all words after the first non-option have been
188 * considered to be non-options automatically, so that options
189 * must be specified before filenames. However, this
190 * implementation can extract all the options from the command
191 * line regardless of their position. This can usually be
192 * disabled by setting one of the environment variables
193 * `%|POSIXLY_CORRECT|%' or `%|_POSIX_OPTION_ORDER|%'.
194 *
195 * There are two different styles of options: `short' and
196 * `long'.
197 *
198 * Short options are the sort which Unix has known for ages: an
199 * option is a single letter, preceded by a `%|-|%'. Short
200 * options can be joined together to save space (and possibly to
201 * make silly words): e.g., instead of giving options
202 * `%|-x.-y|%', a user could write `%|-xy|%'. Some short
203 * options can have arguments, which appear after the option
204 * letter, either immediately following, or in the next `word'
205 * (so an option with an argument could be written as
206 * `%|-o foo|%' or as `%|-ofoo|%'). Note that options with
207 * optional arguments must be written in the second style.
208 *
209 * When a short option controls a flag setting, it is sometimes
210 * possible to explicitly turn the flag off, as well as turning
211 * it on, (usually to override default options). This is
212 * usually done by using a `%|+|%' instead of a `%|-|%' to
213 * introduce the option.
214 *
215 * Long options, as popularised by the GNU utilities, are given
216 * long-ish memorable names, preceded by a double-dash `%|--|%'.
217 * Since their names are more than a single character, long
218 * options can't be combined in the same way as short options.
219 * Arguments to long options may be given either in the same
220 * `word', separated from the option name by an equals sign, or
221 * in the following `word'.
222 *
223 * Long option names can be abbreviated if necessary, as long
224 * as the abbreviation is unique. This means that options can
225 * have sensible and memorable names but still not require much
226 * typing from an experienced user.
227 *
228 * Like short options, long options can control flag settings.
229 * The options to manipulate these settings come in pairs: an
230 * option of the form `%|--set-flag|%' might set the flag, while
231 * an option of the form `%|--no-set-flag|%' might clear it.
232 *
233 * It is usual for applications to provide both short and long
234 * options with identical behaviour. Some applications with
235 * lots of options may only provide long options (although they
236 * will often be only two or three characters long). In this
237 * case, long options can be preceded with a single `%|-|%'
238 * character, and negated by a `%|+|%' character.
239 *
240 * Finally, some (older) programs accept arguments of the form
241 * `%%@.{"-"<number>}%%', to set some numerical parameter,
242 * typically a line count of some kind.
243 *
244 *
245 * How programs parse options
246 *
247 * An application parses its options by calling mdwopt
248 * repeatedly. Each time it is called, mdwopt returns a value
249 * describing the option just read, and stores information about
250 * the option in a data block. The value %$-1$% is returned
251 * when there are no more options to be read. The `%|?|%'
252 * character is returned when an error is encountered.
253 *
254 * Before starting to parse options, the value @data->ind@ must
255 * be set to 0 or 1. The value of @data->err@ can also be set,
256 * to choose whether errors are reported by mdwopt.
257 *
258 * The program's `@argc@' and `@argv@' arguments are passed to
259 * the options parser, so that it can read the command line. A
260 * flags word is also passed, allowing the program fine control
261 * over parsing. The flags are described above.
262 *
263 * Short options are described by a string, which once upon a
264 * time just contained the permitted option characters. Now the
265 * options string begins with a collection of flag characters,
266 * and various flag characters can be put after options
267 * characters to change their properties.
268 *
269 * If the first character of the short options string is
270 * `%|+|%', `%|-|%' or `%|!|%', the order in which options are
271 * read is modified, as follows:
272 *
273 * `%|+|%' forces the POSIX order to be used. As soon as a non-
274 * option is found, mdwopt returns %$-1$%.
275 *
276 * `%|-|%' makes mdwopt treat non-options as being `special'
277 * sorts of option. When a non-option word is found, the
278 * value 0 is returned, and the actual text of the word
279 * is stored as being the option's argument.
280 *
281 * `%|!|%' forces the default order to be used. The entire
282 * command line is scanned for options, which are
283 * returned in order. However, during this process,
284 * the options are moved in the @argv@ array, so that
285 * they appear before the non- options.
286 *
287 * A `%|:|%' character may be placed after the ordering flag (or
288 * at the very beginning if no ordering flag is given) which
289 * indicates that the character `%|:|%', rather than `%|?|%',
290 * should be returned if a missing argument error is detected.
291 *
292 * Each option in the string can be followed by a `%|+|%' sign,
293 * indicating that it can be negated, a `%|:|%' sign indicating
294 * that it requires an argument, or a `%|::|%' string,
295 * indicating an optional argument. Both `%|+|%' and `%|:|%' or
296 * `%|::|%' may be given, although the `%|+|%' must come first.
297 *
298 * If an option is found, the option character is returned to
299 * the caller. A pointer to an argument is stored in
300 * @data->arg@, or @NULL@ is stored if there was no argument.
301 * If a negated option was found, the option character is
302 * returned ORred with @gFlag_negated@ (bit 8 set).
303 *
304 * Long options are described in a table. Each entry in the
305 * table is of type @struct option@, and the table is terminated
306 * by an entry whose @name@ field is null. Each option has
307 * a flags word which, due to historical reasons, is called
308 * @has_arg@. This describes various properties of the option,
309 * such as what sort of argument it takes, and whether it can
310 * be negated.
311 *
312 * When mdwopt finds a long option, it looks the name up in the
313 * table. The index of the matching entry is stored in the
314 * @longind@ variable, passed to mdwopt (unless @longind@ is 0):
315 * a value of %$-1$% indicates that no long option was
316 * found. The behaviour is then dependent on the values in the
317 * table entry. If @flag@ is nonzero, it points to an integer
318 * to be modified by mdwopt. Usually the value in the @val@
319 * field is simply stored in the @flag@ variable. If the flag
320 * @gFlag_switch@ is set, however, the value is combined with
321 * the existing value of the flags using a bitwise OR. If
322 * @gFlag_negate@ is set, then the flag bit will be cleared if a
323 * matching negated long option is found. The value 0 is
324 * returned.
325 *
326 * If @flag@ is zero, the value in @val@ is returned by mdwopt,
327 * possibly with bit 8 set if the option was negated.
328 *
329 * Arguments for long options are stored in @data->arg@, as
330 * before.
331 *
332 * Numeric options, if enabled, cause the value `%|#|%' to be
333 * returned, and the numeric value to be stored in @data->opt@.
334 *
335 * If the flag @gFlag_envVar@ is set on entry, options will be
336 * extracted from an environment variable whose name is built by
337 * capitalising all the letters of the program's name. (This
338 * allows a user to have different default settings for a
339 * program, by calling it through different symbolic links.) */
340
341 extern int mdwopt(int /*argc*/, char *const */*argv*/,
342 const char */*shortopt*/,
343 const struct option */*longopts*/, int */*longind*/,
344 mdwopt_data */*data*/, int /*flags*/);
345
346 /* --- Macros for more commonly used routines --- */
347
348 #define getopt(c, v, o) mdwopt(c, v, o, 0, 0, 0, gFlag_noLongs)
349 #define getopt_long(c, v, o, l, li) mdwopt(c, v, o, l, li, 0, 0)
350 #define getopt_long_only(c, v, o, l, li) \
351 mdwopt(c, v, o, l, li, 0, gFlag_noShorts)
352
353 #ifdef __cplusplus
354 }
355 #endif
356
357 /*----- C++ wrapper class -------------------------------------------------*/
358
359 #ifdef __cplusplus
360
361 /* --- Class: @MdwOpt@ --- *
362 *
363 * Parent: ---
364 *
365 * Methods: @MdwOpt@ -- construct a new mdwopt object with the given
366 * arguments. These are remembered for later use.
367 * @arg@ -- return the argument of the current option
368 * arguments. These are remembered for later use.
369 * @arg@ -- return the argument of the current option
370 * @opt@ -- return the value of the current option
371 * @ind@ -- return the index of the next unread argument
372 * @longind@ -- return index of current long option in table
373 * @errors@ -- return or set whether we report errors to the
374 * user
375 * @prog@ -- return program name from @argv[0]@
376 * @next@ -- return next option read from the table
377 *
378 * Use: A simple C++ class for encapsulating the options parser.
379 * The methods are all nice and simple, and extremely similar
380 * to the normal C interface described above.
381 */
382
383 class MdwOpt {
384 protected:
385 int argc;
386 char * const *argv;
387 const char *shortopts;
388 const struct option *longopts;
389 int long_ind;
390 int flags;
391
392 mdwopt_data data;
393
394 public:
395 MdwOpt(int c, char * const *v, const char *so,
396 const struct option *lo, int f=0) :
397 argc(c), argv(v), shortopts(so), longopts(lo), flags(f) {
398 data.ind = 0;
399 data.err = 1;
400 }
401
402 const char *arg(void) const { return (data.arg); }
403 int opt(void) const { return (data.opt); }
404 int errors(void) const { return (data.err); }
405 int errors(int e) { int oe = data.err; data.err = e; return (oe); }
406 int ind(void) const { return (data.ind); }
407 int longind(void) const { return (long_ind); }
408 const char *prog(void) const { return (data.prog); }
409
410 int next(void) {
411 return (mdwopt(argc, argv, shortopts,
412 longopts, &long_ind, &data, flags));
413 }
414 };
415
416 #endif
417
418 /*----- That's all, folks -------------------------------------------------*/
419
420 #endif