Bump copyright dates, and change the one at the start of the manual to be
[sgt/halibut] / halibut.h
CommitLineData
d7482997 1#ifndef HALIBUT_HALIBUT_H
2#define HALIBUT_HALIBUT_H
3
4#include <stdio.h>
5#include <wchar.h>
6#include <time.h>
9c1cf191 7#include <string.h>
d7482997 8
e34ba5c3 9#include "charset.h"
10
/*
 * NORETURN is written after a function declarator to mark the
 * function as never returning. It expands to the GNU `noreturn'
 * attribute when __GNUC__ is defined, and to nothing otherwise.
 */
#ifdef __GNUC__
#define NORETURN __attribute__((__noreturn__))
#else
#define NORETURN /* nothing */
#endif
16
/*
 * Boolean constants, defined only if nothing seen earlier has already
 * defined them.
 */
#ifndef TRUE
#define TRUE 1
#endif
#ifndef FALSE
#define FALSE 0
#endif
23
/*
 * For suppressing unused-parameter warnings.
 *
 * The argument is evaluated and discarded through a cast to void.
 * Unlike a self-assignment, this also compiles for const-qualified
 * parameters and does not provoke self-assignment warnings.
 */
#define IGNORE(x) ( (void) (x) )
26
27#include "tree234.h"
28
/*
 * Structure tags. The typedef names are introduced ahead of the
 * structure definitions so that the declarations below can refer to
 * each structure by pointer.
 */
typedef struct input_Tag input;
typedef struct filepos_Tag filepos;
typedef struct paragraph_Tag paragraph;
typedef struct word_Tag word;
typedef struct keywordlist_Tag keywordlist;
typedef struct keyword_Tag keyword;
typedef struct numberstate_Tag numberstate;
typedef struct indexdata_Tag indexdata;
typedef struct indextag_Tag indextag;
typedef struct indexentry_Tag indexentry;
typedef struct macrostack_Tag macrostack;
43
/*
 * Data structure to hold a file name, a line number and a column
 * number, for reporting errors.
 */
struct filepos_Tag {
    char *filename;
    int line, col;
};
52
53/*
54 * Data structure to hold all the file names etc for input
55 */
56typedef struct pushback_Tag {
57 int chr;
58 filepos pos;
59} pushback;
60struct input_Tag {
61 char **filenames; /* complete list of input files */
62 int nfiles; /* how many in the list */
63 FILE *currfp; /* the currently open one */
64 int currindex; /* which one is that in the list */
65 pushback *pushback; /* pushed-back input characters */
66 int npushback, pushbacksize;
67 filepos pos;
68 int reportcols; /* report column numbers in errors */
69 macrostack *stack; /* macro expansions in force */
e34ba5c3 70 int defcharset, charset; /* character sets for input files */
71 charset_state csstate;
72 wchar_t wc[16]; /* wide chars from input conversion */
73 int nwc, wcpos; /* size of, and position in, wc[] */
e4ea58f8 74 char *pushback_chars; /* used to save input-encoding data */
d7482997 75};
76
77/*
78 * Data structure to hold the input form of the source, ie a linked
79 * list of paragraphs
80 */
81struct paragraph_Tag {
82 paragraph *next;
83 int type;
84 wchar_t *keyword; /* for most special paragraphs */
e4ea58f8 85 char *origkeyword; /* same again in original charset */
d7482997 86 word *words; /* list of words in paragraph */
87 int aux; /* number, in a numbered paragraph
88 * or subsection level
89 */
90 word *kwtext; /* chapter/section indication */
91 word *kwtext2; /* numeric-only form of kwtext */
92 filepos fpos;
93
94 paragraph *parent, *child, *sibling; /* for hierarchy navigation */
95
96 void *private_data; /* for temp use in backends */
97};
/*
 * Paragraph types. Values are assigned consecutively from zero, and
 * para_NotParaType is always the last one.
 */
enum {
    para_IM,                   /* index merge */
    para_BR,                   /* bibliography rewrite */
    para_Rule,                 /* random horizontal rule */
    para_Chapter,
    para_Appendix,
    para_UnnumberedChapter,
    para_Heading,
    para_Subsect,
    para_Normal,
    para_Biblio,               /* causes no output unless turned ... */
    para_BiblioCited,          /*  ... into this paragraph type */
    para_Bullet,
    para_NumberedList,
    para_DescribedThing,
    para_Description,
    para_Code,
    para_Copyright,
    para_NoCite,
    para_Title,
    para_VersionID,
    para_Config,               /* configuration directive */
    para_LcontPush,            /* begin continuation of list item */
    para_LcontPop,             /* end continuation of list item */
    para_QuotePush,            /* begin block quote */
    para_QuotePop,             /* end block quote */
    /*
     * Back ends may define their own paragraph types beyond here,
     * in case they need to use them internally.
     */
    para_NotParaType           /* placeholder value */
};
130
131/*
132 * Data structure to hold an individual word
133 */
134struct word_Tag {
135 word *next, *alt;
136 int type;
137 int aux;
138 int breaks; /* can a line break after it? */
139 wchar_t *text;
140 filepos fpos;
5dd44dce 141
142 void *private_data; /* for temp use in backends */
d7482997 143};
/*
 * Word types. The first three groups of four (normal words, spaces,
 * quotes) are laid out in parallel so that the low two bits of a
 * value select the text style within its group; the style macros
 * that follow this enum depend on that layout.
 */
enum {
    /* ORDERING CONSTRAINT: these normal-word types ... */
    word_Normal,
    word_Emph,
    word_Code,                 /* monospaced; `quoted' in text */
    word_WeakCode,             /* monospaced, normal in text */
    /* ... must be in the same order as these space types ... */
    word_WhiteSpace,           /* text is NULL or ignorable */
    word_EmphSpace,            /* WhiteSpace when emphasised */
    word_CodeSpace,            /* WhiteSpace when code */
    word_WkCodeSpace,          /* WhiteSpace when weak code */
    /* ... and must be in the same order as these quote types ... */
    word_Quote,                /* text is NULL or ignorable */
    word_EmphQuote,            /* Quote when emphasised */
    word_CodeQuote,            /* (can't happen) */
    word_WkCodeQuote,          /* (can't happen) */
    /* END ORDERING CONSTRAINT */
    word_internal_endattrs,
    word_UpperXref,            /* \K */
    word_LowerXref,            /* \k */
    word_XrefEnd,              /* (invisible; no text) */
    word_IndexRef,             /* (always an invisible one) */
    word_HyperLink,            /* (invisible) */
    word_HyperEnd,             /* (also invisible; no text) */
    /*
     * Back ends may define their own word types beyond here, in
     * case they need to use them internally.
     */
    word_NotWordType           /* placeholder value */
};
/* aux values for attributed words; attr_mask covers all of them */
enum {
    attr_Only   = 0x0000,      /* a lone word with the attribute */
    attr_First  = 0x0001,      /* the first of a series */
    attr_Last   = 0x0002,      /* the last of a series */
    attr_Always = 0x0003,      /* any other part of a series */
    attr_mask   = 0x0003
};
/* aux values for quote-type words; quote_mask covers both bits */
enum {
    quote_Open  = 0x0010,
    quote_Close = 0x0020,
    quote_mask  = 0x0030
};
/*
 * Helpers for word types. All of them rely on the ordering constraint
 * in the word-type enum: the low two bits of a type select the style
 * within its group of four.
 *
 * isattr(x):       nonzero if x lies strictly between word_Normal and
 *                  word_WhiteSpace, or strictly between
 *                  word_WhiteSpace and word_internal_endattrs.
 *                  NOTE(review): as written, the second range accepts
 *                  word_Quote itself, whereas word_Normal and
 *                  word_WhiteSpace are rejected - confirm intended.
 * sameattr(x,y):   nonzero if x and y have the same low two bits.
 * towordstyle(x):  the normal-word type with the style bits of x.
 * tospacestyle(x): the space type with the style bits of x.
 * toquotestyle(x): the quote type with the style bits of x.
 * removeattr(x):   x with its style bits cleared, offset by
 *                  word_Normal.
 */
#define isattr(x) ( ( (x) > word_Normal && (x) < word_WhiteSpace ) || \
                    ( (x) > word_WhiteSpace && (x) < word_internal_endattrs ) )
#define sameattr(x,y) ( (((x)-(y)) & 3) == 0 )
#define towordstyle(x) ( word_Normal + ((x) & 3) )
#define tospacestyle(x) ( word_WhiteSpace + ((x) & 3) )
#define toquotestyle(x) ( word_Quote + ((x) & 3) )
#define removeattr(x) ( word_Normal + ((x) &~ 3) )

/* Extract the attribute / quote part of a word's aux value. */
#define attraux(x) ( (x) & attr_mask )
#define quoteaux(x) ( (x) & quote_mask )
198
199/*
200 * error.c
201 */
202void fatal(int code, ...) NORETURN;
203void error(int code, ...);
/*
 * Error codes, numbered consecutively from zero. Each comment gives
 * the gist of the corresponding message.
 */
enum {
    err_nomemory,              /* out of memory */
    err_optnoarg,              /* option `-%s' requires an argument */
    err_nosuchopt,             /* unrecognised option `-%s' */
    err_cmdcharset,            /* unrecognised charset %s (cmdline) */
    err_futileopt,             /* futile option `-%s'%s */
    err_noinput,               /* no input files */
    err_cantopen,              /* unable to open input file `%s' */
    err_nodata,                /* no data in input files */
    err_brokencodepara,        /* line in codepara didn't begin `\c' */
    err_kwunclosed,            /* expected `}' after keyword */
    err_kwillegal,             /* paragraph type expects no keyword */
    err_kwexpected,            /* paragraph type expects a keyword */
    err_kwtoomany,             /* paragraph type expects only 1 */
    err_bodyillegal,           /* paragraph type expects only kws! */
    err_badparatype,           /* invalid command at start of para */
    err_badmidcmd,             /* invalid command in mid-para */
    err_unexbrace,             /* unexpected brace */
    err_explbr,                /* expected `{' after command */
    err_commenteof,            /* EOF inside braced comment */
    err_kwexprbr,              /* expected `}' after cross-ref */
    err_codequote,             /* \q within \c is not supported */
    err_missingrbrace,         /* unclosed braces at end of para */
    err_missingrbrace2,        /* unclosed braces at end of file */
    err_nestedstyles,          /* unable to nest text styles */
    err_nestedindex,           /* unable to nest `\i' thingys */
    err_indexcase,             /* two \i differing only in case */
    err_nosuchkw,              /* unresolved cross-reference */
    err_multiBR,               /* multiple \BRs on same keyword */
    err_nosuchidxtag,          /* \IM on unknown index tag (warning) */
    err_cantopenw,             /* can't open output file for write */
    err_macroexists,           /* this macro already exists */
    err_sectjump,              /* jump a heading level, eg \C -> \S */
    err_winhelp_ctxclash,      /* WinHelp context ID hash clash */
    err_multikw,               /* keyword clash in sections */
    err_misplacedlcont,        /* \lcont not after a list item */
    err_sectmarkerinblock,     /* section marker appeared in block */
    err_cfginsufarg,           /* \cfg{%s} insufficient args (<%d) */
    err_infonodechar,          /* colon/comma in node name in info */
    err_text_codeline,         /* \c line too long in text backend */
    err_htmlver,               /* unrecognised HTML version keyword */
    err_charset,               /* unrecognised character set name */
    err_nofont,                /* unrecognised font name */
    err_afmeof,                /* eof in AFM file */
    err_afmkey,                /* missing expected keyword in AFM */
    err_afmvers,               /* unsupported AFM version */
    err_afmval,                /* missing value(s) for AFM key */
    err_pfeof,                 /* eof in Type 1 font file */
    err_pfhead,                /* bad Type 1 header line */
    err_pfbad,                 /* otherwise invalid Type 1 font */
    err_pfnoafm,               /* Type 1 font but no AFM */
    err_chmnames,              /* need both or neither of hhp+chm */
    err_whatever               /* random error of another type */
};
258
/*
 * malloc.c
 *
 * Allocation wrappers. When LOGALLOC is defined, each function takes
 * the calling file name and line number as extra leading arguments,
 * and the macros of the same names supply __FILE__ and __LINE__, so
 * call sites are written identically in both configurations.
 */
#ifdef LOGALLOC
void *smalloc(char *file, int line, int size);
void *srealloc(char *file, int line, void *p, int size);
void sfree(char *file, int line, void *p);
#define smalloc(x) smalloc(__FILE__, __LINE__, x)
#define srealloc(x, y) srealloc(__FILE__, __LINE__, x, y)
#define sfree(x) sfree(__FILE__, __LINE__, x)
#else
void *smalloc(int size);
void *srealloc(void *p, int size);
void sfree(void *p);
#endif
274void free_word_list(word *w);
275void free_para_list(paragraph *p);
276word *dup_word_list(word *w);
277char *dupstr(char *s);
278
/*
 * Typed allocation helpers built on smalloc/srealloc:
 *
 *   snew(type)                    one object of `type'
 *   snewn(number, type)           array of `number' objects
 *   sresize(array, number, type)  resize `array' to `number' objects
 *
 * Each casts the result to `type *'. lenof(array) is the element
 * count of a true array (not a pointer).
 */
#define snew(type) ( (type *) smalloc (sizeof (type)) )
#define snewn(number, type) ( (type *) smalloc ((number) * sizeof (type)) )
#define sresize(array, number, type) \
        ( (type *) srealloc ((array), (number) * sizeof (type)) )
#define lenof(array) ( sizeof(array) / sizeof(*(array)) )
284
285/*
286 * ustring.c
287 */
e4ea58f8 288wchar_t *ustrdup(wchar_t const *s);
289char *ustrtoa(wchar_t const *s, char *outbuf, int size, int charset);
290char *ustrtoa_careful(wchar_t const *s, char *outbuf, int size, int charset);
291wchar_t *ustrfroma(char const *s, wchar_t *outbuf, int size, int charset);
292char *utoa_dup(wchar_t const *s, int charset);
293char *utoa_dup_len(wchar_t const *s, int charset, int *len);
294char *utoa_careful_dup(wchar_t const *s, int charset);
295wchar_t *ufroma_dup(char const *s, int charset);
7e976207 296char *utoa_locale_dup(wchar_t const *s);
297wchar_t *ufroma_locale_dup(char const *s);
5dd44dce 298int ustrlen(wchar_t const *s);
d7482997 299wchar_t *uadv(wchar_t *s);
5dd44dce 300wchar_t *ustrcpy(wchar_t *dest, wchar_t const *source);
08e78486 301wchar_t *ustrncpy(wchar_t *dest, wchar_t const *source, int n);
d7482997 302wchar_t utolower(wchar_t);
831da32e 303int uisalpha(wchar_t);
d7482997 304int ustrcmp(wchar_t *lhs, wchar_t *rhs);
78c73085 305int ustricmp(wchar_t const *lhs, wchar_t const *rhs);
306int ustrnicmp(wchar_t const *lhs, wchar_t const *rhs, int maxlen);
dd567011 307int utoi(wchar_t const *);
308double utof(wchar_t const *);
309int utob(wchar_t const *);
d7482997 310int uisdigit(wchar_t);
311wchar_t *ustrlow(wchar_t *s);
c8422236 312wchar_t *ustrftime(const wchar_t *wfmt, const struct tm *timespec);
91f93b94 313int cvt_ok(int charset, const wchar_t *s);
0960a3d8 314int charset_from_ustr(filepos *fpos, const wchar_t *name);
d7482997 315
/*
 * wcwidth.c
 *
 * Width of a char string or a wide string, given a charset.
 */
int strwid(char const *s, int charset);
int ustrwid(wchar_t const *s, int charset);
321
/*
 * help.c
 *
 * Informational routines; none takes arguments or returns a value.
 */
void help(void);
void usage(void);
void showversion(void);
void listcharsets(void);
d7482997 329
/*
 * licence.c
 */
void licence(void);
334
/*
 * version.c
 *
 * The version string; both the pointer and the characters are const.
 */
extern const char *const version;
d7482997 339
/*
 * misc.c
 */
char *adv(char *s);
344
/*
 * Stack of void pointers. `stack' is itself a pointer type, so it is
 * passed by value to the functions below.
 */
typedef struct stackTag *stack;
stack stk_new(void);
void stk_free(stack);
void stk_push(stack, void *);
void *stk_pop(stack);
void *stk_top(stack);
d7482997 351
/*
 * String buffers: rdstring holds wchar_t text, rdstringc holds char
 * text. The empty_* constants are provided as initial values.
 * NOTE(review): `pos' and `size' presumably track the used length and
 * the allocated capacity - confirm against misc.c.
 */
typedef struct tagRdstring rdstring;
struct tagRdstring {
    int pos, size;
    wchar_t *text;
};
typedef struct tagRdstringc rdstringc;
struct tagRdstringc {
    int pos, size;
    char *text;
};
extern const rdstring empty_rdstring;
extern const rdstringc empty_rdstringc;
void rdadd(rdstring *rs, wchar_t c);
void rdadds(rdstring *rs, wchar_t const *p);
wchar_t *rdtrim(rdstring *rs);
void rdaddc(rdstringc *rs, char c);
void rdaddsc(rdstringc *rs, char const *p);
void rdaddsn(rdstringc *rc, char const *p, int len);
char *rdtrimc(rdstringc *rs);
371
372int compare_wordlists(word *a, word *b);
373
bb9e7835 374void mark_attr_ends(word *words);
d7482997 375
376typedef struct tagWrappedLine wrappedline;
377struct tagWrappedLine {
378 wrappedline *next;
379 word *begin, *end; /* first & last words of line */
380 int nspaces; /* number of whitespaces in line */
381 int shortfall; /* how much shorter than max width */
382};
43341922 383wrappedline *wrap_para(word *, int, int, int (*)(void *, word *), void *, int);
d7482997 384void wrap_free(wrappedline *);
e4ea58f8 385void cmdline_cfg_add(paragraph *cfg, char *string);
386paragraph *cmdline_cfg_new(void);
387paragraph *cmdline_cfg_simple(char *string, ...);
d7482997 388
389/*
390 * input.c
391 */
392paragraph *read_input(input *in, indexdata *idx);
393
394/*
ba0fe3ec 395 * in_afm.c
396 */
397void read_afm_file(input *in);
398
399/*
44407fea 400 * in_pf.c
401 */
402void read_pfa_file(input *in);
403
404/*
d7482997 405 * keywords.c
406 */
407struct keywordlist_Tag {
408 int nkeywords;
409 int size;
410 tree234 *keys; /* sorted by `key' field */
411 word **looseends; /* non-keyword list element numbers */
412 int nlooseends;
413 int looseendssize;
414};
415struct keyword_Tag {
416 wchar_t *key; /* the keyword itself */
417 word *text; /* "Chapter 2", "Appendix Q"... */
418 /* (NB: filepos are not set) */
419 paragraph *para; /* the paragraph referenced */
420};
421keyword *kw_lookup(keywordlist *, wchar_t *);
422keywordlist *get_keywords(paragraph *);
423void free_keywords(keywordlist *);
424void subst_keywords(paragraph *, keywordlist *);
425
426/*
427 * index.c
428 */
429
430/*
431 * Data structure to hold both sides of the index.
432 */
433struct indexdata_Tag {
434 tree234 *tags; /* holds type `indextag' */
435 tree234 *entries; /* holds type `indexentry' */
436};
437
438/*
439 * Data structure to hold an index tag (LHS of index).
440 */
441struct indextag_Tag {
442 wchar_t *name;
443 word *implicit_text;
f4551933 444 filepos implicit_fpos;
d7482997 445 word **explicit_texts;
f4551933 446 filepos *explicit_fpos;
d7482997 447 int nexplicit, explicit_size;
448 int nrefs;
449 indexentry **refs; /* array of entries referenced by tag */
450};
451
452/*
453 * Data structure to hold an index entry (RHS of index).
454 */
455struct indexentry_Tag {
456 word *text;
457 void *backend_data; /* private to back end */
f4551933 458 filepos fpos;
d7482997 459};
460
461indexdata *make_index(void);
462void cleanup_index(indexdata *);
463/* index_merge takes responsibility for freeing arg 3 iff implicit; never
464 * takes responsibility for arg 2 */
f4551933 465void index_merge(indexdata *, int is_explicit, wchar_t *, word *, filepos *);
d7482997 466void build_index(indexdata *);
467void index_debug(indexdata *);
468indextag *index_findtag(indexdata *idx, wchar_t *name);
469
470/*
471 * contents.c
472 */
473numberstate *number_init(void);
474void number_cfg(numberstate *, paragraph *);
96f3af16 475word *number_mktext(numberstate *, paragraph *, wchar_t *, int *, int *);
d7482997 476void number_free(numberstate *);
477
478/*
479 * biblio.c
480 */
481void gen_citations(paragraph *, keywordlist *);
482
483/*
d7482997 484 * bk_text.c
485 */
43341922 486void text_backend(paragraph *, keywordlist *, indexdata *, void *);
ba9c1487 487paragraph *text_config_filename(char *filename);
d7482997 488
489/*
78c73085 490 * bk_html.c
d7482997 491 */
78c73085 492void html_backend(paragraph *, keywordlist *, indexdata *, void *);
493paragraph *html_config_filename(char *filename);
d7482997 494
495/*
496 * bk_whlp.c
497 */
43341922 498void whlp_backend(paragraph *, keywordlist *, indexdata *, void *);
ba9c1487 499paragraph *whlp_config_filename(char *filename);
d7482997 500
7136a6c7 501/*
502 * bk_man.c
503 */
43341922 504void man_backend(paragraph *, keywordlist *, indexdata *, void *);
ba9c1487 505paragraph *man_config_filename(char *filename);
7136a6c7 506
5dd44dce 507/*
508 * bk_info.c
509 */
43341922 510void info_backend(paragraph *, keywordlist *, indexdata *, void *);
5dd44dce 511paragraph *info_config_filename(char *filename);
512
43341922 513/*
514 * bk_paper.c
515 */
516void *paper_pre_backend(paragraph *, keywordlist *, indexdata *);
517
518/*
519 * bk_ps.c
520 */
521void ps_backend(paragraph *, keywordlist *, indexdata *, void *);
522paragraph *ps_config_filename(char *filename);
523
524/*
525 * bk_pdf.c
526 */
527void pdf_backend(paragraph *, keywordlist *, indexdata *, void *);
528paragraph *pdf_config_filename(char *filename);
529
d7482997 530#endif