input.c was capable of generating a paragraph structure with no text
[sgt/halibut] / halibut.h
Commit | Line | Data
d7482997 1#ifndef HALIBUT_HALIBUT_H
2#define HALIBUT_HALIBUT_H
3
4#include <stdio.h>
5#include <wchar.h>
6#include <time.h>
9c1cf191 7#include <string.h>
d7482997 8
e34ba5c3 9#include "charset.h"
10
/*
 * NORETURN: placed after a function declarator to mark it as never
 * returning. Expands to the GNU attribute under __GNUC__ and to
 * nothing elsewhere.
 */
#ifdef __GNUC__
#define NORETURN __attribute__((__noreturn__))
#else
#define NORETURN /* nothing */
#endif

/* Boolean constants, defined only if nothing has supplied them already. */
#ifndef TRUE
#define TRUE 1
#endif
#ifndef FALSE
#define FALSE 0
#endif

/*
 * For suppressing unused-parameter warnings.
 *
 * Implemented as a cast to void rather than a self-assignment, so it
 * also works on const-qualified parameters and never writes to (x).
 */
#define IGNORE(x) ( (void)(x) )

27#include "tree234.h"
28
/*
 * Structure tags
 *
 * Forward typedefs for the struct types used throughout this header,
 * so that declarations can refer to them before (or without) the
 * full struct definitions.
 */
typedef struct input_Tag input;
typedef struct filepos_Tag filepos;
typedef struct paragraph_Tag paragraph;
typedef struct word_Tag word;
typedef struct keywordlist_Tag keywordlist;
typedef struct keyword_Tag keyword;
typedef struct userstyle_Tag userstyle;
typedef struct numberstate_Tag numberstate;
typedef struct indexdata_Tag indexdata;
typedef struct indextag_Tag indextag;
typedef struct indexentry_Tag indexentry;
typedef struct macrostack_Tag macrostack;

/*
 * Data structure to hold a file name, a line number and a column
 * number, for reporting errors
 */
struct filepos_Tag {
    char *filename;
    int line, col;
};

54/*
55 * Data structure to hold all the file names etc for input
56 */
57typedef struct pushback_Tag {
58 int chr;
59 filepos pos;
60} pushback;
61struct input_Tag {
62 char **filenames; /* complete list of input files */
63 int nfiles; /* how many in the list */
64 FILE *currfp; /* the currently open one */
65 int currindex; /* which one is that in the list */
66 pushback *pushback; /* pushed-back input characters */
67 int npushback, pushbacksize;
68 filepos pos;
69 int reportcols; /* report column numbers in errors */
70 macrostack *stack; /* macro expansions in force */
e34ba5c3 71 int defcharset, charset; /* character sets for input files */
72 charset_state csstate;
73 wchar_t wc[16]; /* wide chars from input conversion */
74 int nwc, wcpos; /* size of, and position in, wc[] */
e4ea58f8 75 char *pushback_chars; /* used to save input-encoding data */
d7482997 76};
77
78/*
79 * Data structure to hold the input form of the source, ie a linked
80 * list of paragraphs
81 */
82struct paragraph_Tag {
83 paragraph *next;
84 int type;
85 wchar_t *keyword; /* for most special paragraphs */
e4ea58f8 86 char *origkeyword; /* same again in original charset */
d7482997 87 word *words; /* list of words in paragraph */
88 int aux; /* number, in a numbered paragraph
89 * or subsection level
90 */
91 word *kwtext; /* chapter/section indication */
92 word *kwtext2; /* numeric-only form of kwtext */
93 filepos fpos;
94
95 paragraph *parent, *child, *sibling; /* for hierarchy navigation */
96
97 void *private_data; /* for temp use in backends */
98};
/*
 * Paragraph types. The enumerators take consecutive values starting
 * at zero, so their order here determines their numeric values.
 */
enum {
    para_IM,                           /* index merge */
    para_BR,                           /* bibliography rewrite */
    para_Rule,                         /* random horizontal rule */
    para_Chapter,
    para_Appendix,
    para_UnnumberedChapter,
    para_Heading,
    para_Subsect,
    para_Normal,
    para_Biblio,                       /* causes no output unless turned ... */
    para_BiblioCited,                  /*  ... into this paragraph type */
    para_Bullet,
    para_NumberedList,
    para_DescribedThing,
    para_Description,
    para_Code,
    para_Copyright,
    para_NoCite,
    para_Title,
    para_VersionID,
    para_Config,                       /* configuration directive */
    para_LcontPush,                    /* begin continuation of list item */
    para_LcontPop,                     /* end continuation of list item */
    para_QuotePush,                    /* begin block quote */
    para_QuotePop,                     /* end block quote */
    /*
     * Back ends may define their own paragraph types beyond here,
     * in case they need to use them internally.
     */
    para_NotParaType                   /* placeholder value */
};

132/*
133 * Data structure to hold an individual word
134 */
135struct word_Tag {
136 word *next, *alt;
137 int type;
138 int aux;
139 int breaks; /* can a line break after it? */
140 wchar_t *text;
141 filepos fpos;
5dd44dce 142
143 void *private_data; /* for temp use in backends */
d7482997 144};
/*
 * Word types. The first three groups of four (normal words, spaces,
 * quotes) are laid out in parallel so that the low two bits of the
 * value select the text style within each group.
 */
enum {
    /* ORDERING CONSTRAINT: these normal-word types ... */
    word_Normal,
    word_Emph,
    word_Code,                         /* monospaced; `quoted' in text */
    word_WeakCode,                     /* monospaced, normal in text */
    /* ... must be in the same order as these space types ... */
    word_WhiteSpace,                   /* text is NULL or ignorable */
    word_EmphSpace,                    /* WhiteSpace when emphasised */
    word_CodeSpace,                    /* WhiteSpace when code */
    word_WkCodeSpace,                  /* WhiteSpace when weak code */
    /* ... and must be in the same order as these quote types ... */
    word_Quote,                        /* text is NULL or ignorable */
    word_EmphQuote,                    /* Quote when emphasised */
    word_CodeQuote,                    /* (can't happen) */
    word_WkCodeQuote,                  /* (can't happen) */
    /* END ORDERING CONSTRAINT */
    word_internal_endattrs,
    word_UpperXref,                    /* \K */
    word_LowerXref,                    /* \k */
    word_XrefEnd,                      /* (invisible; no text) */
    word_IndexRef,                     /* (always an invisible one) */
    word_HyperLink,                    /* (invisible) */
    word_HyperEnd,                     /* (also invisible; no text) */
    /*
     * Back ends may define their own word types beyond here, in
     * case they need to use them internally.
     */
    word_NotWordType                   /* placeholder value */
};
/* aux values for attributed words */
enum {
    attr_Only   = 0x0000,              /* a lone word with the attribute */
    attr_First  = 0x0001,              /* the first of a series */
    attr_Last   = 0x0002,              /* the last of a series */
    attr_Always = 0x0003,              /* any other part of a series */
    attr_mask   = 0x0003
};
/* aux values for quote-type words */
enum {
    quote_Open  = 0x0010,
    quote_Close = 0x0020,
    quote_mask  = 0x0030
};
/*
 * isattr(x): nonzero for word types strictly between word_Normal and
 * word_WhiteSpace, or strictly between word_WhiteSpace and
 * word_internal_endattrs.
 * NOTE(review): as written this is also true for plain word_Quote;
 * confirm that is intended.
 */
#define isattr(x) ( ( (x) > word_Normal && (x) < word_WhiteSpace ) || \
                    ( (x) > word_WhiteSpace && (x) < word_internal_endattrs ) )
/* sameattr(x,y): nonzero when x and y differ by a multiple of 4. */
#define sameattr(x,y) ( (((x)-(y)) & 3) == 0 )
/* Map the low two bits of x onto the normal-word, space or quote group. */
#define towordstyle(x) ( word_Normal + ((x) & 3) )
#define tospacestyle(x) ( word_WhiteSpace + ((x) & 3) )
#define toquotestyle(x) ( word_Quote + ((x) & 3) )
/* removeattr(x): clear the low two bits of x, offset by word_Normal. */
#define removeattr(x) ( word_Normal + ((x) &~ 3) )

/* Extract the attr_* or quote_* bits from an aux value. */
#define attraux(x) ( (x) & attr_mask )
#define quoteaux(x) ( (x) & quote_mask )

200/*
201 * error.c
202 */
203void fatal(int code, ...) NORETURN;
204void error(int code, ...);
/*
 * Error codes. The comment on each enumerator gives the gist of the
 * corresponding message.
 */
enum {
    err_nomemory,                      /* out of memory */
    err_optnoarg,                      /* option `-%s' requires an argument */
    err_nosuchopt,                     /* unrecognised option `-%s' */
    err_cmdcharset,                    /* unrecognised charset %s (cmdline) */
    err_futileopt,                     /* futile option `-%s'%s */
    err_noinput,                       /* no input files */
    err_cantopen,                      /* unable to open input file `%s' */
    err_nodata,                        /* no data in input files */
    err_brokencodepara,                /* line in codepara didn't begin `\c' */
    err_kwunclosed,                    /* expected `}' after keyword */
    err_kwillegal,                     /* paragraph type expects no keyword */
    err_kwexpected,                    /* paragraph type expects a keyword */
    err_kwtoomany,                     /* paragraph type expects only 1 */
    err_bodyillegal,                   /* paragraph type expects only kws! */
    err_badparatype,                   /* invalid command at start of para */
    err_badmidcmd,                     /* invalid command in mid-para */
    err_unexbrace,                     /* unexpected brace */
    err_explbr,                        /* expected `{' after command */
    err_commenteof,                    /* EOF inside braced comment */
    err_kwexprbr,                      /* expected `}' after cross-ref */
    err_codequote,                     /* \q within \c is not supported */
    err_missingrbrace,                 /* unclosed braces at end of para */
    err_missingrbrace2,                /* unclosed braces at end of file */
    err_nestedstyles,                  /* unable to nest text styles */
    err_nestedindex,                   /* unable to nest `\i' thingys */
    err_indexcase,                     /* two \i differing only in case */
    err_nosuchkw,                      /* unresolved cross-reference */
    err_multiBR,                       /* multiple \BRs on same keyword */
    err_nosuchidxtag,                  /* \IM on unknown index tag (warning) */
    err_cantopenw,                     /* can't open output file for write */
    err_macroexists,                   /* this macro already exists */
    err_sectjump,                      /* jump a heading level, eg \C -> \S */
    err_winhelp_ctxclash,              /* WinHelp context ID hash clash */
    err_multikw,                       /* keyword clash in sections */
    err_misplacedlcont,                /* \lcont not after a list item */
    err_sectmarkerinblock,             /* section marker appeared in block */
    err_cfginsufarg,                   /* \cfg{%s} insufficient args (<%d) */
    err_infonodechar,                  /* colon/comma in node name in info */
    err_text_codeline,                 /* \c line too long in text backend */
    err_htmlver,                       /* unrecognised HTML version keyword */
    err_charset,                       /* unrecognised character set name */
    err_emptypara,                     /* paragraph contains no actual text */
    err_whatever                       /* random error of another type */
};

251/*
252 * malloc.c
253 */
254#ifdef LOGALLOC
255void *smalloc(char *file, int line, int size);
256void *srealloc(char *file, int line, void *p, int size);
257void sfree(char *file, int line, void *p);
258#define smalloc(x) smalloc(__FILE__, __LINE__, x)
259#define srealloc(x, y) srealloc(__FILE__, __LINE__, x, y)
260#define sfree(x) sfree(__FILE__, __LINE__, x)
261#else
262void *smalloc(int size);
263void *srealloc(void *p, int size);
264void sfree(void *p);
265#endif
266void free_word_list(word *w);
267void free_para_list(paragraph *p);
268word *dup_word_list(word *w);
269char *dupstr(char *s);
270
/*
 * Typed allocation helpers built on smalloc/srealloc:
 *   snew(type)                  - space for one object of `type'
 *   snewn(number, type)         - space for `number' objects of `type'
 *   sresize(array, number, type) - resize `array' to `number' objects
 * Each casts the result to (type *). The byte count is computed with
 * sizeof and passed straight through; no overflow check is made here.
 */
#define snew(type) ( (type *) smalloc (sizeof (type)) )
#define snewn(number, type) ( (type *) smalloc ((number) * sizeof (type)) )
#define sresize(array, number, type) \
        ( (type *) srealloc ((array), (number) * sizeof (type)) )
/* Number of elements in a true array (not valid on a pointer). */
#define lenof(array) ( sizeof(array) / sizeof(*(array)) )

277/*
278 * ustring.c
279 */
e4ea58f8 280wchar_t *ustrdup(wchar_t const *s);
281char *ustrtoa(wchar_t const *s, char *outbuf, int size, int charset);
282char *ustrtoa_careful(wchar_t const *s, char *outbuf, int size, int charset);
283wchar_t *ustrfroma(char const *s, wchar_t *outbuf, int size, int charset);
284char *utoa_dup(wchar_t const *s, int charset);
285char *utoa_dup_len(wchar_t const *s, int charset, int *len);
286char *utoa_careful_dup(wchar_t const *s, int charset);
287wchar_t *ufroma_dup(char const *s, int charset);
7e976207 288char *utoa_locale_dup(wchar_t const *s);
289wchar_t *ufroma_locale_dup(char const *s);
5dd44dce 290int ustrlen(wchar_t const *s);
d7482997 291wchar_t *uadv(wchar_t *s);
5dd44dce 292wchar_t *ustrcpy(wchar_t *dest, wchar_t const *source);
08e78486 293wchar_t *ustrncpy(wchar_t *dest, wchar_t const *source, int n);
d7482997 294wchar_t utolower(wchar_t);
831da32e 295int uisalpha(wchar_t);
d7482997 296int ustrcmp(wchar_t *lhs, wchar_t *rhs);
78c73085 297int ustricmp(wchar_t const *lhs, wchar_t const *rhs);
298int ustrnicmp(wchar_t const *lhs, wchar_t const *rhs, int maxlen);
dd567011 299int utoi(wchar_t const *);
300double utof(wchar_t const *);
301int utob(wchar_t const *);
d7482997 302int uisdigit(wchar_t);
303wchar_t *ustrlow(wchar_t *s);
c8422236 304wchar_t *ustrftime(const wchar_t *wfmt, const struct tm *timespec);
91f93b94 305int cvt_ok(int charset, const wchar_t *s);
0960a3d8 306int charset_from_ustr(filepos *fpos, const wchar_t *name);
d7482997 307
/*
 * wcwidth.c
 *
 * NOTE(review): presumably these return the display width of a
 * string in the given charset; confirm in wcwidth.c.
 */
int strwid(char const *s, int charset);
int ustrwid(wchar_t const *s, int charset);

/*
 * help.c
 *
 * Informational entry points; each takes no arguments and returns
 * nothing.
 */
void help(void);
void usage(void);
void showversion(void);
void listcharsets(void);

/*
 * licence.c
 */
void licence(void);

/*
 * version.c
 *
 * Declared `extern' so that including this header only declares the
 * object. Without it, every including translation unit would carry
 * its own tentative definition, which fails to link on toolchains
 * that do not merge common symbols. The single definition is expected
 * to live in version.c.
 */
extern const char *const version;

/*
 * misc.c
 */
char *adv(char *s);

/*
 * Opaque stack of void * items. `stack' is itself a pointer type
 * (to struct stackTag), so it is passed by value.
 */
typedef struct stackTag *stack;
stack stk_new(void);
void stk_free(stack);
void stk_push(stack, void *);
void *stk_pop(stack);
void *stk_top(stack);

/*
 * Growable string buffers: rdstring holds wchar_t text, rdstringc
 * holds char text. Each carries a position and a size alongside the
 * text pointer.
 * NOTE(review): presumably `pos' is the current length and `size' the
 * allocated capacity; confirm in misc.c.
 */
typedef struct tagRdstring rdstring;
struct tagRdstring {
    int pos, size;
    wchar_t *text;
};
typedef struct tagRdstringc rdstringc;
struct tagRdstringc {
    int pos, size;
    char *text;
};
extern const rdstring empty_rdstring;
extern const rdstringc empty_rdstringc;
void rdadd(rdstring *rs, wchar_t c);
void rdadds(rdstring *rs, wchar_t const *p);
wchar_t *rdtrim(rdstring *rs);
void rdaddc(rdstringc *rs, char c);
void rdaddsc(rdstringc *rs, char const *p);
char *rdtrimc(rdstringc *rs);

363int compare_wordlists(word *a, word *b);
364
bb9e7835 365void mark_attr_ends(word *words);
d7482997 366
367typedef struct tagWrappedLine wrappedline;
368struct tagWrappedLine {
369 wrappedline *next;
370 word *begin, *end; /* first & last words of line */
371 int nspaces; /* number of whitespaces in line */
372 int shortfall; /* how much shorter than max width */
373};
43341922 374wrappedline *wrap_para(word *, int, int, int (*)(void *, word *), void *, int);
d7482997 375void wrap_free(wrappedline *);
e4ea58f8 376void cmdline_cfg_add(paragraph *cfg, char *string);
377paragraph *cmdline_cfg_new(void);
378paragraph *cmdline_cfg_simple(char *string, ...);
d7482997 379
380/*
381 * input.c
382 */
383paragraph *read_input(input *in, indexdata *idx);
384
385/*
386 * keywords.c
387 */
388struct keywordlist_Tag {
389 int nkeywords;
390 int size;
391 tree234 *keys; /* sorted by `key' field */
392 word **looseends; /* non-keyword list element numbers */
393 int nlooseends;
394 int looseendssize;
395};
396struct keyword_Tag {
397 wchar_t *key; /* the keyword itself */
398 word *text; /* "Chapter 2", "Appendix Q"... */
399 /* (NB: filepos are not set) */
400 paragraph *para; /* the paragraph referenced */
401};
402keyword *kw_lookup(keywordlist *, wchar_t *);
403keywordlist *get_keywords(paragraph *);
404void free_keywords(keywordlist *);
405void subst_keywords(paragraph *, keywordlist *);
406
407/*
408 * index.c
409 */
410
411/*
412 * Data structure to hold both sides of the index.
413 */
414struct indexdata_Tag {
415 tree234 *tags; /* holds type `indextag' */
416 tree234 *entries; /* holds type `indexentry' */
417};
418
419/*
420 * Data structure to hold an index tag (LHS of index).
421 */
422struct indextag_Tag {
423 wchar_t *name;
424 word *implicit_text;
f4551933 425 filepos implicit_fpos;
d7482997 426 word **explicit_texts;
f4551933 427 filepos *explicit_fpos;
d7482997 428 int nexplicit, explicit_size;
429 int nrefs;
430 indexentry **refs; /* array of entries referenced by tag */
431};
432
433/*
434 * Data structure to hold an index entry (RHS of index).
435 */
436struct indexentry_Tag {
437 word *text;
438 void *backend_data; /* private to back end */
f4551933 439 filepos fpos;
d7482997 440};
441
442indexdata *make_index(void);
443void cleanup_index(indexdata *);
444/* index_merge takes responsibility for freeing arg 3 iff implicit; never
445 * takes responsibility for arg 2 */
f4551933 446void index_merge(indexdata *, int is_explicit, wchar_t *, word *, filepos *);
d7482997 447void build_index(indexdata *);
448void index_debug(indexdata *);
449indextag *index_findtag(indexdata *idx, wchar_t *name);
450
451/*
452 * contents.c
453 */
454numberstate *number_init(void);
455void number_cfg(numberstate *, paragraph *);
96f3af16 456word *number_mktext(numberstate *, paragraph *, wchar_t *, int *, int *);
d7482997 457void number_free(numberstate *);
458
459/*
460 * biblio.c
461 */
462void gen_citations(paragraph *, keywordlist *);
463
/*
 * style.c
 *
 * Currently has no members. An empty struct is a compiler extension
 * rather than ISO C; it is left as-is because adding a member would
 * change the type's size.
 */
struct userstyle_Tag {
};

470/*
471 * bk_text.c
472 */
43341922 473void text_backend(paragraph *, keywordlist *, indexdata *, void *);
ba9c1487 474paragraph *text_config_filename(char *filename);
d7482997 475
476/*
78c73085 477 * bk_html.c
d7482997 478 */
78c73085 479void html_backend(paragraph *, keywordlist *, indexdata *, void *);
480paragraph *html_config_filename(char *filename);
d7482997 481
482/*
483 * bk_whlp.c
484 */
43341922 485void whlp_backend(paragraph *, keywordlist *, indexdata *, void *);
ba9c1487 486paragraph *whlp_config_filename(char *filename);
d7482997 487
7136a6c7 488/*
489 * bk_man.c
490 */
43341922 491void man_backend(paragraph *, keywordlist *, indexdata *, void *);
ba9c1487 492paragraph *man_config_filename(char *filename);
7136a6c7 493
5dd44dce 494/*
495 * bk_info.c
496 */
43341922 497void info_backend(paragraph *, keywordlist *, indexdata *, void *);
5dd44dce 498paragraph *info_config_filename(char *filename);
499
43341922 500/*
501 * bk_paper.c
502 */
503void *paper_pre_backend(paragraph *, keywordlist *, indexdata *);
504
505/*
506 * bk_ps.c
507 */
508void ps_backend(paragraph *, keywordlist *, indexdata *, void *);
509paragraph *ps_config_filename(char *filename);
510
511/*
512 * bk_pdf.c
513 */
514void pdf_backend(paragraph *, keywordlist *, indexdata *, void *);
515paragraph *pdf_config_filename(char *filename);
516
d7482997 517#endif