d7482997 |
1 | /* |
2 | * xhtml backend for Halibut |
3 | * (initial implementation by James Aylett) |
4 | * |
5 | * Still to do: |
6 | * |
7 | * +++ doesn't handle non-breaking hyphens. Not sure how to yet. |
8 | * +++ entity names (from a file -- ideally supply normal SGML files) |
9 | * +++ configuration directive to file split where the current layout |
10 | * code wouldn't. Needs changes to _ponder_layout() and _do_paras(), |
11 | * perhaps others. |
12 | * |
13 | * Limitations: |
14 | * |
15 | * +++ biblio/index references target the nearest section marker, rather |
16 | * than having a dedicated target themselves. In large bibliographies |
17 | * this will cause problems. (The solution is to fake up a response |
18 | * from xhtml_find_section(), probably linking it into the sections |
19 | * chain just in case we need it again, and to make freeing it up |
20 | * easier.) docsrc.pl used to work as we do, however, and SGT agrees that |
21 | * this is acceptable for now. |
22 | * +++ can't cope with leaf-level == 0. It's all to do with the |
23 | * top-level file not being normal, probably not even having a valid |
24 | * section level, and stuff like that. I question whether this is an |
25 | * issue, frankly; small manuals that fit on one page should probably |
26 | * not be written in halibut at all. |
27 | */ |
28 | |
29 | #include <stdio.h> |
30 | #include <stdlib.h> |
677e18a2 |
31 | #include <string.h> |
d7482997 |
32 | #include <assert.h> |
33 | #include "halibut.h" |
34 | |
50d6b4bd |
35 | /* |
36 | * FILENAME_TEMPLATE (overridable in config of course) allows you |
37 | * to choose the general form for your HTML file names. It is |
38 | * slightly printf-styled (% followed by a single character is a |
39 | * formatting directive, %% is a literal %). Formatting directives |
40 | * are: |
41 | * |
ba9c1487 |
42 | * - %n is the section type-plus-number, minus whitespace (`Chapter1.2'). |
50d6b4bd |
43 | * - %b is the section number on its own (`1.2'). |
44 | * - %k is the section's _internal_ keyword. |
45 | * - %N is the section's visible title in the output, again minus |
46 | * whitespace. |
47 | * |
48 | * %n, %b and %k will all default to %N if the section is |
49 | * unnumbered (`Bibliography' is often a good example). |
6d6d850c |
50 | * |
51 | * FRAGMENT_TEMPLATE is the same, but defines the <a name="foo"> |
52 | * markers used to cross-reference to particular subsections of a |
53 | * file. |
50d6b4bd |
54 | */ |
55 | |
/*
 * Built-in defaults for the configurable output names. Each one is
 * copied into the configuration by xhtml_configure() and may be
 * replaced by the corresponding \cfg{xhtml-...} directive.
 */
#define FILENAME_SINGLE   "Manual.html"     /* xhtml-single-filename */
#define FILENAME_CONTENTS "Contents.html"   /* xhtml-contents-filename */
#define FILENAME_INDEX    "IndexPage.html"  /* xhtml-index-filename */
#define FILENAME_TEMPLATE "%n.html"         /* xhtml-template-filename */
#define FRAGMENT_TEMPLATE "%b"              /* xhtml-template-fragment */
50d6b4bd |
61 | |
d7482997 |
62 | struct xhtmlsection_Struct { |
63 | struct xhtmlsection_Struct *next; /* next sibling (NULL if split across files) */ |
64 | struct xhtmlsection_Struct *child; /* NULL if split across files */ |
65 | struct xhtmlsection_Struct *parent; /* NULL if split across files */ |
66 | struct xhtmlsection_Struct *chain; /* single structure independent of weird trees */ |
67 | paragraph *para; |
68 | struct xhtmlfile_Struct *file; /* which file is this a part of? */ |
69 | char *fragment; /* fragment id within the file */ |
70 | int level; |
71 | }; |
72 | |
/*
 * One output file. Files form a tree of their own (next / child /
 * parent) which mirrors the document structure down to the leaf level.
 */
struct xhtmlfile_Struct {
    struct xhtmlfile_Struct *next;        /* following sibling file */
    struct xhtmlfile_Struct *child;       /* first file nested below this one */
    struct xhtmlfile_Struct *parent;      /* file this one is nested under */
    char *filename;                       /* name of the file to be written */

    /* Sections held in this file; a non-leaf file has exactly one. */
    struct xhtmlsection_Struct *sections;

    /* Non-zero when this is a leaf file, i.e. it has no child files. */
    int is_leaf;
};
81 | |
/* Short names for the section and file node types. */
typedef struct xhtmlsection_Struct xhtmlsection;
typedef struct xhtmlfile_Struct xhtmlfile;

/*
 * Per-index-entry backend data: a growable array of the sections that
 * an index entry refers to.
 */
typedef struct xhtmlindex_Struct {
    int nsection;                /* number of entries in use */
    int size;                    /* number of entries allocated */
    xhtmlsection **sections;     /* the array itself */
} xhtmlindex;
91 | |
/*
 * How the number part of a heading is rendered for one heading level.
 */
typedef struct {
    int just_numbers;            /* boolean, set from the xhtml-*-numeric directives */
    wchar_t *number_suffix;      /* text placed after the number, e.g. L": " */
} xhtmlheadfmt;
96 | |
97 | typedef struct { |
d7482997 |
98 | int contents_depth[6]; |
99 | int leaf_contains_contents; |
100 | int leaf_level; |
101 | int leaf_smallest_contents; |
102 | int include_version_id; |
103 | wchar_t *author, *description; |
104 | wchar_t *head_end, *body, *body_start, *body_end, *address_start, *address_end, *nav_attrs; |
105 | int suppress_address; |
5d9cc07b |
106 | xhtmlheadfmt fchapter, *fsect; |
107 | int nfsect; |
50d6b4bd |
108 | char *contents_filename, *index_filename; |
6d6d850c |
109 | char *single_filename, *template_filename, *template_fragment; |
d7482997 |
110 | } xhtmlconfig; |
111 | |
112 | /*static void xhtml_level(paragraph *, int); |
113 | static void xhtml_level_0(paragraph *); |
114 | static void xhtml_docontents(FILE *, paragraph *, int); |
115 | static void xhtml_dosections(FILE *, paragraph *, int); |
116 | static void xhtml_dobody(FILE *, paragraph *, int);*/ |
117 | |
118 | static void xhtml_doheader(FILE *, word *); |
119 | static void xhtml_dofooter(FILE *); |
120 | static void xhtml_versionid(FILE *, word *, int); |
121 | |
122 | static void xhtml_utostr(wchar_t *, char **); |
123 | static int xhtml_para_level(paragraph *); |
124 | static int xhtml_reservedchar(int); |
125 | |
4b3c5afb |
126 | static int xhtml_convert(wchar_t *, int, char **, int); |
ce9921d6 |
127 | static void xhtml_rdaddwc(rdstringc *, word *, word *, int); |
128 | static void xhtml_para(FILE *, word *, int); |
d7482997 |
129 | static void xhtml_codepara(FILE *, word *); |
ce9921d6 |
130 | static void xhtml_heading(FILE *, paragraph *, int); |
d7482997 |
131 | |
132 | /* File-global variables are much easier than passing these things |
133 | * all over the place. Evil, but easier. We can replace this with a single |
134 | * structure at some point. |
135 | */ |
136 | static xhtmlconfig conf; |
137 | static keywordlist *keywords; |
138 | static indexdata *idx; |
139 | static xhtmlfile *topfile; |
140 | static xhtmlsection *topsection; |
141 | static paragraph *sourceparas; |
142 | static xhtmlfile *lastfile; |
143 | static xhtmlfile *xhtml_last_file = NULL; |
c8c7926b |
144 | static int last_level=-1, start_level; |
d7482997 |
145 | static xhtmlsection *currentsection; |
146 | |
147 | static xhtmlconfig xhtml_configure(paragraph *source) |
148 | { |
149 | xhtmlconfig ret; |
150 | |
151 | /* |
152 | * Defaults. |
153 | */ |
154 | ret.contents_depth[0] = 2; |
155 | ret.contents_depth[1] = 3; |
156 | ret.contents_depth[2] = 4; |
157 | ret.contents_depth[3] = 5; |
158 | ret.contents_depth[4] = 6; |
159 | ret.contents_depth[5] = 7; |
160 | ret.leaf_level = 2; |
161 | ret.leaf_smallest_contents = 4; |
162 | ret.leaf_contains_contents = FALSE; |
163 | ret.include_version_id = TRUE; |
164 | ret.author = NULL; |
165 | ret.description = NULL; |
166 | ret.head_end = NULL; |
167 | ret.body = NULL; |
168 | ret.body_start = NULL; |
169 | ret.body_end = NULL; |
170 | ret.address_start = NULL; |
171 | ret.address_end = NULL; |
172 | ret.nav_attrs = NULL; |
173 | ret.suppress_address = FALSE; |
174 | |
5d9cc07b |
175 | ret.fchapter.just_numbers = FALSE; |
e5e6bf9d |
176 | ret.fchapter.number_suffix = L": "; |
5d9cc07b |
177 | ret.nfsect = 2; |
178 | ret.fsect = mknewa(xhtmlheadfmt, ret.nfsect); |
179 | ret.fsect[0].just_numbers = FALSE; |
e5e6bf9d |
180 | ret.fsect[0].number_suffix = L": "; |
5d9cc07b |
181 | ret.fsect[1].just_numbers = TRUE; |
e5e6bf9d |
182 | ret.fsect[1].number_suffix = L" "; |
50d6b4bd |
183 | ret.contents_filename = strdup(FILENAME_CONTENTS); |
184 | ret.single_filename = strdup(FILENAME_SINGLE); |
185 | ret.index_filename = strdup(FILENAME_INDEX); |
186 | ret.template_filename = strdup(FILENAME_TEMPLATE); |
6d6d850c |
187 | ret.template_fragment = strdup(FRAGMENT_TEMPLATE); |
5d9cc07b |
188 | |
d7482997 |
189 | for (; source; source = source->next) |
190 | { |
191 | if (source->type == para_Config) |
192 | { |
50d6b4bd |
193 | if (!ustricmp(source->keyword, L"xhtml-contents-filename")) { |
194 | sfree(ret.contents_filename); |
195 | ret.contents_filename = utoa_dup(uadv(source->keyword)); |
196 | } else if (!ustricmp(source->keyword, L"xhtml-single-filename")) { |
197 | sfree(ret.single_filename); |
198 | ret.single_filename = utoa_dup(uadv(source->keyword)); |
199 | } else if (!ustricmp(source->keyword, L"xhtml-index-filename")) { |
200 | sfree(ret.index_filename); |
201 | ret.index_filename = utoa_dup(uadv(source->keyword)); |
202 | } else if (!ustricmp(source->keyword, L"xhtml-template-filename")) { |
203 | sfree(ret.template_filename); |
204 | ret.template_filename = utoa_dup(uadv(source->keyword)); |
6d6d850c |
205 | } else if (!ustricmp(source->keyword, L"xhtml-template-fragment")) { |
206 | sfree(ret.template_fragment); |
207 | ret.template_fragment = utoa_dup(uadv(source->keyword)); |
50d6b4bd |
208 | } else if (!ustricmp(source->keyword, L"xhtml-contents-depth-0")) { |
d7482997 |
209 | ret.contents_depth[0] = utoi(uadv(source->keyword)); |
210 | } else if (!ustricmp(source->keyword, L"xhtml-contents-depth-1")) { |
211 | ret.contents_depth[1] = utoi(uadv(source->keyword)); |
212 | } else if (!ustricmp(source->keyword, L"xhtml-contents-depth-2")) { |
213 | ret.contents_depth[2] = utoi(uadv(source->keyword)); |
214 | } else if (!ustricmp(source->keyword, L"xhtml-contents-depth-3")) { |
215 | ret.contents_depth[3] = utoi(uadv(source->keyword)); |
216 | } else if (!ustricmp(source->keyword, L"xhtml-contents-depth-4")) { |
217 | ret.contents_depth[4] = utoi(uadv(source->keyword)); |
218 | } else if (!ustricmp(source->keyword, L"xhtml-contents-depth-5")) { |
219 | ret.contents_depth[5] = utoi(uadv(source->keyword)); |
220 | } else if (!ustricmp(source->keyword, L"xhtml-leaf-level")) { |
221 | ret.leaf_level = utoi(uadv(source->keyword)); |
d7482997 |
222 | } else if (!ustricmp(source->keyword, L"xhtml-leaf-smallest-contents")) { |
223 | ret.leaf_smallest_contents = utoi(uadv(source->keyword)); |
224 | } else if (!ustricmp(source->keyword, L"xhtml-versionid")) { |
225 | ret.include_version_id = utob(uadv(source->keyword)); |
226 | } else if (!ustricmp(source->keyword, L"xhtml-leaf-contains-contents")) { |
227 | ret.leaf_contains_contents = utob(uadv(source->keyword)); |
228 | } else if (!ustricmp(source->keyword, L"xhtml-suppress-address")) { |
229 | ret.suppress_address = utob(uadv(source->keyword)); |
230 | } else if (!ustricmp(source->keyword, L"xhtml-author")) { |
231 | ret.author = uadv(source->keyword); |
232 | } else if (!ustricmp(source->keyword, L"xhtml-description")) { |
233 | ret.description = uadv(source->keyword); |
234 | } else if (!ustricmp(source->keyword, L"xhtml-head-end")) { |
235 | ret.head_end = uadv(source->keyword); |
236 | } else if (!ustricmp(source->keyword, L"xhtml-body-start")) { |
237 | ret.body_start = uadv(source->keyword); |
238 | } else if (!ustricmp(source->keyword, L"xhtml-body-tag")) { |
239 | ret.body = uadv(source->keyword); |
240 | } else if (!ustricmp(source->keyword, L"xhtml-body-end")) { |
241 | ret.body_end = uadv(source->keyword); |
242 | } else if (!ustricmp(source->keyword, L"xhtml-address-start")) { |
243 | ret.address_start = uadv(source->keyword); |
244 | } else if (!ustricmp(source->keyword, L"xhtml-address-end")) { |
245 | ret.address_end = uadv(source->keyword); |
246 | } else if (!ustricmp(source->keyword, L"xhtml-navigation-attributes")) { |
247 | ret.nav_attrs = uadv(source->keyword); |
5d9cc07b |
248 | } else if (!ustricmp(source->keyword, L"xhtml-chapter-numeric")) { |
249 | ret.fchapter.just_numbers = utob(uadv(source->keyword)); |
250 | } else if (!ustricmp(source->keyword, L"xhtml-chapter-suffix")) { |
e5e6bf9d |
251 | ret.fchapter.number_suffix = uadv(source->keyword); |
5d9cc07b |
252 | } else if (!ustricmp(source->keyword, L"xhtml-section-numeric")) { |
253 | wchar_t *p = uadv(source->keyword); |
254 | int n = 0; |
255 | if (uisdigit(*p)) { |
256 | n = utoi(p); |
257 | p = uadv(p); |
258 | } |
259 | if (n >= ret.nfsect) { |
260 | int i; |
261 | ret.fsect = resize(ret.fsect, n+1); |
262 | for (i = ret.nfsect; i <= n; i++) |
263 | ret.fsect[i] = ret.fsect[ret.nfsect-1]; |
264 | ret.nfsect = n+1; |
265 | } |
266 | ret.fsect[n].just_numbers = utob(p); |
267 | } else if (!ustricmp(source->keyword, L"xhtml-section-suffix")) { |
268 | wchar_t *p = uadv(source->keyword); |
269 | int n = 0; |
270 | if (uisdigit(*p)) { |
271 | n = utoi(p); |
272 | p = uadv(p); |
273 | } |
274 | if (n >= ret.nfsect) { |
275 | int i; |
276 | ret.fsect = resize(ret.fsect, n+1); |
277 | for (i = ret.nfsect; i <= n; i++) |
278 | ret.fsect[i] = ret.fsect[ret.nfsect-1]; |
279 | ret.nfsect = n+1; |
280 | } |
e5e6bf9d |
281 | ret.fsect[n].number_suffix = p; |
d7482997 |
282 | } |
283 | } |
284 | } |
285 | |
286 | /* printf(" !!! leaf_level = %i\n", ret.leaf_level); |
287 | printf(" !!! contentdepth-0 = %i\n", ret.contents_depth[0]); |
288 | printf(" !!! contentdepth-1 = %i\n", ret.contents_depth[1]); |
289 | printf(" !!! contentdepth-2 = %i\n", ret.contents_depth[2]); |
290 | printf(" !!! contentdepth-3 = %i\n", ret.contents_depth[3]); |
291 | printf(" !!! contentdepth-4 = %i\n", ret.contents_depth[4]); |
292 | printf(" !!! contentdepth-5 = %i\n", ret.contents_depth[5]); |
293 | printf(" !!! leaf_contains_contents = %i\n", ret.leaf_contains_contents);*/ |
294 | return ret; |
295 | } |
296 | |
ba9c1487 |
297 | paragraph *xhtml_config_filename(char *filename) |
298 | { |
299 | /* |
300 | * If the user passes in a single filename as a parameter to |
301 | * the `--html' command-line option, then we should assume it |
302 | * to imply _two_ config directives: |
303 | * \cfg{xhtml-single-filename}{whatever} and |
304 | * \cfg{xhtml-leaf-level}{0}; the rationale being that the user |
305 | * wants their output _in that file_. |
306 | */ |
307 | |
308 | paragraph *p[2]; |
309 | int i, len; |
310 | wchar_t *ufilename, *up; |
311 | |
312 | for (i = 0; i < 2; i++) { |
313 | p[i] = mknew(paragraph); |
314 | memset(p[i], 0, sizeof(*p[i])); |
315 | p[i]->type = para_Config; |
316 | p[i]->next = NULL; |
317 | p[i]->fpos.filename = "<command line>"; |
318 | p[i]->fpos.line = p[i]->fpos.col = -1; |
319 | } |
320 | |
321 | ufilename = ufroma_dup(filename); |
322 | len = ustrlen(ufilename) + 2 + lenof(L"xhtml-single-filename"); |
323 | p[0]->keyword = mknewa(wchar_t, len); |
324 | up = p[0]->keyword; |
325 | ustrcpy(up, L"xhtml-single-filename"); |
326 | up = uadv(up); |
327 | ustrcpy(up, ufilename); |
328 | up = uadv(up); |
329 | *up = L'\0'; |
330 | assert(up - p[0]->keyword < len); |
331 | sfree(ufilename); |
332 | |
333 | len = lenof(L"xhtml-leaf-level") + lenof(L"0") + 1; |
334 | p[1]->keyword = mknewa(wchar_t, len); |
335 | up = p[1]->keyword; |
336 | ustrcpy(up, L"xhtml-leaf-level"); |
337 | up = uadv(up); |
338 | ustrcpy(up, L"0"); |
339 | up = uadv(up); |
340 | *up = L'\0'; |
341 | assert(up - p[1]->keyword < len); |
342 | |
343 | p[0]->next = p[1]; |
344 | |
345 | return p[0]; |
346 | } |
347 | |
d7482997 |
348 | static xhtmlsection *xhtml_new_section(xhtmlsection *last) |
349 | { |
350 | xhtmlsection *ret = mknew(xhtmlsection); |
351 | ret->next=NULL; |
352 | ret->child=NULL; |
353 | ret->parent=NULL; |
354 | ret->chain=last; |
355 | ret->para=NULL; |
356 | ret->file=NULL; |
357 | ret->fragment=NULL; |
358 | ret->level=-1; /* marker: end of chain */ |
359 | return ret; |
360 | } |
361 | |
362 | /* Returns NULL or the section that marks that paragraph */ |
363 | static xhtmlsection *xhtml_find_section(paragraph *p) |
364 | { |
365 | xhtmlsection *ret = topsection; |
366 | if (xhtml_para_level(p)==-1) { /* first, we back-track to a section paragraph */ |
367 | paragraph *p2 = sourceparas; |
368 | paragraph *p3 = NULL; |
369 | while (p2 && p2!=p) { |
370 | if (xhtml_para_level(p2)!=-1) { |
371 | p3 = p2; |
372 | } |
373 | p2=p2->next; |
374 | } |
375 | if (p3==NULL) { /* for some reason, we couldn't find a section before this paragraph ... ? */ |
376 | /* Note that this can happen, if you have a cross-reference to before the first chapter starts. |
377 | * So don't do that, then. |
378 | */ |
379 | return NULL; |
380 | } |
381 | p=p3; |
382 | } |
383 | while (ret && ret->para != p) { |
384 | /* printf(" xhtml_find_section(): checking %s for para @ %p\n", ret->fragment, p);*/ |
385 | ret=ret->chain; |
386 | } |
387 | return ret; |
388 | } |
389 | |
6d6d850c |
390 | static void xhtml_format(paragraph *p, char *template_string, rdstringc *r) |
391 | { |
392 | char *c, *t; |
393 | word *w; |
394 | wchar_t *ws; |
395 | |
396 | t = template_string; |
397 | while (*t) { |
398 | if (*t == '%' && t[1]) { |
399 | int fmt; |
400 | |
401 | t++; |
402 | fmt = *t++; |
403 | |
404 | if (fmt == '%') { |
405 | rdaddc(r, fmt); |
406 | continue; |
407 | } |
408 | |
409 | w = NULL; |
410 | ws = NULL; |
411 | |
412 | if (p->kwtext && fmt == 'n') |
413 | w = p->kwtext; |
414 | else if (p->kwtext2 && fmt == 'b') |
415 | w = p->kwtext2; |
416 | else if (p->keyword && *p->keyword && fmt == 'k') |
417 | ws = p->keyword; |
418 | else |
419 | w = p->words; |
420 | |
421 | while (w) { |
422 | switch (removeattr(w->type)) |
423 | { |
424 | case word_Normal: |
425 | /*case word_Emph: |
426 | case word_Code: |
427 | case word_WeakCode:*/ |
428 | xhtml_utostr(w->text, &c); |
429 | rdaddsc(r,c); |
430 | sfree(c); |
431 | break; |
432 | } |
433 | w = w->next; |
434 | } |
435 | if (ws) { |
436 | xhtml_utostr(ws, &c); |
437 | rdaddsc(r,c); |
438 | sfree(c); |
439 | } |
440 | } else { |
441 | rdaddc(r, *t++); |
442 | } |
443 | } |
444 | } |
445 | |
d7482997 |
446 | static xhtmlfile *xhtml_new_file(xhtmlsection *sect) |
447 | { |
448 | xhtmlfile *ret = mknew(xhtmlfile); |
449 | |
450 | ret->next=NULL; |
451 | ret->child=NULL; |
452 | ret->parent=NULL; |
453 | ret->filename=NULL; |
454 | ret->sections=sect; |
455 | ret->is_leaf=(sect!=NULL && sect->level==conf.leaf_level); |
456 | if (sect==NULL) { |
457 | if (conf.leaf_level==0) { /* currently unused */ |
50d6b4bd |
458 | ret->filename = smalloc(strlen(conf.single_filename)+1); |
459 | sprintf(ret->filename, conf.single_filename); |
d7482997 |
460 | } else { |
50d6b4bd |
461 | ret->filename = smalloc(strlen(conf.contents_filename)+1); |
462 | sprintf(ret->filename, conf.contents_filename); |
d7482997 |
463 | } |
464 | } else { |
465 | paragraph *p = sect->para; |
466 | rdstringc fname_c = { 0, 0, NULL }; |
6d6d850c |
467 | xhtml_format(p, conf.template_filename, &fname_c); |
d7482997 |
468 | ret->filename = rdtrimc(&fname_c); |
469 | } |
470 | /* printf(" ! new file '%s', is_leaf == %s\n", ret->filename, (ret->is_leaf)?("true"):("false"));*/ |
471 | return ret; |
472 | } |
473 | |
474 | /* |
475 | * Walk the tree fixing up files which are actually leaf (ie |
476 | * have no children) but aren't at leaf level, so they have the |
477 | * leaf flag set. |
478 | */ |
479 | void xhtml_fixup_layout(xhtmlfile* file) |
480 | { |
481 | if (file->child==NULL) { |
482 | file->is_leaf = TRUE; |
483 | } else { |
484 | xhtml_fixup_layout(file->child); |
485 | } |
486 | if (file->next) |
487 | xhtml_fixup_layout(file->next); |
488 | } |
489 | |
490 | /* |
491 | * Create the tree structure so we know where everything goes. |
492 | * Method: |
493 | * |
494 | * Ignoring file splitting, we have three choices with each new section: |
495 | * |
496 | * +-----------------+-----------------+ |
497 | * | | | |
498 | * X +----X----+ (1) |
499 | * | | |
5d9cc07b |
500 | * Y (2) |
d7482997 |
501 | * | |
502 | * (3) |
503 | * |
504 | * Y is the last section we added (currentsect). |
505 | * If sect is the section we want to add, then: |
506 | * |
507 | * (1) if sect->level < currentsect->level |
508 | * (2) if sect->level == currentsect->level |
509 | * (3) if sect->level > currentsect->level |
510 | * |
511 | * This requires the constraint that you never skip section numbers |
512 | * (so you can't have a.b.c.d without all of a, a.b and a.b.c existing). |
513 | * |
514 | * Note that you _can_ have 1.1.1.1 followed by 1.2 - you can change |
515 | * more than one level at a time. Lots of asserts, and probably part of |
516 | * the algorithm here, rely on this being true. (It currently isn't |
517 | * enforced by halibut, however.) |
518 | * |
519 | * File splitting makes this harder. For instance, say we added at (3) |
520 | * above and now need to add another section. We are splitting at level |
521 | * 2, ie the level of Y. Z is the last section we added: |
522 | * |
523 | * +-----------------+-----------------+ |
524 | * | | | |
525 | * X +----X----+ (1) |
526 | * | | |
527 | * +----Y----+ (1) |
528 | * | | |
529 | * Z (2) |
530 | * | |
531 | * (3) |
532 | * |
533 | * The (1) case is now split; we need to search upwards to find where |
534 | * to actually link in. The other two cases remain the same (and will |
535 | * always be like this). |
536 | * |
537 | * File splitting complicates the linking, but the decision of |
538 | * whether to split to a new file always rests on the same condition |
539 | * (is the level of this section higher than the leaf_level |
540 | * configuration value or not). |
541 | * |
542 | * Treating the cases backwards: |
543 | * |
544 | * (3) same file if sect->level > conf.leaf_level, otherwise new file |
545 | * |
546 | * if in the same file, currentsect->child points to sect |
547 | * otherwise the linking is done through the file tree (which works |
548 | * in more or less the same way, ie currentfile->child points to |
549 | * the new file) |
550 | * |
551 | * (2) same file if sect->level > conf.leaf_level, otherwise new file |
552 | * |
553 | * if in the same file, currentsect->next points to sect |
554 | * otherwise file linking and currentfile->next points to the new |
555 | * file (we know that Z must have caused a new file to be created) |
556 | * |
557 | * (1) same file if sect->level > conf.leaf_level, otherwise new file |
558 | * |
559 | * this is actually effectively the same case as (2) here, |
560 | * except that we first have to travel up the sections to figure |
561 | * out which section this new one will be a sibling of. In doing |
562 | * so, we may disappear off the top of a file and have to go up |
563 | * to its parent in the file tree. |
564 | * |
565 | */ |
566 | static void xhtml_ponder_layout(paragraph *p) |
567 | { |
568 | xhtmlsection *lastsection; |
569 | xhtmlsection *currentsect; |
570 | xhtmlfile *currentfile; |
571 | |
572 | lastfile = NULL; |
573 | topsection = xhtml_new_section(NULL); |
574 | topfile = xhtml_new_file(NULL); |
575 | lastsection = topsection; |
576 | currentfile = topfile; |
577 | currentsect = topsection; |
578 | |
d2e74722 |
579 | if (conf.leaf_level == 0) { |
580 | topfile->is_leaf = 1; |
581 | topfile->sections = topsection; |
582 | topsection->file = topfile; |
583 | } |
584 | |
d7482997 |
585 | for (; p; p=p->next) |
586 | { |
587 | int level = xhtml_para_level(p); |
588 | if (level>0) /* actually a section */ |
589 | { |
590 | xhtmlsection *sect; |
6d6d850c |
591 | rdstringc frag_c = { 0, 0, NULL }; |
d7482997 |
592 | |
593 | sect = xhtml_new_section(lastsection); |
594 | lastsection = sect; |
595 | sect->para = p; |
6d6d850c |
596 | |
597 | xhtml_format(p, conf.template_fragment, &frag_c); |
598 | sect->fragment = rdtrimc(&frag_c); |
d7482997 |
599 | sect->level = level; |
600 | /* printf(" ! adding para @ %p as sect %s, level %i\n", sect->para, sect->fragment, level);*/ |
601 | |
602 | if (level>currentsect->level) { /* case (3) */ |
603 | if (level>conf.leaf_level) { /* same file */ |
604 | assert(currentfile->is_leaf); |
605 | currentsect->child = sect; |
606 | sect->parent=currentsect; |
607 | sect->file=currentfile; |
608 | /* printf("connected '%s' to existing file '%s' [I]\n", sect->fragment, currentfile->filename);*/ |
609 | currentsect=sect; |
610 | } else { /* new file */ |
611 | xhtmlfile *file = xhtml_new_file(sect); |
612 | assert(!currentfile->is_leaf); |
613 | currentfile->child=file; |
614 | sect->file=file; |
615 | file->parent=currentfile; |
616 | /* printf("connected '%s' to new file '%s' [I]\n", sect->fragment, file->filename);*/ |
617 | currentfile=file; |
618 | currentsect=sect; |
619 | } |
620 | } else if (level >= currentsect->file->sections->level) { |
621 | /* Case (1) or (2) *AND* still under the section that starts |
622 | * the current file. |
623 | * |
624 | * I'm not convinced that this couldn't be rolled in with the |
625 | * final else {} leg further down. It seems a lot of effort |
626 | * this way. |
627 | */ |
628 | if (level>conf.leaf_level) { /* stick within the same file */ |
629 | assert(currentfile->is_leaf); |
630 | sect->file = currentfile; |
631 | while (currentsect && currentsect->level > level && |
632 | currentsect->file==currentsect->parent->file) { |
633 | currentsect = currentsect->parent; |
634 | } |
635 | assert(currentsect); |
636 | currentsect->next = sect; |
637 | assert(currentsect->level == sect->level); |
638 | sect->parent = currentsect->parent; |
639 | currentsect = sect; |
640 | /* printf("connected '%s' to existing file '%s' [II]\n", sect->fragment, currentfile->filename);*/ |
641 | } else { /* new file */ |
642 | xhtmlfile *file = xhtml_new_file(sect); |
643 | sect->file=file; |
644 | currentfile->next=file; |
645 | file->parent=currentfile->parent; |
646 | file->is_leaf=(level==conf.leaf_level); |
647 | file->sections=sect; |
648 | /* printf("connected '%s' to new file '%s' [II]\n", sect->fragment, file->filename);*/ |
649 | currentfile=file; |
650 | currentsect=sect; |
651 | } |
652 | } else { /* Case (1) or (2) and we must move up the file tree first */ |
653 | /* this loop is now probably irrelevant - we know we can't connect |
654 | * to anything in the current file */ |
655 | while (currentsect && level<currentsect->level) { |
656 | currentsect=currentsect->parent; |
657 | if (currentsect) { |
658 | /* printf(" * up one level to '%s'\n", currentsect->fragment);*/ |
659 | } else { |
660 | /* printf(" * up one level (off top of current file)\n");*/ |
661 | } |
662 | } |
663 | if (currentsect) { |
664 | /* I'm pretty sure this can now never fire */ |
665 | assert(currentfile->is_leaf); |
666 | /* printf("connected '%s' to existing file '%s' [III]\n", sect->fragment, currentfile->filename);*/ |
667 | sect->file = currentfile; |
668 | currentsect->next=sect; |
669 | currentsect=sect; |
670 | } else { /* find a file we can attach to */ |
671 | while (currentfile && currentfile->sections && level<currentfile->sections->level) { |
672 | currentfile=currentfile->parent; |
673 | if (currentfile) { |
674 | /* printf(" * up one file level to '%s'\n", currentfile->filename);*/ |
675 | } else { |
676 | /* printf(" * up one file level (off top of tree)\n");*/ |
677 | } |
678 | } |
679 | if (currentfile) { /* new file (we had to skip up a file to |
680 | get here, so we must be dealing with a |
681 | level no lower than the configured |
682 | leaf_level */ |
683 | xhtmlfile *file = xhtml_new_file(sect); |
684 | currentfile->next=file; |
685 | sect->file=file; |
686 | file->parent=currentfile->parent; |
687 | file->is_leaf=(level==conf.leaf_level); |
688 | file->sections=sect; |
689 | /* printf("connected '%s' to new file '%s' [III]\n", sect->fragment, file->filename);*/ |
690 | currentfile=file; |
691 | currentsect=sect; |
692 | } else { |
693 | fatal(err_whatever, "Ran off the top trying to connect sibling: strange document."); |
694 | } |
695 | } |
696 | } |
697 | } |
698 | } |
699 | topsection = lastsection; /* get correct end of the chain */ |
700 | xhtml_fixup_layout(topfile); /* leaf files not at leaf level marked as such */ |
701 | } |
702 | |
703 | static void xhtml_do_index(); |
704 | static void xhtml_do_file(xhtmlfile *file); |
705 | static void xhtml_do_top_file(xhtmlfile *file, paragraph *sourceform); |
ce9921d6 |
706 | static void xhtml_do_paras(FILE *fp, paragraph *p, paragraph *end, int indexable); |
d7482997 |
707 | static int xhtml_do_contents_limit(FILE *fp, xhtmlfile *file, int limit); |
708 | static int xhtml_do_contents_section_limit(FILE *fp, xhtmlsection *section, int limit); |
709 | static int xhtml_add_contents_entry(FILE *fp, xhtmlsection *section, int limit); |
710 | static int xhtml_do_contents(FILE *fp, xhtmlfile *file); |
711 | static int xhtml_do_naked_contents(FILE *fp, xhtmlfile *file); |
712 | static void xhtml_do_sections(FILE *fp, xhtmlsection *sections); |
713 | |
714 | /* |
715 | * Do all the files in this structure. |
716 | */ |
717 | static void xhtml_do_files(xhtmlfile *file) |
718 | { |
719 | xhtml_do_file(file); |
720 | if (file->child) |
721 | xhtml_do_files(file->child); |
722 | if (file->next) |
723 | xhtml_do_files(file->next); |
724 | } |
725 | |
726 | /* |
727 | * Free up all memory used by the file tree from 'xfile' downwards |
728 | */ |
729 | static void xhtml_free_file(xhtmlfile* xfile) |
730 | { |
731 | if (xfile==NULL) { |
732 | return; |
733 | } |
734 | |
735 | if (xfile->filename) { |
736 | sfree(xfile->filename); |
737 | } |
738 | xhtml_free_file(xfile->child); |
739 | xhtml_free_file(xfile->next); |
740 | sfree(xfile); |
741 | } |
742 | |
743 | /* |
744 | * Main function. |
745 | */ |
746 | void xhtml_backend(paragraph *sourceform, keywordlist *in_keywords, |
43341922 |
747 | indexdata *in_idx, void *unused) |
d7482997 |
748 | { |
749 | /* int i;*/ |
750 | indexentry *ientry; |
751 | int ti; |
752 | xhtmlsection *xsect; |
753 | |
43341922 |
754 | IGNORE(unused); |
755 | |
d7482997 |
756 | sourceparas = sourceform; |
757 | conf = xhtml_configure(sourceform); |
758 | keywords = in_keywords; |
759 | idx = in_idx; |
760 | |
761 | /* Clear up the index entries backend data pointers */ |
762 | for (ti=0; (ientry = (indexentry *)index234(idx->entries, ti))!=NULL; ti++) { |
763 | ientry->backend_data=NULL; |
764 | } |
765 | |
766 | xhtml_ponder_layout(sourceform); |
767 | |
768 | /* old system ... (writes to *.alt, but gets some stuff wrong and is ugly) */ |
769 | /* xhtml_level_0(sourceform); |
770 | for (i=1; i<=conf.leaf_level; i++) |
771 | { |
772 | xhtml_level(sourceform, i); |
773 | }*/ |
774 | |
775 | /* new system ... (writes to *.html, but isn't fully trusted) */ |
776 | xhtml_do_top_file(topfile, sourceform); |
777 | assert(!topfile->next); /* shouldn't have a sibling at all */ |
d2e74722 |
778 | if (topfile->child) { |
779 | xhtml_do_files(topfile->child); |
780 | xhtml_do_index(); |
781 | } |
d7482997 |
782 | |
783 | /* release file, section, index data structures */ |
784 | xsect = topsection; |
785 | while (xsect) { |
786 | xhtmlsection *tmp = xsect->chain; |
787 | if (xsect->fragment) { |
788 | sfree(xsect->fragment); |
789 | } |
790 | sfree(xsect); |
791 | xsect = tmp; |
792 | } |
793 | xhtml_free_file(topfile); |
794 | for (ti = 0; (ientry=(indexentry *)index234(idx->entries, ti))!=NULL; ti++) { |
795 | if (ientry->backend_data!=NULL) { |
796 | xhtmlindex *xi = (xhtmlindex*) ientry->backend_data; |
797 | if (xi->sections!=NULL) { |
798 | sfree(xi->sections); |
799 | } |
800 | sfree(xi); |
801 | } |
802 | ientry->backend_data = NULL; |
803 | } |
e5e6bf9d |
804 | sfree(conf.fsect); |
d7482997 |
805 | } |
806 | |
807 | static int xhtml_para_level(paragraph *p) |
808 | { |
809 | switch (p->type) |
810 | { |
d9d3dd95 |
811 | case para_Title: |
812 | return 0; |
813 | break; |
d7482997 |
814 | case para_UnnumberedChapter: |
815 | case para_Chapter: |
816 | case para_Appendix: |
817 | return 1; |
818 | break; |
819 | /* case para_BiblioCited: |
820 | return 2; |
821 | break;*/ |
822 | case para_Heading: |
823 | case para_Subsect: |
824 | return p->aux+2; |
825 | break; |
826 | default: |
827 | return -1; |
828 | break; |
829 | } |
830 | } |
831 | |
d7482997 |
832 | /* Output the nav links for the current file. |
833 | * file == NULL means we're doing the index |
834 | */ |
835 | static void xhtml_donavlinks(FILE *fp, xhtmlfile *file) |
836 | { |
837 | xhtmlfile *xhtml_next_file = NULL; |
838 | fprintf(fp, "<p"); |
839 | if (conf.nav_attrs!=NULL) { |
840 | fprintf(fp, " %ls>", conf.nav_attrs); |
841 | } else { |
842 | fprintf(fp, ">"); |
843 | } |
844 | if (xhtml_last_file==NULL) { |
845 | fprintf(fp, "Previous | "); |
846 | } else { |
503e4ab0 |
847 | fprintf(fp, "<a href=\"%s\">Previous</a> | ", xhtml_last_file->filename); |
d7482997 |
848 | } |
503e4ab0 |
849 | fprintf(fp, "<a href=\"%s\">Contents</a> | ", conf.contents_filename); |
25acf71d |
850 | if (file == NULL) { |
851 | fprintf(fp, "Index | "); |
852 | } else { |
503e4ab0 |
853 | fprintf(fp, "<a href=\"%s\">Index</a> | ", conf.index_filename); |
25acf71d |
854 | } |
d7482997 |
855 | if (file != NULL) { /* otherwise we're doing nav links for the index */ |
856 | if (xhtml_next_file==NULL) |
857 | xhtml_next_file = file->child; |
858 | if (xhtml_next_file==NULL) |
859 | xhtml_next_file = file->next; |
860 | if (xhtml_next_file==NULL) |
861 | xhtml_next_file = file->parent->next; |
862 | } |
863 | if (xhtml_next_file==NULL) { |
864 | if (file==NULL) { /* index, so no next file */ |
865 | fprintf(fp, "Next "); |
866 | } else { |
503e4ab0 |
867 | fprintf(fp, "<a href=\"%s\">Next</a>", conf.index_filename); |
d7482997 |
868 | } |
869 | } else { |
503e4ab0 |
870 | fprintf(fp, "<a href=\"%s\">Next</a>", xhtml_next_file->filename); |
d7482997 |
871 | } |
872 | fprintf(fp, "</p>\n"); |
873 | } |
874 | |
875 | /* Write out the index file */ |
d2e74722 |
876 | static void xhtml_do_index_body(FILE *fp) |
d7482997 |
877 | { |
d7482997 |
878 | indexentry *y; |
879 | int ti; |
d7482997 |
880 | |
d2e74722 |
881 | if (count234(idx->entries) == 0) |
882 | return; /* don't write anything at all */ |
d7482997 |
883 | |
884 | fprintf(fp, "<dl>\n"); |
885 | /* iterate over idx->entries using the tree functions and display everything */ |
886 | for (ti = 0; (y = (indexentry *)index234(idx->entries, ti)) != NULL; ti++) { |
887 | if (y->backend_data) { |
888 | int i; |
889 | xhtmlindex *xi; |
890 | |
891 | fprintf(fp, "<dt>"); |
ce9921d6 |
892 | xhtml_para(fp, y->text, FALSE); |
d7482997 |
893 | fprintf(fp, "</dt>\n<dd>"); |
894 | |
895 | xi = (xhtmlindex*) y->backend_data; |
896 | for (i=0; i<xi->nsection; i++) { |
897 | xhtmlsection *sect = xi->sections[i]; |
898 | if (sect) { |
503e4ab0 |
899 | fprintf(fp, "<a href=\"%s#%s\">", sect->file->filename, sect->fragment); |
d7482997 |
900 | if (sect->para->kwtext) { |
ce9921d6 |
901 | xhtml_para(fp, sect->para->kwtext, FALSE); |
d7482997 |
902 | } else if (sect->para->words) { |
ce9921d6 |
903 | xhtml_para(fp, sect->para->words, FALSE); |
d7482997 |
904 | } |
905 | fprintf(fp, "</a>"); |
906 | if (i+1<xi->nsection) { |
907 | fprintf(fp, ", "); |
908 | } |
909 | } |
910 | } |
911 | fprintf(fp, "</dd>\n"); |
912 | } |
913 | } |
914 | fprintf(fp, "</dl>\n"); |
d2e74722 |
915 | } |
916 | static void xhtml_do_index() |
917 | { |
5dd44dce |
918 | word temp_word = { NULL, NULL, word_Normal, 0, 0, L"Index", |
919 | { NULL, 0, 0}, NULL }; |
50d6b4bd |
920 | FILE *fp = fopen(conf.index_filename, "w"); |
d2e74722 |
921 | |
922 | if (fp==NULL) |
50d6b4bd |
923 | fatal(err_cantopenw, conf.index_filename); |
d2e74722 |
924 | xhtml_doheader(fp, &temp_word); |
925 | xhtml_donavlinks(fp, NULL); |
926 | |
927 | xhtml_do_index_body(fp); |
d7482997 |
928 | |
929 | xhtml_donavlinks(fp, NULL); |
930 | xhtml_dofooter(fp); |
931 | fclose(fp); |
932 | } |
933 | |
934 | /* Output the given file. This includes whatever contents at beginning and end, etc. etc. */ |
935 | static void xhtml_do_file(xhtmlfile *file) |
936 | { |
937 | FILE *fp = fopen(file->filename, "w"); |
938 | if (fp==NULL) |
939 | fatal(err_cantopenw, file->filename); |
940 | |
941 | if (file->sections->para->words) { |
942 | xhtml_doheader(fp, file->sections->para->words); |
943 | } else if (file->sections->para->kwtext) { |
944 | xhtml_doheader(fp, file->sections->para->kwtext); |
945 | } else { |
946 | xhtml_doheader(fp, NULL); |
947 | } |
948 | |
949 | xhtml_donavlinks(fp, file); |
950 | |
d2e74722 |
951 | if (file->is_leaf && conf.leaf_contains_contents && |
952 | xhtml_do_contents(NULL, file)>=conf.leaf_smallest_contents) |
d7482997 |
953 | xhtml_do_contents(fp, file); |
954 | xhtml_do_sections(fp, file->sections); |
955 | if (!file->is_leaf) |
956 | xhtml_do_naked_contents(fp, file); |
957 | |
958 | xhtml_donavlinks(fp, file); |
959 | |
960 | xhtml_dofooter(fp); |
961 | fclose(fp); |
962 | |
963 | xhtml_last_file = file; |
964 | } |
965 | |
966 | /* Output the top-level file. */ |
967 | static void xhtml_do_top_file(xhtmlfile *file, paragraph *sourceform) |
968 | { |
969 | paragraph *p; |
970 | int done=FALSE; |
971 | FILE *fp = fopen(file->filename, "w"); |
972 | if (fp==NULL) |
973 | fatal(err_cantopenw, file->filename); |
974 | |
975 | /* Do the title -- only one allowed */ |
976 | for (p = sourceform; p && !done; p = p->next) |
977 | { |
978 | if (p->type == para_Title) |
979 | { |
980 | xhtml_doheader(fp, p->words); |
981 | done=TRUE; |
982 | } |
983 | } |
984 | if (!done) |
985 | xhtml_doheader(fp, NULL /* Eek! */); |
986 | |
d2e74722 |
987 | /* |
988 | * Display the title. |
989 | */ |
990 | for (p = sourceform; p; p = p->next) |
991 | { |
992 | if (p->type == para_Title) { |
ce9921d6 |
993 | xhtml_heading(fp, p, FALSE); |
d2e74722 |
994 | break; |
995 | } |
996 | } |
997 | |
9057a0a8 |
998 | /* Do the preamble */ |
d7482997 |
999 | for (p = sourceform; p; p = p->next) |
1000 | { |
8902e0ed |
1001 | if (p->type == para_Chapter || p->type == para_Heading || |
1002 | p->type == para_Subsect || p->type == para_Appendix || |
1003 | p->type == para_UnnumberedChapter) { |
1004 | /* |
1005 | * We've found the end of the preamble. Do every normal |
1006 | * paragraph up to there. |
1007 | */ |
ce9921d6 |
1008 | xhtml_do_paras(fp, sourceform, p, FALSE); |
8902e0ed |
1009 | break; |
d7482997 |
1010 | } |
1011 | } |
d7482997 |
1012 | |
1013 | xhtml_do_contents(fp, file); |
1014 | xhtml_do_sections(fp, file->sections); |
d2e74722 |
1015 | |
5d9cc07b |
1016 | /* |
1017 | * Put the index in the top file if we're in single-file mode |
1018 | * (leaf-level 0). |
1019 | */ |
1020 | if (conf.leaf_level == 0 && count234(idx->entries) > 0) { |
d2e74722 |
1021 | fprintf(fp, "<a name=\"index\"></a><h1>Index</h1>\n"); |
1022 | xhtml_do_index_body(fp); |
1023 | } |
1024 | |
d7482997 |
1025 | xhtml_dofooter(fp); |
1026 | fclose(fp); |
1027 | } |
1028 | |
/*
 * Convert a wide string to a newly allocated ASCII string, stored in
 * `*out'. Characters outside the printable range 32..126 are
 * replaced by '?'. The buffer comes from smalloc(); the callers in
 * this file release it with sfree().
 */
static void xhtml_utostr(wchar_t *in, char **out)
{
  int len = ustrlen(in);
  char *buf = smalloc(len + 1);
  int k;

  for (k = 0; k < len; k++) {
    wchar_t ch = in[k];
    buf[k] = (ch >= 32 && ch <= 126) ? (char)ch : '?';
  }
  buf[len] = 0;

  *out = buf;
}
1046 | |
1047 | /* |
1048 | * Write contents for the given file, and subfiles, down to |
1049 | * the appropriate contents depth. Returns the number of |
1050 | * entries written. |
1051 | */ |
1052 | static int xhtml_do_contents(FILE *fp, xhtmlfile *file) |
1053 | { |
c8c7926b |
1054 | int level, limit, count = 0; |
d7482997 |
1055 | if (!file) |
1056 | return 0; |
1057 | |
1058 | level = (file->sections)?(file->sections->level):(0); |
1059 | limit = conf.contents_depth[(level>5)?(5):(level)]; |
1060 | start_level = (file->is_leaf) ? (level-1) : (level); |
1061 | last_level = start_level; |
1062 | |
1063 | count += xhtml_do_contents_section_limit(fp, file->sections, limit); |
1064 | count += xhtml_do_contents_limit(fp, file->child, limit); |
1065 | if (fp!=NULL) { |
1066 | while (last_level > start_level) { |
1067 | last_level--; |
c8c7926b |
1068 | fprintf(fp, "</li></ul>\n"); |
d7482997 |
1069 | } |
1070 | } |
1071 | return count; |
1072 | } |
1073 | |
1074 | /* As above, but doesn't do anything in the current file */ |
1075 | static int xhtml_do_naked_contents(FILE *fp, xhtmlfile *file) |
1076 | { |
1077 | int level, limit, start_level, count = 0; |
1078 | if (!file) |
1079 | return 0; |
1080 | |
1081 | level = (file->sections)?(file->sections->level):(0); |
1082 | limit = conf.contents_depth[(level>5)?(5):(level)]; |
1083 | start_level = (file->is_leaf) ? (level-1) : (level); |
1084 | last_level = start_level; |
1085 | |
1086 | count = xhtml_do_contents_limit(fp, file->child, limit); |
1087 | if (fp!=NULL) { |
1088 | while (last_level > start_level) { |
1089 | last_level--; |
c8c7926b |
1090 | fprintf(fp, "</li></ul>\n"); |
d7482997 |
1091 | } |
1092 | } |
1093 | return count; |
1094 | } |
1095 | |
1096 | /* |
1097 | * Write contents for the given file, children, and siblings, down to |
1098 | * given limit contents depth. |
1099 | */ |
1100 | static int xhtml_do_contents_limit(FILE *fp, xhtmlfile *file, int limit) |
1101 | { |
1102 | int count = 0; |
1103 | while (file) { |
1104 | count += xhtml_do_contents_section_limit(fp, file->sections, limit); |
1105 | count += xhtml_do_contents_limit(fp, file->child, limit); |
1106 | file = file->next; |
1107 | } |
1108 | return count; |
1109 | } |
1110 | |
1111 | /* |
1112 | * Write contents entries for the given section tree, down to the |
1113 | * limit contents depth. |
1114 | */ |
1115 | static int xhtml_do_contents_section_deep_limit(FILE *fp, xhtmlsection *section, int limit) |
1116 | { |
1117 | int count = 0; |
1118 | while (section) { |
1119 | if (!xhtml_add_contents_entry(fp, section, limit)) |
1120 | return 0; |
1121 | else |
1122 | count++; |
1123 | count += xhtml_do_contents_section_deep_limit(fp, section->child, limit); |
1124 | section = section->next; |
1125 | } |
1126 | return count; |
1127 | } |
1128 | |
1129 | /* |
1130 | * Write contents entries for the given section tree, down to the |
1131 | * limit contents depth. |
1132 | */ |
1133 | static int xhtml_do_contents_section_limit(FILE *fp, xhtmlsection *section, int limit) |
1134 | { |
1135 | int count = 0; |
1136 | if (!section) |
1137 | return 0; |
1138 | xhtml_add_contents_entry(fp, section, limit); |
1139 | count=1; |
1140 | count += xhtml_do_contents_section_deep_limit(fp, section->child, limit); |
1141 | /* section=section->child; |
1142 | while (section && xhtml_add_contents_entry(fp, section, limit)) { |
1143 | section = section->next; |
1144 | }*/ |
1145 | return count; |
1146 | } |
1147 | |
1148 | /* |
1149 | * Add a section entry, unless we're exceeding the limit, in which |
1150 | * case return FALSE (otherwise return TRUE). |
1151 | */ |
1152 | static int xhtml_add_contents_entry(FILE *fp, xhtmlsection *section, int limit) |
1153 | { |
1154 | if (!section || section->level > limit) |
1155 | return FALSE; |
5d9cc07b |
1156 | if (fp==NULL || section->level < 0) |
d7482997 |
1157 | return TRUE; |
c8c7926b |
1158 | if (last_level > section->level) { |
1159 | while (last_level > section->level) { |
1160 | last_level--; |
1161 | fprintf(fp, "</li></ul>\n"); |
1162 | } |
1163 | fprintf(fp, "</li>\n"); |
1164 | } else if (last_level < section->level) { |
1165 | assert(last_level == section->level - 1); |
d7482997 |
1166 | last_level++; |
1167 | fprintf(fp, "<ul>\n"); |
c8c7926b |
1168 | } else { |
1169 | fprintf(fp, "</li>\n"); |
d7482997 |
1170 | } |
1171 | fprintf(fp, "<li><a href=\"%s#%s\">", section->file->filename, section->fragment); |
1172 | if (section->para->kwtext) { |
ce9921d6 |
1173 | xhtml_para(fp, section->para->kwtext, FALSE); |
d7482997 |
1174 | if (section->para->words) { |
1175 | fprintf(fp, ": "); |
1176 | } |
1177 | } |
1178 | if (section->para->words) { |
ce9921d6 |
1179 | xhtml_para(fp, section->para->words, FALSE); |
d7482997 |
1180 | } |
c8c7926b |
1181 | fprintf(fp, "</a>\n"); |
d7482997 |
1182 | return TRUE; |
1183 | } |
1184 | |
1185 | /* |
1186 | * Write all the sections in this file. Do all paragraphs in this section, then all |
1187 | * children (recursively), then go on to the next one (tail recursively). |
1188 | */ |
1189 | static void xhtml_do_sections(FILE *fp, xhtmlsection *sections) |
1190 | { |
1191 | while (sections) { |
1192 | currentsection = sections; |
ce9921d6 |
1193 | xhtml_do_paras(fp, sections->para, NULL, TRUE); |
d7482997 |
1194 | xhtml_do_sections(fp, sections->child); |
1195 | sections = sections->next; |
1196 | } |
1197 | } |
1198 | |
1199 | /* Write this list of paragraphs. Close off all lists at the end. */ |
ce9921d6 |
1200 | static void xhtml_do_paras(FILE *fp, paragraph *p, paragraph *end, |
1201 | int indexable) |
d7482997 |
1202 | { |
7136a6c7 |
1203 | int last_type = -1, ptype, first=TRUE; |
1204 | stack lcont_stack = stk_new(); |
d7482997 |
1205 | if (!p) |
1206 | return; |
1207 | |
1208 | /* for (; p && (xhtml_para_level(p)>limit || xhtml_para_level(p)==-1 || first); p=p->next) {*/ |
8902e0ed |
1209 | for (; p && p != end && (xhtml_para_level(p)==-1 || first); p=p->next) { |
d7482997 |
1210 | first=FALSE; |
7136a6c7 |
1211 | switch (ptype = p->type) |
d7482997 |
1212 | { |
1213 | /* |
1214 | * Things we ignore because we've already processed them or |
1215 | * aren't going to touch them in this pass. |
1216 | */ |
1217 | case para_IM: |
1218 | case para_BR: |
1219 | case para_Biblio: /* only touch BiblioCited */ |
1220 | case para_VersionID: |
d7482997 |
1221 | case para_NoCite: |
1222 | case para_Title: |
1223 | break; |
1224 | |
1225 | /* |
1226 | * Chapter titles. |
1227 | */ |
1228 | case para_Chapter: |
1229 | case para_Appendix: |
1230 | case para_UnnumberedChapter: |
ce9921d6 |
1231 | xhtml_heading(fp, p, indexable); |
d7482997 |
1232 | break; |
1233 | |
1234 | case para_Heading: |
1235 | case para_Subsect: |
ce9921d6 |
1236 | xhtml_heading(fp, p, indexable); |
d7482997 |
1237 | break; |
1238 | |
1239 | case para_Rule: |
1240 | fprintf(fp, "\n<hr />\n"); |
1241 | break; |
1242 | |
1243 | case para_Normal: |
9057a0a8 |
1244 | case para_Copyright: |
d7482997 |
1245 | fprintf(fp, "\n<p>"); |
ce9921d6 |
1246 | xhtml_para(fp, p->words, indexable); |
d7482997 |
1247 | fprintf(fp, "</p>\n"); |
1248 | break; |
1249 | |
7136a6c7 |
1250 | case para_LcontPush: |
1251 | { |
1252 | int *p; |
1253 | p = mknew(int); |
1254 | *p = last_type; |
1255 | stk_push(lcont_stack, p); |
1256 | last_type = para_Normal; |
1257 | } |
1258 | break; |
1259 | case para_LcontPop: |
1260 | { |
1261 | int *p = stk_pop(lcont_stack); |
1262 | assert(p); |
1263 | ptype = last_type = *p; |
1264 | sfree(p); |
1265 | goto closeofflist; /* ick */ |
1266 | } |
1267 | break; |
2614b01d |
1268 | case para_QuotePush: |
1269 | fprintf(fp, "<blockquote>\n"); |
1270 | break; |
1271 | case para_QuotePop: |
1272 | fprintf(fp, "</blockquote>\n"); |
1273 | break; |
7136a6c7 |
1274 | |
d7482997 |
1275 | case para_Bullet: |
1276 | case para_NumberedList: |
7136a6c7 |
1277 | case para_Description: |
1278 | case para_DescribedThing: |
d7482997 |
1279 | case para_BiblioCited: |
c8c7926b |
1280 | if (last_type!=p->type && |
1281 | !(last_type==para_DescribedThing && p->type==para_Description) && |
1282 | !(last_type==para_Description && p->type==para_DescribedThing)) { |
d7482997 |
1283 | /* start up list if necessary */ |
1284 | if (p->type == para_Bullet) { |
1285 | fprintf(fp, "<ul>\n"); |
1286 | } else if (p->type == para_NumberedList) { |
1287 | fprintf(fp, "<ol>\n"); |
7136a6c7 |
1288 | } else if (p->type == para_BiblioCited || |
1289 | p->type == para_DescribedThing || |
1290 | p->type == para_Description) { |
d7482997 |
1291 | fprintf(fp, "<dl>\n"); |
1292 | } |
1293 | } |
7136a6c7 |
1294 | if (p->type == para_Bullet || p->type == para_NumberedList) { |
d7482997 |
1295 | fprintf(fp, "<li>"); |
7136a6c7 |
1296 | } else if (p->type == para_DescribedThing) { |
1297 | fprintf(fp, "<dt>"); |
1298 | } else if (p->type == para_Description) { |
1299 | fprintf(fp, "<dd>"); |
1300 | } else if (p->type == para_BiblioCited) { |
d7482997 |
1301 | fprintf(fp, "<dt>"); |
ce9921d6 |
1302 | xhtml_para(fp, p->kwtext, indexable); |
d7482997 |
1303 | fprintf(fp, "</dt>\n<dd>"); |
1304 | } |
ce9921d6 |
1305 | xhtml_para(fp, p->words, indexable); |
7136a6c7 |
1306 | { |
1307 | paragraph *p2 = p->next; |
1308 | if (p2 && xhtml_para_level(p2)==-1 && p2->type == para_LcontPush) |
1309 | break; |
1310 | } |
1311 | |
1312 | closeofflist: |
1313 | if (ptype == para_BiblioCited) { |
d7482997 |
1314 | fprintf(fp, "</dd>\n"); |
c8c7926b |
1315 | } else if (ptype == para_DescribedThing) { |
7136a6c7 |
1316 | fprintf(fp, "</dt>"); |
c8c7926b |
1317 | } else if (ptype == para_Description) { |
7136a6c7 |
1318 | fprintf(fp, "</dd>"); |
1319 | } else if (ptype == para_Bullet || ptype == para_NumberedList) { |
d7482997 |
1320 | fprintf(fp, "</li>"); |
1321 | } |
7136a6c7 |
1322 | if (ptype == para_Bullet || ptype == para_NumberedList || |
1323 | ptype == para_BiblioCited || ptype == para_Description || |
1324 | ptype == para_DescribedThing) |
d7482997 |
1325 | /* close off list if necessary */ |
1326 | { |
1327 | paragraph *p2 = p->next; |
1328 | int close_off=FALSE; |
1329 | /* if (p2 && (xhtml_para_level(p2)>limit || xhtml_para_level(p2)==-1)) {*/ |
1330 | if (p2 && xhtml_para_level(p2)==-1) { |
c8c7926b |
1331 | if (p2->type != ptype && |
1332 | !(p2->type==para_DescribedThing && ptype==para_Description) && |
1333 | !(p2->type==para_Description && ptype==para_DescribedThing) && |
1334 | p2->type != para_LcontPush) |
d7482997 |
1335 | close_off=TRUE; |
1336 | } else { |
1337 | close_off=TRUE; |
1338 | } |
1339 | if (close_off) { |
7136a6c7 |
1340 | if (ptype == para_Bullet) { |
d7482997 |
1341 | fprintf(fp, "</ul>\n"); |
7136a6c7 |
1342 | } else if (ptype == para_NumberedList) { |
d7482997 |
1343 | fprintf(fp, "</ol>\n"); |
7136a6c7 |
1344 | } else if (ptype == para_BiblioCited || |
1345 | ptype == para_Description || |
1346 | ptype == para_DescribedThing) { |
d7482997 |
1347 | fprintf(fp, "</dl>\n"); |
1348 | } |
1349 | } |
1350 | } |
1351 | break; |
1352 | |
1353 | case para_Code: |
1354 | xhtml_codepara(fp, p->words); |
1355 | break; |
1356 | } |
7136a6c7 |
1357 | last_type = ptype; |
d7482997 |
1358 | } |
7136a6c7 |
1359 | |
1360 | stk_free(lcont_stack); |
d7482997 |
1361 | } |
1362 | |
1363 | /* |
1364 | * Output a header for this XHTML file. |
1365 | */ |
1366 | static void xhtml_doheader(FILE *fp, word *title) |
1367 | { |
1368 | fprintf(fp, "<!DOCTYPE html PUBLIC \"-//W3C//DTD XHTML 1.0 Transitional//EN\"\n"); |
1369 | fprintf(fp, "\"http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd\">\n"); |
503e4ab0 |
1370 | fprintf(fp, "<html xmlns=\"http://www.w3.org/1999/xhtml\">\n\n<head>\n<title>"); |
d7482997 |
1371 | if (title==NULL) |
1372 | fprintf(fp, "The thing with no name!"); |
1373 | else |
ce9921d6 |
1374 | xhtml_para(fp, title, FALSE); |
d7482997 |
1375 | fprintf(fp, "</title>\n"); |
1376 | fprintf(fp, "<meta name=\"generator\" content=\"Halibut %s xhtml-backend\" />\n", version); |
1377 | if (conf.author) |
1378 | fprintf(fp, "<meta name=\"author\" content=\"%ls\" />\n", conf.author); |
1379 | if (conf.description) |
1380 | fprintf(fp, "<meta name=\"description\" content=\"%ls\" />\n", conf.description); |
1381 | if (conf.head_end) |
1382 | fprintf(fp, "%ls\n", conf.head_end); |
1383 | fprintf(fp, "</head>\n\n"); |
1384 | if (conf.body) |
1385 | fprintf(fp, "%ls\n", conf.body); |
1386 | else |
1387 | fprintf(fp, "<body>\n"); |
1388 | if (conf.body_start) |
1389 | fprintf(fp, "%ls\n", conf.body_start); |
1390 | } |
1391 | |
1392 | /* |
1393 | * Output a footer for this XHTML file. |
1394 | */ |
1395 | static void xhtml_dofooter(FILE *fp) |
1396 | { |
1397 | fprintf(fp, "\n<hr />\n\n"); |
1398 | if (conf.body_end) |
1399 | fprintf(fp, "%ls\n", conf.body_end); |
1400 | if (!conf.suppress_address) { |
1401 | fprintf(fp,"<address>\n"); |
1402 | if (conf.address_start) |
1403 | fprintf(fp, "%ls\n", conf.address_start); |
1404 | /* Do the version ID */ |
1405 | if (conf.include_version_id) { |
1406 | paragraph *p; |
1407 | int started = 0; |
1408 | for (p = sourceparas; p; p = p->next) |
1409 | if (p->type == para_VersionID) { |
1410 | xhtml_versionid(fp, p->words, started); |
1411 | started = 1; |
1412 | } |
1413 | } |
1414 | if (conf.address_end) |
1415 | fprintf(fp, "%ls\n", conf.address_end); |
1416 | fprintf(fp, "</address>\n"); |
1417 | } |
1418 | fprintf(fp, "</body>\n\n</html>\n"); |
1419 | } |
1420 | |
1421 | /* |
1422 | * Output the versionid paragraph. Typically this is a version control |
1423 | * ID string (such as $Id...$ in RCS). |
1424 | */ |
1425 | static void xhtml_versionid(FILE *fp, word *text, int started) |
1426 | { |
1427 | rdstringc t = { 0, 0, NULL }; |
1428 | |
1429 | rdaddc(&t, '['); /* FIXME: configurability */ |
ce9921d6 |
1430 | xhtml_rdaddwc(&t, text, NULL, FALSE); |
d7482997 |
1431 | rdaddc(&t, ']'); /* FIXME: configurability */ |
1432 | |
1433 | if (started) |
c8c7926b |
1434 | fprintf(fp, "<br />\n"); |
d7482997 |
1435 | fprintf(fp, "%s\n", t.text); |
1436 | sfree(t.text); |
1437 | } |
1438 | |
1439 | /* Is this an XHTML reserved character? */ |
1440 | static int xhtml_reservedchar(int c) |
1441 | { |
1442 | if (c=='&' || c=='<' || c=='>' || c=='"') |
1443 | return TRUE; |
1444 | else |
1445 | return FALSE; |
1446 | } |
1447 | |
1448 | /* |
1449 | * Convert a wide string into valid XHTML: Anything outside ASCII will |
1450 | * be fixed up as an entity. Currently we don't worry about constraining the |
1451 | * encoded character set, which we should probably do at some point (we can |
1452 | * still fix up and return FALSE - see the last comment here). We also don't |
1453 | * currently |
1454 | * |
1455 | * Because this is only used for words, spaces are HARD spaces (any other |
1456 | * spaces will be word_Whitespace not word_Normal). So they become |
1457 | * Unless hard_spaces is FALSE, of course (code paragraphs break the above |
1458 | * rule). |
1459 | * |
1460 | * If `result' is non-NULL, mallocs the resulting string and stores a pointer to |
1461 | * it in `*result'. If `result' is NULL, merely checks whether all |
1462 | * characters in the string are feasible. |
1463 | * |
1464 | * Return is nonzero if all characters are OK. If not all |
1465 | * characters are OK but `result' is non-NULL, a result _will_ |
1466 | * still be generated! |
1467 | */ |
4b3c5afb |
1468 | static int xhtml_convert(wchar_t *s, int maxlen, char **result, |
1469 | int hard_spaces) { |
d7482997 |
1470 | int doing = (result != 0); |
1471 | int ok = TRUE; |
1472 | char *p = NULL; |
1473 | int plen = 0, psize = 0; |
1474 | |
4b3c5afb |
1475 | if (maxlen <= 0) |
1476 | maxlen = -1; |
1477 | |
1478 | for (; *s && maxlen != 0; s++, maxlen--) { |
d7482997 |
1479 | wchar_t c = *s; |
1480 | |
1481 | #define ensure_size(i) if (i>=psize) { psize = i+256; p = resize(p, psize); } |
1482 | |
1483 | if (((c == 32 && !hard_spaces) || (c > 32 && c <= 126 && !xhtml_reservedchar(c)))) { |
1484 | /* Char is OK. */ |
1485 | if (doing) |
1486 | { |
1487 | ensure_size(plen); |
1488 | p[plen++] = (char)c; |
1489 | } |
1490 | } else { |
1491 | /* Char needs fixing up. */ |
1492 | /* ok = FALSE; -- currently we never return FALSE; we |
1493 | * might want to when considering a character set for the |
1494 | * encoded document. |
1495 | */ |
1496 | if (doing) |
1497 | { |
1498 | if (c==32) { /* a space in a word is a hard space */ |
1499 | ensure_size(plen+6); /* includes space for the NUL, which is subsequently stomped on */ |
1500 | sprintf(p+plen, " "); |
1501 | plen+=6; |
1502 | } else { |
1503 | /* FIXME: entity names! */ |
1504 | ensure_size(plen+8); /* includes space for the NUL, which is subsequently stomped on */ |
1505 | plen+=sprintf(p+plen, "&#%04i;", (int)c); |
1506 | } |
1507 | } |
1508 | } |
1509 | } |
1510 | if (doing) { |
1511 | p = resize(p, plen+1); |
1512 | p[plen] = '\0'; |
1513 | *result = p; |
1514 | } |
1515 | return ok; |
1516 | } |
1517 | |
1518 | /* |
1519 | * This formats the given words as XHTML. |
ce9921d6 |
1520 | * |
1521 | * `indexable', if FALSE, prohibits adding any index references. |
1522 | * You might use this, for example, if an index reference occurred |
1523 | * in a section title, to prevent phony index references when the |
1524 | * section title is processed in strange places such as contents |
1525 | * sections. |
d7482997 |
1526 | */ |
ce9921d6 |
1527 | static void xhtml_rdaddwc(rdstringc *rs, word *text, word *end, int indexable) { |
d7482997 |
1528 | char *c; |
1529 | keyword *kwl; |
1530 | xhtmlsection *sect; |
1531 | indextag *itag; |
1532 | int ti; |
1533 | |
1534 | for (; text && text != end; text = text->next) { |
1535 | switch (text->type) { |
1536 | case word_HyperLink: |
1537 | xhtml_utostr(text->text, &c); |
1538 | rdaddsc(rs, "<a href=\""); |
1539 | rdaddsc(rs, c); |
1540 | rdaddsc(rs, "\">"); |
1541 | sfree(c); |
1542 | break; |
1543 | |
1544 | case word_UpperXref: |
1545 | case word_LowerXref: |
1546 | kwl = kw_lookup(keywords, text->text); |
1547 | if (kwl) { |
1548 | sect=xhtml_find_section(kwl->para); |
1549 | if (sect) { |
1550 | rdaddsc(rs, "<a href=\""); |
1551 | rdaddsc(rs, sect->file->filename); |
1552 | rdaddc(rs, '#'); |
1553 | rdaddsc(rs, sect->fragment); |
1554 | rdaddsc(rs, "\">"); |
1555 | } else { |
1556 | rdaddsc(rs, "<a href=\"Apologies.html\"><!-- probably a bibliography cross reference -->"); |
1557 | error(err_whatever, "Couldn't locate cross-reference! (Probably a bibliography entry.)"); |
1558 | } |
1559 | } else { |
1560 | rdaddsc(rs, "<a href=\"Apologies.html\"><!-- unknown cross-reference -->"); |
1561 | error(err_whatever, "Couldn't locate cross-reference! (Wasn't in source file.)"); |
1562 | } |
1563 | break; |
1564 | |
1565 | case word_IndexRef: /* in theory we could make an index target here */ |
1566 | /* rdaddsc(rs, "<a name=\"idx-"); |
1567 | xhtml_utostr(text->text, &c); |
1568 | rdaddsc(rs, c); |
1569 | sfree(c); |
1570 | rdaddsc(rs, "\"></a>");*/ |
1571 | /* what we _do_ need to do is to fix up the backend data |
1572 | * for any indexentry this points to. |
1573 | */ |
ce9921d6 |
1574 | if (!indexable) |
1575 | break; |
1576 | |
d7482997 |
1577 | for (ti=0; (itag = (indextag *)index234(idx->tags, ti))!=NULL; ti++) { |
1578 | /* FIXME: really ustricmp() and not ustrcmp()? */ |
1579 | if (ustricmp(itag->name, text->text)==0) { |
1580 | break; |
1581 | } |
1582 | } |
1583 | if (itag!=NULL) { |
1584 | if (itag->refs!=NULL) { |
1585 | int i; |
1586 | for (i=0; i<itag->nrefs; i++) { |
1587 | xhtmlindex *idx_ref; |
1588 | indexentry *ientry; |
1589 | |
1590 | ientry = itag->refs[i]; |
1591 | if (ientry->backend_data==NULL) { |
1592 | idx_ref = (xhtmlindex*) smalloc(sizeof(xhtmlindex)); |
1593 | if (idx_ref==NULL) |
1594 | fatal(err_nomemory); |
1595 | idx_ref->nsection = 0; |
1596 | idx_ref->size = 4; |
1597 | idx_ref->sections = (xhtmlsection**) smalloc(idx_ref->size * sizeof(xhtmlsection*)); |
1598 | if (idx_ref->sections==NULL) |
1599 | fatal(err_nomemory); |
1600 | ientry->backend_data = idx_ref; |
1601 | } else { |
1602 | idx_ref = ientry->backend_data; |
1603 | if (idx_ref->nsection+1 > idx_ref->size) { |
1604 | int new_size = idx_ref->size * 2; |
1605 | idx_ref->sections = srealloc(idx_ref->sections, new_size * sizeof(xhtmlsection)); |
1606 | if (idx_ref->sections==NULL) { |
1607 | fatal(err_nomemory); |
1608 | } |
1609 | idx_ref->size = new_size; |
1610 | } |
1611 | } |
1612 | idx_ref->sections[idx_ref->nsection++] = currentsection; |
1613 | #if 0 |
1614 | #endif |
1615 | } |
1616 | } else { |
1617 | fatal(err_whatever, "Index tag had no entries!"); |
1618 | } |
1619 | } else { |
1620 | fprintf(stderr, "Looking for index entry '%ls'\n", text->text); |
1621 | fatal(err_whatever, "Couldn't locate index entry! (Wasn't in index.)"); |
1622 | } |
1623 | break; |
1624 | |
1625 | case word_HyperEnd: |
1626 | case word_XrefEnd: |
1627 | rdaddsc(rs, "</a>"); |
1628 | break; |
1629 | |
1630 | case word_Normal: |
1631 | case word_Emph: |
1632 | case word_Code: |
1633 | case word_WeakCode: |
1634 | case word_WhiteSpace: |
1635 | case word_EmphSpace: |
1636 | case word_CodeSpace: |
1637 | case word_WkCodeSpace: |
1638 | case word_Quote: |
1639 | case word_EmphQuote: |
1640 | case word_CodeQuote: |
1641 | case word_WkCodeQuote: |
1642 | assert(text->type != word_CodeQuote && |
1643 | text->type != word_WkCodeQuote); |
1644 | if (towordstyle(text->type) == word_Emph && |
1645 | (attraux(text->aux) == attr_First || |
1646 | attraux(text->aux) == attr_Only)) |
1647 | rdaddsc(rs, "<em>"); |
1648 | else if ((towordstyle(text->type) == word_Code || towordstyle(text->type) == word_WeakCode) && |
1649 | (attraux(text->aux) == attr_First || |
1650 | attraux(text->aux) == attr_Only)) |
1651 | rdaddsc(rs, "<code>"); |
1652 | |
1653 | if (removeattr(text->type) == word_Normal) { |
12efc259 |
1654 | if (xhtml_convert(text->text, 0, &c, TRUE) || !text->alt) |
1655 | /* spaces in the word are hard */ |
d7482997 |
1656 | rdaddsc(rs, c); |
1657 | else |
ce9921d6 |
1658 | xhtml_rdaddwc(rs, text->alt, NULL, indexable); |
d7482997 |
1659 | sfree(c); |
1660 | } else if (removeattr(text->type) == word_WhiteSpace) { |
1661 | rdaddc(rs, ' '); |
1662 | } else if (removeattr(text->type) == word_Quote) { |
1663 | rdaddsc(rs, """); |
1664 | } |
1665 | |
1666 | if (towordstyle(text->type) == word_Emph && |
1667 | (attraux(text->aux) == attr_Last || |
1668 | attraux(text->aux) == attr_Only)) |
1669 | rdaddsc(rs, "</em>"); |
1670 | else if ((towordstyle(text->type) == word_Code || towordstyle(text->type) == word_WeakCode) && |
1671 | (attraux(text->aux) == attr_Last || |
1672 | attraux(text->aux) == attr_Only)) |
1673 | rdaddsc(rs, "</code>"); |
1674 | break; |
1675 | } |
1676 | } |
1677 | } |
1678 | |
1679 | /* Output a heading, formatted as XHTML. |
1680 | */ |
ce9921d6 |
1681 | static void xhtml_heading(FILE *fp, paragraph *p, int indexable) |
d7482997 |
1682 | { |
1683 | rdstringc t = { 0, 0, NULL }; |
1684 | word *tprefix = p->kwtext; |
1685 | word *nprefix = p->kwtext2; |
1686 | word *text = p->words; |
1687 | int level = xhtml_para_level(p); |
1688 | xhtmlsection *sect = xhtml_find_section(p); |
5d9cc07b |
1689 | xhtmlheadfmt *fmt; |
d7482997 |
1690 | char *fragment; |
1691 | if (sect) { |
1692 | fragment = sect->fragment; |
1693 | } else { |
d2e74722 |
1694 | if (p->type == para_Title) |
1695 | fragment = "title"; |
1696 | else { |
1697 | fragment = ""; /* FIXME: what else can we do? */ |
1698 | error(err_whatever, "Couldn't locate heading cross-reference!"); |
1699 | } |
d7482997 |
1700 | } |
1701 | |
5d9cc07b |
1702 | if (p->type == para_Title) |
1703 | fmt = NULL; |
1704 | else if (level == 1) |
1705 | fmt = &conf.fchapter; |
1706 | else if (level-1 < conf.nfsect) |
1707 | fmt = &conf.fsect[level-1]; |
1708 | else |
1709 | fmt = &conf.fsect[conf.nfsect-1]; |
1710 | |
1711 | if (fmt && fmt->just_numbers && nprefix) { |
ce9921d6 |
1712 | xhtml_rdaddwc(&t, nprefix, NULL, indexable); |
5d9cc07b |
1713 | if (fmt) { |
1714 | char *c; |
4b3c5afb |
1715 | if (xhtml_convert(fmt->number_suffix, 0, &c, FALSE)) { |
5d9cc07b |
1716 | rdaddsc(&t, c); |
1717 | sfree(c); |
1718 | } |
1719 | } |
1720 | } else if (fmt && !fmt->just_numbers && tprefix) { |
ce9921d6 |
1721 | xhtml_rdaddwc(&t, tprefix, NULL, indexable); |
5d9cc07b |
1722 | if (fmt) { |
1723 | char *c; |
4b3c5afb |
1724 | if (xhtml_convert(fmt->number_suffix, 0, &c, FALSE)) { |
5d9cc07b |
1725 | rdaddsc(&t, c); |
1726 | sfree(c); |
1727 | } |
1728 | } |
d7482997 |
1729 | } |
ce9921d6 |
1730 | xhtml_rdaddwc(&t, text, NULL, indexable); |
d9d3dd95 |
1731 | /* |
1732 | * If we're outputting in single-file mode, we need to lower |
1733 | * the level of each heading by one, because the overall |
1734 | * document title will be sitting right at the top as an <h1> |
1735 | * and so chapters and sections should start at <h2>. |
1736 | * |
1737 | * Even if not, the document title will come back from |
1738 | * xhtml_para_level() as level zero, so we must increment that |
1739 | * no matter what leaf_level is set to. |
1740 | */ |
1741 | if (conf.leaf_level == 0 || level == 0) |
1742 | level++; |
d7482997 |
1743 | fprintf(fp, "<a name=\"%s\"></a><h%i>%s</h%i>\n", fragment, level, t.text, level); |
1744 | sfree(t.text); |
1745 | } |
1746 | |
1747 | /* Output a paragraph. Styles are handled by xhtml_rdaddwc(). |
1748 | * This looks pretty simple; I may have missed something ... |
1749 | */ |
ce9921d6 |
1750 | static void xhtml_para(FILE *fp, word *text, int indexable) |
d7482997 |
1751 | { |
1752 | rdstringc out = { 0, 0, NULL }; |
ce9921d6 |
1753 | xhtml_rdaddwc(&out, text, NULL, indexable); |
d7482997 |
1754 | fprintf(fp, "%s", out.text); |
1755 | sfree(out.text); |
1756 | } |
1757 | |
1758 | /* Output a code paragraph. I'm treating this as preformatted, which |
1759 | * may not be entirely correct. See xhtml_para() for my worries about |
1760 | * this being overly-simple; however I think that most of the complexity |
1761 | * of the text backend came entirely out of word wrapping anyway. |
1762 | */ |
1763 | static void xhtml_codepara(FILE *fp, word *text) |
1764 | { |
1765 | fprintf(fp, "<pre>"); |
1766 | for (; text; text = text->next) if (text->type == word_WeakCode) { |
4b3c5afb |
1767 | word *here, *next; |
d7482997 |
1768 | char *c; |
4b3c5afb |
1769 | |
1770 | /* |
1771 | * See if this WeakCode is followed by an Emph to indicate |
1772 | * emphasis. |
1773 | */ |
1774 | here = text; |
1775 | if (text->next && text->next->type == word_Emph) { |
1776 | next = text = text->next; |
1777 | } else |
1778 | next = NULL; |
1779 | |
1780 | if (next) { |
1781 | wchar_t *t, *e; |
1782 | int n; |
1783 | |
1784 | t = here->text; |
1785 | e = next->text; |
1786 | |
1787 | while (*e) { |
1788 | int ec = *e; |
1789 | |
1790 | for (n = 0; t[n] && e[n] && e[n] == ec; n++); |
1791 | xhtml_convert(t, n, &c, FALSE); |
1792 | fprintf(fp, "%s%s%s", |
1793 | (ec == 'i' ? "<em>" : ec == 'b' ? "<b>" : ""), |
1794 | c, |
1795 | (ec == 'i' ? "</em>" : ec == 'b' ? "</b>" : "")); |
1796 | sfree(c); |
1797 | |
1798 | t += n; |
1799 | e += n; |
1800 | } |
1801 | |
1802 | xhtml_convert(t, 0, &c, FALSE); |
1803 | fprintf(fp, "%s\n", c); |
1804 | sfree(c); |
1805 | } else { |
1806 | xhtml_convert(here->text, 0, &c, FALSE); |
1807 | fprintf(fp, "%s\n", c); |
1808 | sfree(c); |
1809 | } |
d7482997 |
1810 | } |
1811 | fprintf(fp, "</pre>\n"); |
1812 | } |