mdw@git.distorted.org.uk Git - sgt/halibut/blob

1 /*

2 * Info backend for Halibut

3 *

4 * The Info file format isn't well-specified, and what specification

5 * there is is scattered all over the place. Sources include:

6 * (info), from GNU Texinfo.

7 * (texinfo), also from GNU Texinfo.

8 * (Emacs)Misc Help, and (emacs)Info Lookup, from GNU Emacs.

9 * info.el, from GNU Emacs.

10 *

11 * Possible future work:

12 *

13 * - configurable choice of how to allocate node names?

14 * + possibly a template-like approach, choosing node names to

15 * be the full section title or perhaps the internal keyword?

16 * + neither of those seems quite right. Perhaps instead a

17 * Windows Help-like mechanism, where a magic config

18 * directive allows user choice of name for every node.

19 * + Only trouble with that is, now what happens to the section

20 * numbers? Do they become completely vestigial and just sit

21 * in the title text of each node? Or do we keep them in the

22 * menus somehow? I think people might occasionally want to

23 * go to a section by number, if only because all the _other_

24 * formats of the same document will reference the numbers

25 * all the time. So our menu lines could look like one of

26 * these:

27 * * Nodename: Section 1.2. Title of section.

28 * * Section 1.2: Nodename. Title of section.

29 *

30 * - might be helpful to diagnose duplicate node names!

31 *

32 * - Indices generated by makeinfo use a menu rather than a bunch of

33 * cross-references, which reduces visual clutter rather. For

34 * singly-referenced items, it looks like:

35 * * toner cartridge, replacing: Toner.

36 * It does a horrid job on multiply-referenced entries, though,

37 * perhaps because the name before the colon is meant to be unique.

38 * Info's 'i' command requires the use of a menu -- it fails to

39 * find any index entries at all with Halibut's current index format.

40 *

41 * - The string "*note" is matched case-insensitively, so we could

42 * make things slightly less ugly by using the lower-case version

43 * when the user asks for \k. Unfortunately, standalone Info seems

44 * to match node names case-sensitively, so we can't downcase that.

45 *

46 * - The character encoding used in an Info file can be configured using

47 * an Emacs local variables block at the end, like this:

48 * Local Variables:

49 * coding: iso-8859-1

50 * End:

51 */

53 #include <stdio.h>

54 #include <stdlib.h>

55 #include <assert.h>

56 #include "halibut.h"

/*
 * Presentation settings for one class of heading (title, chapter, or
 * a given section depth). The only setting is the underline string
 * drawn beneath the heading text.
 */
typedef struct {
    /*
     * Wide string used to underline the heading. info_configure()
     * treats this as a list of alternatives and advances through it
     * until it finds one representable in the output charset.
     */
    wchar_t *underline;
} alignstruct;

62 typedef struct {

63 char *filename;

64 int maxfilesize;

65 int charset;

66 int listindentbefore, listindentafter;

67 int indent_code, width, index_width;

68 alignstruct atitle, achapter, *asect;

69 int nasect;

70 wchar_t *bullet, *listsuffix;

71 wchar_t *startemph, *endemph;

72 wchar_t *lquote, *rquote;

73 wchar_t *sectsuffix;

74 wchar_t *rule;

75 wchar_t *index_text;

76 } infoconfig;

78 typedef struct {

79 rdstringc output;

80 int charset;

81 charset_state state;

82 int wcmode;

83 } info_data;

84 #define EMPTY_INFO_DATA { { 0, 0, NULL }, 0, CHARSET_INIT_STATE, FALSE }

85 static const info_data empty_info_data = EMPTY_INFO_DATA;

87 typedef struct node_tag node;

88 struct node_tag {

89 node *listnext;

     node *up, *prev, *next, *lastchild;

91 int pos, started_menu, filenum;

92 char *name;

93 info_data text;

94 };

96 typedef struct {

97 char *text;

98 int length;

99 int nnodes, nodesize;

100 node **nodes;

101 } info_idx;

102

 static int info_rdadd(info_data *, wchar_t);

 static int info_rdadds(info_data *, wchar_t const *);

 static int info_rdaddc(info_data *, char);

 static int info_rdaddsc(info_data *, char const *);

107

 static void info_heading(info_data *, word *, word *, alignstruct, int,

109 infoconfig *);

 static void info_rule(info_data *, int, int, infoconfig *);

 static void info_para(info_data *, word *, wchar_t *, word *, keywordlist *,

                       int, int, int, infoconfig *);

 static void info_codepara(info_data *, word *, int, int);

 static void info_versionid(info_data *, word *, infoconfig *);

 static void info_menu_item(info_data *, node *, paragraph *, infoconfig *);

 static word *info_transform_wordlist(word *, keywordlist *);

 static int info_check_index(word *, node *, indexdata *);

118

 static int info_rdaddwc(info_data *, word *, word *, int, infoconfig *);

120

 static node *info_node_new(char *name, int charset);

 static char *info_node_name_for_para(paragraph *p, infoconfig *);

 static char *info_node_name_for_text(wchar_t *text, infoconfig *);

124

 /*
  * Build the Info backend configuration for a document.
  *
  * Starts from built-in defaults, then scans the paragraph list twice:
  * first for global settings (`quotes', `index'), then for the
  * Info-specific `info-*' settings, so that the specific ones win
  * regardless of the order they appear in. Finally, for settings
  * that carry a list of alternatives (quotes, emphasis markers,
  * underlines, bullet, rule), steps through the alternatives until
  * one is representable in the chosen output charset.
  *
  * Several wide-string defaults below contain embedded NULs: each is
  * a sequence of alternatives which uadv() is used to step through,
  * ending with an empty string.
  *
  * The returned structure owns `filename' and `asect' (both
  * allocated here); the other string fields point at string
  * literals or into the paragraphs' keyword storage.
  */
 static infoconfig info_configure(paragraph *source) {
     infoconfig ret;
     paragraph *p;
     int n;

     /*
      * Defaults.
      */
     ret.filename = dupstr("output.info");
     ret.maxfilesize = 64 << 10;
     ret.charset = CS_ASCII;
     ret.width = 70;
     ret.listindentbefore = 1;
     ret.listindentafter = 3;
     ret.indent_code = 2;
     ret.index_width = 40;
     ret.listsuffix = L".";
     ret.bullet = L"\x2022\0-\0\0";
     ret.rule = L"\x2500\0-\0\0";
     ret.startemph = L"_\0_\0\0";
     ret.endemph = uadv(ret.startemph);
     ret.lquote = L"\x2018\0\x2019\0`\0'\0\0";
     ret.rquote = uadv(ret.lquote);
     ret.sectsuffix = L": ";
     /*
      * Default underline characters are chosen to match those recognised by
      * Info-fontify-node.
      */
     ret.atitle.underline = L"*\0\0";
     ret.achapter.underline = L"=\0\0";
     ret.nasect = 2;
     ret.asect = snewn(ret.nasect, alignstruct);
     ret.asect[0].underline = L"-\0\0";
     ret.asect[1].underline = L".\0\0";
     ret.index_text = L"Index";

     /*
      * Two-pass configuration so that we can pick up global config
      * (e.g. `quotes') before having it overridden by specific
      * config (`info-quotes'), irrespective of the order in which
      * they occur.
      */
     for (p = source; p; p = p->next) {
         if (p->type == para_Config) {
             if (!ustricmp(p->keyword, L"quotes")) {
                 /* Only accept the setting if it supplies both quotes. */
                 if (*uadv(p->keyword) && *uadv(uadv(p->keyword))) {
                     ret.lquote = uadv(p->keyword);
                     ret.rquote = uadv(ret.lquote);
                 }
             } else if (!ustricmp(p->keyword, L"index")) {
                 ret.index_text = uadv(p->keyword);
             }
         }
     }

     for (p = source; p; p = p->next) {
         if (p->type == para_Config) {
             if (!ustricmp(p->keyword, L"info-filename")) {
                 sfree(ret.filename);
                 ret.filename = dupstr(adv(p->origkeyword));
             } else if (!ustricmp(p->keyword, L"info-charset")) {
                 ret.charset = charset_from_ustr(&p->fpos, uadv(p->keyword));
             } else if (!ustricmp(p->keyword, L"info-max-file-size")) {
                 ret.maxfilesize = utoi(uadv(p->keyword));
             } else if (!ustricmp(p->keyword, L"info-width")) {
                 ret.width = utoi(uadv(p->keyword));
             } else if (!ustricmp(p->keyword, L"info-indent-code")) {
                 ret.indent_code = utoi(uadv(p->keyword));
             } else if (!ustricmp(p->keyword, L"info-index-width")) {
                 ret.index_width = utoi(uadv(p->keyword));
             } else if (!ustricmp(p->keyword, L"info-list-indent")) {
                 ret.listindentbefore = utoi(uadv(p->keyword));
             } else if (!ustricmp(p->keyword, L"info-listitem-indent")) {
                 ret.listindentafter = utoi(uadv(p->keyword));
             } else if (!ustricmp(p->keyword, L"info-section-suffix")) {
                 ret.sectsuffix = uadv(p->keyword);
             } else if (!ustricmp(p->keyword, L"info-underline")) {
                 /* One setting applied to every heading level. */
                 ret.atitle.underline = ret.achapter.underline =
                     uadv(p->keyword);
                 for (n = 0; n < ret.nasect; n++)
                     ret.asect[n].underline = ret.atitle.underline;
             } else if (!ustricmp(p->keyword, L"info-chapter-underline")) {
                 ret.achapter.underline = uadv(p->keyword);
             } else if (!ustricmp(p->keyword, L"info-section-underline")) {
                 /*
                  * Optional leading numeric argument selects the
                  * section depth; without it, depth 0 is configured.
                  */
                 wchar_t *q = uadv(p->keyword);
                 int level = 0;
                 if (uisdigit(*q)) {
                     level = utoi(q);
                     q = uadv(q);
                 }
                 if (level >= ret.nasect) {
                     /*
                      * Grow the table, filling the new levels with a
                      * copy of the deepest level configured so far.
                      */
                     int i;
                     ret.asect = sresize(ret.asect, level+1, alignstruct);
                     for (i = ret.nasect; i <= level; i++)
                         ret.asect[i] = ret.asect[ret.nasect-1];
                     ret.nasect = level+1;
                 }
                 ret.asect[level].underline = q;
             } else if (!ustricmp(p->keyword, L"info-title-underline")) {
                 /*
                  * This used to test for "text-title-underline", the
                  * text backend's keyword, so the Info title
                  * underline could not be set under its own name.
                  */
                 ret.atitle.underline = uadv(p->keyword);
             } else if (!ustricmp(p->keyword, L"info-bullet")) {
                 ret.bullet = uadv(p->keyword);
             } else if (!ustricmp(p->keyword, L"info-rule")) {
                 ret.rule = uadv(p->keyword);
             } else if (!ustricmp(p->keyword, L"info-list-suffix")) {
                 ret.listsuffix = uadv(p->keyword);
             } else if (!ustricmp(p->keyword, L"info-emphasis")) {
                 if (*uadv(p->keyword) && *uadv(uadv(p->keyword))) {
                     ret.startemph = uadv(p->keyword);
                     ret.endemph = uadv(ret.startemph);
                 }
             } else if (!ustricmp(p->keyword, L"info-quotes")) {
                 if (*uadv(p->keyword) && *uadv(uadv(p->keyword))) {
                     ret.lquote = uadv(p->keyword);
                     ret.rquote = uadv(ret.lquote);
                 }
             }
         }
     }

     /*
      * Now process fallbacks on quote characters, underlines, the
      * rule character, the emphasis characters, and bullets.
      *
      * Paired settings (quotes, emphasis) advance two strings at a
      * time, and only while a complete further pair is available.
      */
     while (*uadv(ret.rquote) && *uadv(uadv(ret.rquote)) &&
            (!cvt_ok(ret.charset, ret.lquote) ||
             !cvt_ok(ret.charset, ret.rquote))) {
         ret.lquote = uadv(ret.rquote);
         ret.rquote = uadv(ret.lquote);
     }

     while (*uadv(ret.endemph) && *uadv(uadv(ret.endemph)) &&
            (!cvt_ok(ret.charset, ret.startemph) ||
             !cvt_ok(ret.charset, ret.endemph))) {
         ret.startemph = uadv(ret.endemph);
         ret.endemph = uadv(ret.startemph);
     }

     /*
      * Single-string settings advance one alternative at a time, and
      * keep the last alternative even if it can't be converted.
      */
     while (*ret.atitle.underline && *uadv(ret.atitle.underline) &&
            !cvt_ok(ret.charset, ret.atitle.underline))
         ret.atitle.underline = uadv(ret.atitle.underline);

     while (*ret.achapter.underline && *uadv(ret.achapter.underline) &&
            !cvt_ok(ret.charset, ret.achapter.underline))
         ret.achapter.underline = uadv(ret.achapter.underline);

     for (n = 0; n < ret.nasect; n++) {
         while (*ret.asect[n].underline && *uadv(ret.asect[n].underline) &&
                !cvt_ok(ret.charset, ret.asect[n].underline))
             ret.asect[n].underline = uadv(ret.asect[n].underline);
     }

     while (*ret.bullet && *uadv(ret.bullet) &&
            !cvt_ok(ret.charset, ret.bullet))
         ret.bullet = uadv(ret.bullet);

     while (*ret.rule && *uadv(ret.rule) &&
            !cvt_ok(ret.charset, ret.rule))
         ret.rule = uadv(ret.rule);

     return ret;
 }

287

 /*
  * Produce the configuration paragraph(s) that set the Info output
  * file name to `filename', by handing the "info-filename" keyword
  * and the name to cmdline_cfg_simple().
  */
 paragraph *info_config_filename(char *filename)
 {
     paragraph *cfg;

     cfg = cmdline_cfg_simple("info-filename", filename, NULL);
     return cfg;
 }

292

 /*
  * Entry point of the Info backend: render a whole document to one
  * primary Info file plus, when splitting is enabled, numbered
  * subfiles.
  *
  *  sourceform  the document's paragraph list
  *  keywords    keyword table, used to resolve cross-references
  *  idx         index data; each entry gets an info_idx attached
  *  unused      ignored
  *
  * The work proceeds in stages: configure; create one node per
  * section heading; render index terms; build the introductory
  * text; render the title and body into the nodes; append an index
  * node if anything was indexed; prepend each node's header line;
  * compute tag-table offsets; assign nodes to subfiles; and write
  * the files.
  *
  * Changes from the previous version of this function:
  *  - has_index is now initialised before being accumulated with |=
  *    (it was previously read uninitialised).
  *  - the subfile name buffer is freed if the subfile can't be
  *    opened.
  *  - a non-positive info-max-file-size consistently means "don't
  *    split"; previously a negative value caused the node text to be
  *    written nowhere.
  *  - the top node's "* Menu:" header is emitted before the index
  *    menu item if no section had already started the menu.
  */
 void info_backend(paragraph *sourceform, keywordlist *keywords,
                   indexdata *idx, void *unused) {
     paragraph *p;
     infoconfig conf;
     word *prefix, *body, *wp;
     word spaceword;
     wchar_t *prefixextra;
     int nesting, nestindent;
     int indentb, indenta;
     int filepos;
     int has_index;
     info_data intro_text = EMPTY_INFO_DATA;
     node *topnode, *currnode;
     word bullet;
     FILE *fp;

     IGNORE(unused);

     conf = info_configure(sourceform);

     /*
      * Go through and create a node for each section.
      */
     topnode = info_node_new("Top", conf.charset);
     currnode = topnode;
     for (p = sourceform; p; p = p->next) switch (p->type) {
         /*
          * Chapter titles.
          */
       case para_Chapter:
       case para_Appendix:
       case para_UnnumberedChapter:
       case para_Heading:
       case para_Subsect:
         {
             node *newnode, *upnode;
             char *nodename;

             nodename = info_node_name_for_para(p, &conf);
             newnode = info_node_new(nodename, conf.charset);
             sfree(nodename);

             p->private_data = newnode;

             /* A heading with no parent hangs directly off Top. */
             if (p->parent)
                 upnode = (node *)p->parent->private_data;
             else
                 upnode = topnode;
             assert(upnode);
             newnode->up = upnode;

             currnode->next = newnode;
             newnode->prev = currnode;

             currnode->listnext = newnode;
             currnode = newnode;
         }
         break;
       default:
         p->private_data = NULL;
         break;
     }

     /*
      * Set up the display form of each index entry.
      */
     {
         int i;
         indexentry *entry;

         for (i = 0; (entry = index234(idx->entries, i)) != NULL; i++) {
             info_idx *ii = snew(info_idx);
             info_data id = EMPTY_INFO_DATA;

             id.charset = conf.charset;

             ii->nnodes = ii->nodesize = 0;
             ii->nodes = NULL;

             ii->length = info_rdaddwc(&id, entry->text, NULL, FALSE, &conf);

             /* The index entry takes over the rendered buffer. */
             ii->text = id.output.text;

             entry->backend_data = ii;
         }
     }

     /*
      * An Info file begins with a piece of introductory text which
      * is apparently never shown anywhere. This seems to me to be a
      * good place to put the copyright notice and the version IDs.
      * Also, Info directory entries are expected to go here.
      */
     intro_text.charset = conf.charset;

     info_rdaddsc(&intro_text,
                  "This Info file generated by Halibut, ");
     info_rdaddsc(&intro_text, version);
     info_rdaddsc(&intro_text, "\n\n");

     for (p = sourceform; p; p = p->next)
         if (p->type == para_Config &&
             !ustricmp(p->keyword, L"info-dir-entry")) {
             wchar_t *section, *shortname, *longname, *kw;
             char *s;

             /*
              * Arguments: section, short name, long name, and an
              * optional keyword naming the node to link to.
              */
             section = uadv(p->keyword);
             shortname = *section ? uadv(section) : L"";
             longname = *shortname ? uadv(shortname) : L"";
             kw = *longname ? uadv(longname) : L"";

             if (!*longname) {
                 err_cfginsufarg(&p->fpos, p->origkeyword, 3);
                 continue;
             }

             info_rdaddsc(&intro_text, "INFO-DIR-SECTION ");
             info_rdadds(&intro_text, section);
             info_rdaddsc(&intro_text, "\nSTART-INFO-DIR-ENTRY\n* ");
             info_rdadds(&intro_text, shortname);
             info_rdaddsc(&intro_text, ": (");
             /* Refer to the file without any trailing ".info". */
             s = dupstr(conf.filename);
             if (strlen(s) > 5 && !strcmp(s+strlen(s)-5, ".info"))
                 s[strlen(s)-5] = '\0';
             info_rdaddsc(&intro_text, s);
             sfree(s);
             info_rdaddsc(&intro_text, ")");
             if (*kw) {
                 keyword *kwl = kw_lookup(keywords, kw);
                 if (kwl && kwl->para->private_data) {
                     node *n = (node *)kwl->para->private_data;
                     info_rdaddsc(&intro_text, n->name);
                 }
             }
             info_rdaddsc(&intro_text, ".   ");
             info_rdadds(&intro_text, longname);
             info_rdaddsc(&intro_text, "\nEND-INFO-DIR-ENTRY\n\n");
         }

     for (p = sourceform; p; p = p->next)
         if (p->type == para_Copyright)
             info_para(&intro_text, NULL, NULL, p->words, keywords,
                       0, 0, conf.width, &conf);

     for (p = sourceform; p; p = p->next)
         if (p->type == para_VersionID)
             info_versionid(&intro_text, p->words, &conf);

     if (intro_text.output.text[intro_text.output.pos-1] != '\n')
         info_rdaddc(&intro_text, '\n');

     /* Do the title */
     for (p = sourceform; p; p = p->next)
         if (p->type == para_Title)
             info_heading(&topnode->text, NULL, p->words,
                          conf.atitle, conf.width, &conf);

     nestindent = conf.listindentbefore + conf.listindentafter;
     nesting = 0;

     currnode = topnode;

     /*
      * Nothing has been indexed yet. This must be set before the
      * main loop, which only ever ORs into it.
      */
     has_index = FALSE;

     /* Do the main document */
     for (p = sourceform; p; p = p->next) switch (p->type) {

       case para_QuotePush:
         nesting += 2;
         break;
       case para_QuotePop:
         nesting -= 2;
         assert(nesting >= 0);
         break;

       case para_LcontPush:
         nesting += nestindent;
         break;
       case para_LcontPop:
         nesting -= nestindent;
         assert(nesting >= 0);
         break;

         /*
          * Things we ignore because we've already processed them or
          * aren't going to touch them in this pass.
          */
       case para_IM:
       case para_BR:
       case para_Biblio:               /* only touch BiblioCited */
       case para_VersionID:
       case para_NoCite:
       case para_Title:
         break;

         /*
          * Chapter titles.
          */
       case para_Chapter:
       case para_Appendix:
       case para_UnnumberedChapter:
       case para_Heading:
       case para_Subsect:
         currnode = p->private_data;
         assert(currnode);
         assert(currnode->up);

         /* List this node in its parent's menu. */
         if (!currnode->up->started_menu) {
             info_rdaddsc(&currnode->up->text, "* Menu:\n\n");
             currnode->up->started_menu = TRUE;
         }
         info_menu_item(&currnode->up->text, currnode, p, &conf);

         has_index |= info_check_index(p->words, currnode, idx);
         if (p->type == para_Chapter || p->type == para_Appendix ||
             p->type == para_UnnumberedChapter)
             info_heading(&currnode->text, p->kwtext, p->words,
                          conf.achapter, conf.width, &conf);
         else
             /* Depths beyond the configured ones reuse the deepest. */
             info_heading(&currnode->text, p->kwtext, p->words,
                          conf.asect[p->aux>=conf.nasect?conf.nasect-1:p->aux],
                          conf.width, &conf);
         nesting = 0;
         break;

       case para_Rule:
         info_rule(&currnode->text, nesting, conf.width - nesting, &conf);
         break;

       case para_Normal:
       case para_Copyright:
       case para_DescribedThing:
       case para_Description:
       case para_BiblioCited:
       case para_Bullet:
       case para_NumberedList:
         has_index |= info_check_index(p->words, currnode, idx);
         if (p->type == para_Bullet) {
             bullet.next = NULL;
             bullet.alt = NULL;
             bullet.type = word_Normal;
             bullet.text = conf.bullet;
             prefix = &bullet;
             prefixextra = NULL;
             indentb = conf.listindentbefore;
             indenta = conf.listindentafter;
         } else if (p->type == para_NumberedList) {
             prefix = p->kwtext;
             prefixextra = conf.listsuffix;
             indentb = conf.listindentbefore;
             indenta = conf.listindentafter;
         } else if (p->type == para_Description) {
             prefix = NULL;
             prefixextra = NULL;
             indentb = conf.listindentbefore;
             indenta = conf.listindentafter;
         } else {
             prefix = NULL;
             prefixextra = NULL;
             indentb = indenta = 0;
         }
         if (p->type == para_BiblioCited) {
             /*
              * Temporarily splice a copy of the citation text and a
              * space onto the front of the paragraph's own words.
              */
             body = dup_word_list(p->kwtext);
             for (wp = body; wp->next; wp = wp->next);
             wp->next = &spaceword;
             spaceword.next = p->words;
             spaceword.alt = NULL;
             spaceword.type = word_WhiteSpace;
             spaceword.text = NULL;
         } else {
             wp = NULL;
             body = p->words;
         }
         info_para(&currnode->text, prefix, prefixextra, body, keywords,
                   nesting + indentb, indenta,
                   conf.width - nesting - indentb - indenta, &conf);
         if (wp) {
             /* Undo the splice before freeing only our copy. */
             wp->next = NULL;
             free_word_list(body);
         }
         break;

       case para_Code:
         info_codepara(&currnode->text, p->words,
                       nesting + conf.indent_code,
                       conf.width - nesting - 2 * conf.indent_code);
         break;
     }

     /*
      * Create an index node if required.
      */
     if (has_index) {
         node *newnode;
         int i, j, k;
         indexentry *entry;
         char *nodename;

         nodename = info_node_name_for_text(conf.index_text, &conf);
         newnode = info_node_new(nodename, conf.charset);
         sfree(nodename);

         newnode->up = topnode;

         currnode->next = newnode;
         newnode->prev = currnode;
         currnode->listnext = newnode;

         /* Heading: the index title, underlined chapter-style. */
         k = info_rdadds(&newnode->text, conf.index_text);
         info_rdaddsc(&newnode->text, "\n");
         while (k > 0) {
             info_rdadds(&newnode->text, conf.achapter.underline);
             k -= ustrwid(conf.achapter.underline, conf.charset);
         }
         info_rdaddsc(&newnode->text, "\n\n");

         /*
          * Make sure the top node's menu has its header even if no
          * section started it.
          */
         if (!topnode->started_menu) {
             info_rdaddsc(&topnode->text, "* Menu:\n\n");
             topnode->started_menu = TRUE;
         }
         info_menu_item(&topnode->text, newnode, NULL, &conf);

         for (i = 0; (entry = index234(idx->entries, i)) != NULL; i++) {
             info_idx *ii = (info_idx *)entry->backend_data;

             for (j = 0; j < ii->nnodes; j++) {
                 /*
                  * When we have multiple references for a single
                  * index term, we only display the actual term on
                  * the first line, to make it clear that the terms
                  * really are the same.
                  */
                 if (j == 0)
                     info_rdaddsc(&newnode->text, ii->text);
                 for (k = (j ? 0 : ii->length); k < conf.index_width-2; k++)
                     info_rdaddc(&newnode->text, ' ');
                 info_rdaddsc(&newnode->text, "  *Note ");
                 info_rdaddsc(&newnode->text, ii->nodes[j]->name);
                 info_rdaddsc(&newnode->text, "::\n");
             }
         }
     }

     /*
      * Finalise the text of each node, by adding the ^_ delimiter
      * and the node line at the top.
      */
     for (currnode = topnode; currnode; currnode = currnode->listnext) {
         char *origtext = currnode->text.output.text;
         currnode->text = empty_info_data;
         currnode->text.charset = conf.charset;
         info_rdaddsc(&currnode->text, "\037\nFile: ");
         info_rdaddsc(&currnode->text, conf.filename);
         info_rdaddsc(&currnode->text, ",  Node: ");
         info_rdaddsc(&currnode->text, currnode->name);
         if (currnode->prev) {
             info_rdaddsc(&currnode->text, ",  Prev: ");
             info_rdaddsc(&currnode->text, currnode->prev->name);
         }
         info_rdaddsc(&currnode->text, ",  Up: ");
         info_rdaddsc(&currnode->text, (currnode->up ?
                                        currnode->up->name : "(dir)"));
         if (currnode->next) {
             info_rdaddsc(&currnode->text, ",  Next: ");
             info_rdaddsc(&currnode->text, currnode->next->name);
         }
         info_rdaddsc(&currnode->text, "\n\n");
         info_rdaddsc(&currnode->text, origtext);
         /*
          * Just make _absolutely_ sure we end with a newline.
          */
         if (currnode->text.output.text[currnode->text.output.pos-1] != '\n')
             info_rdaddc(&currnode->text, '\n');

         sfree(origtext);
     }

     /*
      * Compute the offsets for the tag table.
      */
     filepos = intro_text.output.pos;
     for (currnode = topnode; currnode; currnode = currnode->listnext) {
         currnode->pos = filepos;
         filepos += currnode->text.output.pos;
     }

     /*
      * Split into sub-files.
      */
     if (conf.maxfilesize > 0) {
         int currfilesize = intro_text.output.pos, currfilenum = 1;
         for (currnode = topnode; currnode; currnode = currnode->listnext) {
             /*
              * Start a new subfile when this node would overflow the
              * current one -- but never leave a subfile empty.
              */
             if (currfilesize > intro_text.output.pos &&
                 currfilesize + currnode->text.output.pos > conf.maxfilesize) {
                 currfilenum++;
                 currfilesize = intro_text.output.pos;
             }
             currnode->filenum = currfilenum;
             currfilesize += currnode->text.output.pos;
         }
     }

     /*
      * Write the primary output file.
      */
     fp = fopen(conf.filename, "w");
     if (!fp) {
         err_cantopenw(conf.filename);
         return;
     }
     fputs(intro_text.output.text, fp);
     if (conf.maxfilesize <= 0) {
         /* Not splitting: all the node text goes in this one file. */
         for (currnode = topnode; currnode; currnode = currnode->listnext)
             fputs(currnode->text.output.text, fp);
     } else {
         /* Splitting: list each subfile with its starting offset. */
         int filenum = 0;
         fprintf(fp, "\037\nIndirect:\n");
         for (currnode = topnode; currnode; currnode = currnode->listnext)
             if (filenum != currnode->filenum) {
                 filenum = currnode->filenum;
                 fprintf(fp, "%s-%d: %d\n", conf.filename, filenum,
                         currnode->pos);
             }
     }
     fprintf(fp, "\037\nTag Table:\n");
     if (conf.maxfilesize > 0)
         fprintf(fp, "(Indirect)\n");
     for (currnode = topnode; currnode; currnode = currnode->listnext)
         fprintf(fp, "Node: %s\177%d\n", currnode->name, currnode->pos);
     fprintf(fp, "\037\nEnd Tag Table\n");
     fclose(fp);

     /*
      * Write the subfiles.
      */
     if (conf.maxfilesize > 0) {
         int filenum = 0;
         fp = NULL;

         for (currnode = topnode; currnode; currnode = currnode->listnext) {
             if (filenum != currnode->filenum) {
                 char *fname;

                 filenum = currnode->filenum;

                 if (fp)
                     fclose(fp);
                 /* 40 extra bytes is ample for "-" plus a decimal int. */
                 fname = snewn(strlen(conf.filename) + 40, char);
                 sprintf(fname, "%s-%d", conf.filename, filenum);
                 fp = fopen(fname, "w");
                 if (!fp) {
                     err_cantopenw(fname);
                     sfree(fname);
                     return;
                 }
                 sfree(fname);
                 /* Every subfile starts with the introductory text. */
                 fputs(intro_text.output.text, fp);
             }
             fputs(currnode->text.output.text, fp);
         }

         if (fp)
             fclose(fp);
     }
 }

751

 /*
  * Scan a word list for index references and record, against each
  * index entry referred to, that node `n' mentions it.
  *
  *  w    first word of the list to scan (may be NULL)
  *  n    the node the words belong to
  *  idx  index data used to look up tags
  *
  * Returns 1 if at least one node reference was newly recorded, and
  * 0 otherwise.
  *
  * An index reference whose tag can't be found is skipped. This
  * function previously used `break' there, which abandoned the whole
  * word list and so lost any later references in the same paragraph.
  */
 static int info_check_index(word *w, node *n, indexdata *idx)
 {
     int ret = 0;

     for (; w; w = w->next) {
         if (w->type == word_IndexRef) {
             indextag *tag;
             int i;

             tag = index_findtag(idx, w->text);
             if (!tag)
                 continue;

             for (i = 0; i < tag->nrefs; i++) {
                 indexentry *entry = tag->refs[i];
                 info_idx *ii = (info_idx *)entry->backend_data;

                 if (ii->nnodes > 0 && ii->nodes[ii->nnodes-1] == n) {
                     /*
                      * If the same index term is indexed twice
                      * within the same section, we only want to
                      * mention it once in the index. So do nothing
                      * here.
                      */
                     continue;
                 }

                 /* Grow the node array in chunks of 32 when full. */
                 if (ii->nnodes >= ii->nodesize) {
                     ii->nodesize += 32;
                     ii->nodes = sresize(ii->nodes, ii->nodesize, node *);
                 }

                 ii->nodes[ii->nnodes++] = n;

                 ret = 1;
             }
         }
     }

     return ret;
 }

793

 /*
  * Return a modified copy of `words' suitable for Info output.
  *
  * Every word in the copy has its private_data cleared. For each
  * cross-reference word whose keyword resolves to something other
  * than a numbered list item or a cited bibliography entry, the
  * words that follow it, up to and including the matching XrefEnd,
  * are removed, and the xref word's private_data is pointed at the
  * target paragraph's node so that the renderer can print the node
  * name instead.
  *
  * The caller owns the returned list.
  */
 static word *info_transform_wordlist(word *words, keywordlist *keywords)
 {
     word *copy = dup_word_list(words);
     word *cur;

     for (cur = copy; cur; cur = cur->next) {
         keyword *target;
         word *scan, *doomed, *rest;

         cur->private_data = NULL;

         if (cur->type != word_UpperXref && cur->type != word_LowerXref)
             continue;

         target = kw_lookup(keywords, cur->text);
         if (!target)
             continue;

         /*
          * In Info, we do nothing special for xrefs to numbered
          * list items or bibliography entries.
          */
         if (target->para->type == para_NumberedList ||
             target->para->type == para_BiblioCited)
             continue;

         /*
          * An xref to a different section has its text completely
          * replaced. Find the XrefEnd, cut the list just after it,
          * and throw away everything between.
          */
         doomed = cur->next;
         rest = NULL;
         for (scan = doomed; scan; scan = scan->next) {
             if (scan->type == word_XrefEnd) {
                 rest = scan->next;
                 scan->next = NULL;
                 break;
             }
         }
         free_word_list(doomed);

         /*
          * Rejoin the list after the xref word, and leave a pointer
          * to the target node in the xref word's private data for
          * info_rdaddwc and friends to read the node name from.
          */
         cur->next = rest;
         cur->private_data = target->para->private_data;
         assert(cur->private_data);
     }

     return copy;
 }

850

 static int info_rdaddwc(info_data *id, word *words, word *end, int xrefs,

852 infoconfig *cfg) {

853 int ret = 0;

854

     for (; words && words != end; words = words->next) switch (words->type) {

856 case word_HyperLink:

857 case word_HyperEnd:

858 case word_XrefEnd:

859 case word_IndexRef:

860 break;

861

862 case word_Normal:

863 case word_Emph:

864 case word_Code:

865 case word_WeakCode:

866 case word_WhiteSpace:

867 case word_EmphSpace:

868 case word_CodeSpace:

869 case word_WkCodeSpace:

870 case word_Quote:

871 case word_EmphQuote:

872 case word_CodeQuote:

873 case word_WkCodeQuote:

         assert(words->type != word_CodeQuote &&

875 words->type != word_WkCodeQuote);

         if (towordstyle(words->type) == word_Emph &&

             (attraux(words->aux) == attr_First ||

              attraux(words->aux) == attr_Only))

             ret += info_rdadds(id, cfg->startemph);

         else if (towordstyle(words->type) == word_Code &&

                  (attraux(words->aux) == attr_First ||

                   attraux(words->aux) == attr_Only))

             ret += info_rdadds(id, cfg->lquote);

         if (removeattr(words->type) == word_Normal) {

             if (cvt_ok(id->charset, words->text) || !words->alt)

                 ret += info_rdadds(id, words->text);

887 else

                 ret += info_rdaddwc(id, words->alt, NULL, FALSE, cfg);

         } else if (removeattr(words->type) == word_WhiteSpace) {

             ret += info_rdadd(id, L' ');

         } else if (removeattr(words->type) == word_Quote) {

             ret += info_rdadds(id, quoteaux(words->aux) == quote_Open ?

893 cfg->lquote : cfg->rquote);

894 }

         if (towordstyle(words->type) == word_Emph &&

             (attraux(words->aux) == attr_Last ||

              attraux(words->aux) == attr_Only))

             ret += info_rdadds(id, cfg->endemph);

         else if (towordstyle(words->type) == word_Code &&

                  (attraux(words->aux) == attr_Last ||

                   attraux(words->aux) == attr_Only))

             ret += info_rdadds(id, cfg->rquote);

903 break;

904

905 case word_UpperXref:

906 case word_LowerXref:

         if (xrefs && words->private_data) {

908 /*

909 * This bit is structural and so must be done in char

910 * rather than wchar_t.

911 */

             ret += info_rdaddsc(id, "*Note ");

             ret += info_rdaddsc(id, ((node *)words->private_data)->name);

             ret += info_rdaddsc(id, "::");

915 }

916 break;

917 }

918

919 return ret;

920 }

921

 static int info_width_internal(word *words, int xrefs, infoconfig *cfg);

 /*
  * Total display width of every word in a list, obtained by summing
  * info_width_internal() over the list. Returns 0 for an empty list.
  */
 static int info_width_internal_list(word *words, int xrefs, infoconfig *cfg) {
     int total = 0;
     word *cur;

     for (cur = words; cur; cur = cur->next)
         total += info_width_internal(cur, xrefs, cfg);

     return total;
 }

932

 /*
  * Display width of a single word as info_rdaddwc() would render it.
  *
  *  words  the word to measure (only this word, not the list)
  *  xrefs  if true, resolved cross-references count as "*Note" links
  *  cfg    backend configuration (charset, emphasis and quote strings)
  *
  * The closing emphasis/quote marker is measured using endemph and
  * rquote, matching what info_rdaddwc() actually emits. This
  * function previously measured startemph/lquote a second time,
  * giving the wrong width whenever the opening and closing markers
  * differ in width.
  */
 static int info_width_internal(word *words, int xrefs, infoconfig *cfg) {
     int wid;
     int attr;

     switch (words->type) {
       case word_HyperLink:
       case word_HyperEnd:
       case word_XrefEnd:
       case word_IndexRef:
         return 0;

       case word_UpperXref:
       case word_LowerXref:
         if (xrefs && words->private_data) {
             /* "*Note " plus "::" comes to 8 characters */
             return 8 + strwid(((node *)words->private_data)->name,
                               cfg->charset);
         } else
             return 0;
     }

     assert(words->type < word_internal_endattrs);

     wid = 0;
     attr = towordstyle(words->type);

     if (attr == word_Emph || attr == word_Code) {
         /* Opening marker, on the first (or only) word of a run. */
         if (attraux(words->aux) == attr_Only ||
             attraux(words->aux) == attr_First)
             wid += ustrwid(attr == word_Emph ? cfg->startemph : cfg->lquote,
                            cfg->charset);
         /* Closing marker, on the last (or only) word of a run. */
         if (attraux(words->aux) == attr_Only ||
             attraux(words->aux) == attr_Last)
             wid += ustrwid(attr == word_Emph ? cfg->endemph : cfg->rquote,
                            cfg->charset);
     }

     switch (words->type) {
       case word_Normal:
       case word_Emph:
       case word_Code:
       case word_WeakCode:
         /*
          * Measure the alternative text only when the main text
          * can't be converted and an alternative exists.
          */
         if (cvt_ok(cfg->charset, words->text) || !words->alt)
             wid += ustrwid(words->text, cfg->charset);
         else
             wid += info_width_internal_list(words->alt, xrefs, cfg);
         return wid;

       case word_WhiteSpace:
       case word_EmphSpace:
       case word_CodeSpace:
       case word_WkCodeSpace:
       case word_Quote:
       case word_EmphQuote:
       case word_CodeQuote:
       case word_WkCodeQuote:
         assert(words->type != word_CodeQuote &&
                words->type != word_WkCodeQuote);
         if (removeattr(words->type) == word_Quote) {
             if (quoteaux(words->aux) == quote_Open)
                 wid += ustrwid(cfg->lquote, cfg->charset);
             else
                 wid += ustrwid(cfg->rquote, cfg->charset);
         } else
             wid++;                     /* space */
     }
     return wid;
 }

1003

 static int info_width_noxrefs(void *ctx, word *words)
{
    /*
     * Width callback that measures `words' with cross-references
     * counted as zero-width. `ctx' is the infoconfig in use,
     * passed as an untyped pointer.
     */
    infoconfig *cfg = (infoconfig *)ctx;

    return info_width_internal(words, FALSE, cfg);
}

 static int info_width_xrefs(void *ctx, word *words)
{
    /*
     * Width callback that measures `words' with cross-references
     * counted at their full "*Note <node>::" width. `ctx' is the
     * infoconfig in use, passed as an untyped pointer.
     */
    infoconfig *cfg = (infoconfig *)ctx;

    return info_width_internal(words, TRUE, cfg);
}

1012

 static void info_heading(info_data *text, word *tprefix,
                         word *words, alignstruct align,
                         int width, infoconfig *cfg) {
    /*
     * Write a heading into `text'.
     *
     * If `tprefix' is given it is written first, followed by the
     * configured section suffix, and the first wrapped line is
     * narrowed by the space that took up. The heading words are
     * then wrapped to `width' (cross-references are not rendered).
     * If align.underline is a non-empty string, each output line
     * is followed by a line made of that string repeated until it
     * is at least as wide as the text above it. A blank line ends
     * the heading.
     */
    int linewid = 0;
    wrappedline *lines, *ln;

    if (tprefix != NULL) {
        linewid = info_rdaddwc(text, tprefix, NULL, FALSE, cfg);
        linewid += info_rdadds(text, cfg->sectsuffix);
    }

    /* Only the first line has to leave room for the prefix. */
    lines = wrap_para(words, width - linewid, width,
                      info_width_noxrefs, cfg, 0);

    for (ln = lines; ln != NULL; ln = ln->next) {
        linewid += info_rdaddwc(text, ln->begin, ln->end, FALSE, cfg);
        info_rdadd(text, L'\n');

        if (align.underline[0] != L'\0') {
            int remaining;

            for (remaining = linewid; remaining > 0;
                 remaining -= ustrwid(align.underline, cfg->charset))
                info_rdadds(text, align.underline);
            info_rdadd(text, L'\n');
        }

        /* Later lines carry no prefix, so start counting afresh. */
        linewid = 0;
    }

    wrap_free(lines);
    info_rdadd(text, L'\n');
}

1046

 static void info_rule(info_data *text, int indent, int width, infoconfig *cfg)
{
    /*
     * Write a horizontal rule into `text': `indent' spaces, then
     * the configured rule string repeated until at least `width'
     * columns have been covered, then a newline and a blank line.
     */
    int remaining;

    for (; indent != 0; indent--)
        info_rdadd(text, L' ');

    for (remaining = width; remaining > 0;
         remaining -= ustrwid(cfg->rule, cfg->charset))
        info_rdadds(text, cfg->rule);

    info_rdadd(text, L'\n');
    info_rdadd(text, L'\n');
}

1057

 static void info_para(info_data *text, word *prefix, wchar_t *prefixextra,
                      word *input, keywordlist *keywords, int indent,
                      int extraindent, int width, infoconfig *cfg) {
    /*
     * Write a wrapped paragraph into `text'.
     *
     * `input' is first passed through info_transform_wordlist()
     * together with `keywords'; the resulting list is freed before
     * returning. Body lines are indented by indent + extraindent
     * and wrapped to `width', with cross-references rendered.
     *
     * If `prefix' is given (optionally followed by `prefixextra'),
     * it is written after `indent' spaces and is meant to sit
     * inside the `extraindent' columns. When it is wider than
     * that, the first line is shortened to compensate; if that
     * leaves no room at all, the paragraph text starts on a fresh
     * line instead.
     */
    int hang = indent + extraindent;   /* indentation of ordinary lines */
    int lead;                          /* spaces owed before the next line */
    int firstwid = width;
    int k;
    word *xformed;
    wrappedline *lines, *ln;

    xformed = info_transform_wordlist(input, keywords);

    if (!prefix) {
        lead = hang;
    } else {
        int used;

        for (k = indent; k > 0; k--)
            info_rdadd(text, L' ');
        used = info_rdaddwc(text, prefix, NULL, FALSE, cfg);
        if (prefixextra)
            used += info_rdadds(text, prefixextra);

        /* Padding needed to reach the text column; negative if overshot. */
        lead = extraindent - used;
        if (lead < 0) {
            firstwid += lead;          /* shrink by the overshoot */
            if (firstwid >= 0) {
                lead = 0;
            } else {
                /* Prefix fills the whole line: begin the text below it. */
                lead = hang;
                firstwid = width;
                info_rdadd(text, L'\n');
            }
        }
    }

    lines = wrap_para(xformed, firstwid, width, info_width_xrefs, cfg, 0);
    for (ln = lines; ln != NULL; ln = ln->next) {
        for (k = lead; k > 0; k--)
            info_rdadd(text, L' ');
        info_rdaddwc(text, ln->begin, ln->end, TRUE, cfg);
        info_rdadd(text, L'\n');
        lead = hang;
    }
    wrap_free(lines);
    info_rdadd(text, L'\n');

    free_word_list(xformed);
}

1103

 static void info_codepara(info_data *text, word *words,
                          int indent, int width) {
    /*
     * Write a code paragraph into `text'. Each word_WeakCode entry
     * in `words' becomes one output line, indented by `indent'
     * spaces; entries of any other type are ignored. Lines wider
     * than `width' are still written as they are. A blank line
     * ends the paragraph.
     */
    word *w;

    for (w = words; w != NULL; w = w->next) {
        int pad, used;

        if (w->type != word_WeakCode)
            continue;

        for (pad = indent; pad > 0; pad--)
            info_rdadd(text, L' ');

        used = info_rdadds(text, w->text);
        if (used > width) {
            /* FIXME: warn */
        }
        info_rdadd(text, L'\n');
    }

    info_rdadd(text, L'\n');
}

1119

 static void info_versionid(info_data *text, word *words, infoconfig *cfg) {
    /*
     * Write a version identifier into `text' as a single line:
     * the words enclosed in square brackets, followed by a newline.
     */
    wchar_t const *closing = L"]\n";

    info_rdadd(text, L'[');
    info_rdaddwc(text, words, NULL, FALSE, cfg);
    info_rdadds(text, closing);
}

1125

 static node *info_node_new(char *name, int charset)

1127 {

1128 node *n;

1129

1130 n = snew(node);

1131 n->text = empty_info_data;

1132 n->text.charset = charset;

     n->up = n->next = n->prev = n->lastchild = n->listnext = NULL;

     n->name = dupstr(name);

1135 n->started_menu = FALSE;

1136

1137 return n;

1138 }

1139

 static char *info_node_name_core(info_data *id, filepos *fpos)
{
    /*
     * We cannot have commas, colons or parentheses in a node name.
     * Remove any that we find, with a warning.
     *
     * The filtering is done in place on id->output.text, and that
     * same buffer is what gets returned. `fpos' is handed to the
     * error routine for each character removed.
     */
    char *src, *dst;

    dst = id->output.text;
    for (src = id->output.text; *src != '\0'; src++) {
        switch (*src) {
          case ':':
          case ',':
          case '(':
          case ')':
            err_infonodechar(fpos, *src);
            break;
          default:
            *dst++ = *src;
            break;
        }
    }
    *dst = '\0';

    return id->output.text;
}

1161

 static char *info_node_name_for_para(paragraph *par, infoconfig *cfg)
{
    /*
     * Build a node name for paragraph `par': render its keyword
     * text if it has any, otherwise its ordinary words, in the
     * configured charset, then strip the characters that are not
     * allowed in node names. Removed characters are reported
     * against the paragraph's file position.
     */
    info_data buf = EMPTY_INFO_DATA;
    word *title;

    if (par->kwtext)
        title = par->kwtext;
    else
        title = par->words;

    buf.charset = cfg->charset;
    info_rdaddwc(&buf, title, NULL, FALSE, cfg);
    info_rdaddsc(&buf, NULL);          /* leave wide-character mode */

    return info_node_name_core(&buf, &par->fpos);
}

1173

 static char *info_node_name_for_text(wchar_t *text, infoconfig *cfg)
{
    /*
     * Build a node name from the plain wide string `text': convert
     * it to the configured charset, then strip the characters that
     * are not allowed in node names. No file position is available
     * here, so NULL is passed on for error reporting.
     */
    info_data buf = EMPTY_INFO_DATA;
    filepos *nowhere = NULL;

    buf.charset = cfg->charset;
    info_rdadds(&buf, text);
    info_rdaddsc(&buf, NULL);          /* leave wide-character mode */

    return info_node_name_core(&buf, nowhere);
}

1184

 static void info_menu_item(info_data *text, node *n, paragraph *p,

1186 infoconfig *cfg)

1187 {

1188 /*

1189 * FIXME: Depending on how we're doing node names in this info

1190 * file, we might want to do

1191 *

1192 * * Node name:: Chapter title

1193 *

1194 * _or_

1195 *

1196 * * Chapter number: Node name.

1197 *

1198 * This function mostly works in char rather than wchar_t,

1199 * because a menu item is a structural component.

1200 */

     info_rdaddsc(text, "* ");

     info_rdaddsc(text, n->name);

     info_rdaddsc(text, "::");

1204 if (p) {

         info_rdaddc(text, ' ');

         info_rdaddwc(text, p->words, NULL, FALSE, cfg);

1207 }

     info_rdaddc(text, '\n');

1209 }

1210

/*
 * These functions implement my wrapper on the rdadd* calls which
 * allows me to switch arbitrarily between literal octet-string
 * text and charset-translated Unicode. (Because no matter what
 * character set I write the actual text in, I expect info readers
 * to treat node names and file names literally and to expect
 * keywords like `*Note' in their canonical form, so I have to take
 * steps to ensure that those structural elements of the file
 * aren't messed with.)
 */

 static int info_rdadds(info_data *d, wchar_t const *wcs)
{
    /*
     * Append the wide string `wcs' to d's output, translated into
     * d's charset.
     *
     * If `d' was in literal-octet mode it is switched to
     * wide-character mode first, with the conversion state reset.
     * This happens even when `wcs' is NULL, in which case nothing
     * is written.
     *
     * Returns the display width of `wcs' in d's charset, or 0 for
     * a NULL string.
     */
    if (!d->wcmode) {
        d->state = charset_init_state;
        d->wcmode = TRUE;
    }

    if (wcs) {
        char buf[256];
        int len, width, ret;

        /* Measure up front: the conversion loop below advances wcs. */
        width = ustrwid(wcs, d->charset);

        len = ustrlen(wcs);
        while (len > 0) {
            int prevlen = len;

            /*
             * Offer the converter one byte less than the buffer
             * holds. The result is NUL-terminated at buf[ret]
             * below, so if the converter were allowed to fill the
             * whole buffer that store would land one byte past
             * the end of buf.
             */
            ret = charset_from_unicode(&wcs, &len, buf, lenof(buf) - 1,
                                       d->charset, &d->state, NULL);

            /* Each pass must consume input, or we would never finish. */
            assert(len < prevlen);

            if (ret > 0) {
                buf[ret] = '\0';
                rdaddsc(&d->output, buf);
            }
        }

        return width;
    } else
        return 0;
}

1253

 static int info_rdaddsc(info_data *d, char const *cs)
{
    /*
     * Append the literal octet string `cs' to d's output, with no
     * charset translation.
     *
     * If `d' was in wide-character mode, the converter is first
     * asked (with a NULL input) for any bytes it still wants to
     * emit, those are written out, and `d' is switched back to
     * literal mode. Passing cs == NULL performs just that switch,
     * which makes it usable as a "flush" call.
     *
     * Returns the display width of `cs', or 0 for a NULL string.
     */
    if (d->wcmode) {
        char buf[256];
        int ret;

        /*
         * Keep one byte of buf in reserve for the terminating NUL
         * stored at buf[ret] below, so that a completely filled
         * buffer cannot push that store out of bounds.
         */
        ret = charset_from_unicode(NULL, 0, buf, lenof(buf) - 1,
                                   d->charset, &d->state, NULL);
        if (ret > 0) {
            buf[ret] = '\0';
            rdaddsc(&d->output, buf);
        }

        d->wcmode = FALSE;
    }

    if (cs) {
        rdaddsc(&d->output, cs);
        return strwid(cs, d->charset);
    } else
        return 0;
}

1276

 static int info_rdadd(info_data *d, wchar_t wc)
{
    /*
     * Append the single wide character `wc' to d's output by
     * wrapping it in a one-character string and handing that to
     * info_rdadds(). Returns whatever info_rdadds() returns.
     */
    wchar_t single[2];

    single[1] = L'\0';
    single[0] = wc;

    return info_rdadds(d, single);
}

1284

 static int info_rdaddc(info_data *d, char c)
{
    /*
     * Append the single literal octet `c' to d's output by
     * wrapping it in a one-character string and handing that to
     * info_rdaddsc(). Returns whatever info_rdaddsc() returns.
     */
    char single[2];

    single[1] = '\0';
    single[0] = c;

    return info_rdaddsc(d, single);
}