texinfo/makeinfo/html.c

56160Sru/* html.c -- html-related utilities.
146515Sru   $Id: html.c,v 1.28 2004/12/06 01:13:06 karl Exp $
56160Sru
146515Sru   Copyright (C) 1999, 2000, 2001, 2002, 2003, 2004 Free Software
146515Sru   Foundation, Inc.
56160Sru
56160Sru   This program is free software; you can redistribute it and/or modify
56160Sru   it under the terms of the GNU General Public License as published by
56160Sru   the Free Software Foundation; either version 2, or (at your option)
56160Sru   any later version.
56160Sru
56160Sru   This program is distributed in the hope that it will be useful,
56160Sru   but WITHOUT ANY WARRANTY; without even the implied warranty of
56160Sru   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
56160Sru   GNU General Public License for more details.
56160Sru
56160Sru   You should have received a copy of the GNU General Public License
56160Sru   along with this program; if not, write to the Free Software Foundation,
56160Sru   Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.  */
56160Sru
56160Sru#include "system.h"
56160Sru#include "cmds.h"
146515Sru#include "files.h"
56160Sru#include "html.h"
56160Sru#include "lang.h"
56160Sru#include "makeinfo.h"
146515Sru#include "node.h"
56160Sru#include "sectioning.h"
56160Sru
56160Sru
116525Sru/* Append CHAR to BUFFER, (re)allocating as necessary.  We don't handle
116525Sru   null characters.  */
116525Sru
/* A growable, null-terminated character buffer.  It is filled one
   character at a time by append_char.  */
typedef struct
{
  unsigned size;    /* bytes currently allocated for BUFFER */
  unsigned length;  /* characters stored, not counting the final null */
  char *buffer;     /* the text; NULL until something is appended */
} buffer_type;
116525Sru
116525Srustatic buffer_type *
146515Sruinit_buffer (void)
116525Sru{
116525Sru  buffer_type *buf = xmalloc (sizeof (buffer_type));
116525Sru  buf->length = 0;
116525Sru  buf->size = 0;
116525Sru  buf->buffer = NULL;
116525Sru
116525Sru  return buf;
116525Sru}
116525Sru
116525Srustatic void
146515Sruappend_char (buffer_type *buf, int c)
116525Sru{
116525Sru  buf->length++;
116525Sru  if (buf->length >= buf->size)
116525Sru    {
116525Sru      buf->size += 100;
116525Sru      buf->buffer = xrealloc (buf->buffer, buf->size);
116525Sru    }
116525Sru  buf->buffer[buf->length - 1] = c;
116525Sru  buf->buffer[buf->length] = 0;
116525Sru}
116525Sru
116525Sru/* Read the cascading style-sheet file FILENAME.  Write out any @import
116525Sru   commands, which must come first, by the definition of css.  If the
116525Sru   file contains any actual css code following the @imports, return it;
116525Sru   else return NULL.  */
116525Srustatic char *
146515Sruprocess_css_file (char *filename)
116525Sru{
146515Sru  int c;
146515Sru  int lastchar = 0;
116525Sru  FILE *f;
116525Sru  buffer_type *import_text = init_buffer ();
116525Sru  buffer_type *inline_text = init_buffer ();
116525Sru  unsigned lineno = 1;
116525Sru  enum { null_state, comment_state, import_state, inline_state } state
116525Sru    = null_state, prev_state;
116525Sru
146515Sru  prev_state = null_state;
146515Sru
116525Sru  /* read from stdin if `-' is the filename.  */
116525Sru  f = STREQ (filename, "-") ? stdin : fopen (filename, "r");
116525Sru  if (!f)
116525Sru    {
116525Sru      error (_("%s: could not open --css-file: %s"), progname, filename);
116525Sru      return NULL;
116525Sru    }
116525Sru
116525Sru  /* Read the file.  The @import statements must come at the beginning,
116525Sru     with only whitespace and comments allowed before any inline css code.  */
116525Sru  while ((c = getc (f)) >= 0)
116525Sru    {
116525Sru      if (c == '\n')
116525Sru        lineno++;
116525Sru
116525Sru      switch (state)
116525Sru        {
116525Sru        case null_state: /* between things */
116525Sru          if (c == '@')
146515Sru            { /* Only @import and @charset should switch into
146515Sru                 import_state, other @-commands, such as @media, should
146515Sru                 put us into inline_state.  I don't think any other css
146515Sru                 @-commands start with `i' or `c', although of course
146515Sru                 this will break when such a command is defined.  */
146515Sru              int nextchar = getc (f);
146515Sru              if (nextchar == 'i' || nextchar == 'c')
146515Sru                {
146515Sru                  append_char (import_text, c);
146515Sru                  state = import_state;
146515Sru                }
146515Sru              else
146515Sru                {
146515Sru                  ungetc (nextchar, f);  /* wasn't an @import */
146515Sru                  state = inline_state;
146515Sru                }
116525Sru            }
116525Sru          else if (c == '/')
116525Sru            { /* possible start of a comment */
116525Sru              int nextchar = getc (f);
116525Sru              if (nextchar == '*')
116525Sru                state = comment_state;
116525Sru              else
116525Sru                {
116525Sru                  ungetc (nextchar, f); /* wasn't a comment */
116525Sru                  state = inline_state;
116525Sru                }
116525Sru            }
116525Sru          else if (isspace (c))
116525Sru            ; /* skip whitespace; maybe should use c_isspace?  */
116525Sru
116525Sru          else
116525Sru            /* not an @import, not a comment, not whitespace: we must
116525Sru               have started the inline text.  */
116525Sru            state = inline_state;
116525Sru
116525Sru          if (state == inline_state)
116525Sru            append_char (inline_text, c);
116525Sru
116525Sru          if (state != null_state)
116525Sru            prev_state = null_state;
116525Sru          break;
116525Sru
116525Sru        case comment_state:
116525Sru          if (c == '/' && lastchar == '*')
116525Sru            state = prev_state;  /* end of comment */
116525Sru          break;  /* else ignore this comment char */
116525Sru
116525Sru        case import_state:
116525Sru          append_char (import_text, c);  /* include this import char */
116525Sru          if (c == ';')
116525Sru            { /* done with @import */
116525Sru              append_char (import_text, '\n');  /* make the output nice */
116525Sru              state = null_state;
116525Sru              prev_state = import_state;
116525Sru            }
116525Sru          break;
116525Sru
116525Sru        case inline_state:
116525Sru          /* No harm in writing out comments, so don't bother parsing
116525Sru             them out, just append everything.  */
116525Sru          append_char (inline_text, c);
116525Sru          break;
116525Sru        }
116525Sru
116525Sru      lastchar = c;
116525Sru    }
116525Sru
116525Sru  /* Reached the end of the file.  We should not be still in a comment.  */
116525Sru  if (state == comment_state)
116525Sru    warning (_("%s:%d: --css-file ended in comment"), filename, lineno);
116525Sru
116525Sru  /* Write the @import text, if any.  */
116525Sru  if (import_text->buffer)
116525Sru    {
116525Sru      add_word (import_text->buffer);
116525Sru      free (import_text->buffer);
116525Sru      free (import_text);
116525Sru    }
116525Sru
116525Sru  /* We're wasting the buffer struct memory, but so what.  */
116525Sru  return inline_text->buffer;
116525Sru}
146515Sru
146515SruHSTACK *htmlstack = NULL;
116525Sru
146515Sru/* See html.h.  */
146515Sruint html_output_head_p = 0;
146515Sruint html_title_written = 0;
116525Sru
146515Sruvoid
146515Sruhtml_output_head (void)
146515Sru{
146515Sru  static const char *html_title = NULL;
146515Sru  char *encoding;
146515Sru
146515Sru  if (html_output_head_p)
146515Sru    return;
146515Sru  html_output_head_p = 1;
146515Sru
146515Sru  encoding = current_document_encoding ();
146515Sru
146515Sru  /* The <title> should not have markup, so use text_expansion.  */
146515Sru  if (!html_title)
146515Sru    html_title = escape_string (title ?
146515Sru        text_expansion (title) : (char *) _("Untitled"));
146515Sru
146515Sru  /* Make sure this is the very first string of the output document.  */
146515Sru  output_paragraph_offset = 0;
146515Sru
146515Sru  add_html_block_elt_args ("<html lang=\"%s\">\n<head>\n",
146515Sru      language_table[language_code].abbrev);
146515Sru
146515Sru  /* When splitting, add current node's name to title if it's available and not
146515Sru     Top.  */
146515Sru  if (splitting && current_node && !STREQ (current_node, "Top"))
146515Sru    add_word_args ("<title>%s - %s</title>\n",
146515Sru        escape_string (xstrdup (current_node)), html_title);
146515Sru  else
146515Sru    add_word_args ("<title>%s</title>\n",  html_title);
146515Sru
146515Sru  add_word ("<meta http-equiv=\"Content-Type\" content=\"text/html");
146515Sru  if (encoding && *encoding)
146515Sru    add_word_args ("; charset=%s", encoding);
146515Sru
146515Sru  add_word ("\">\n");
146515Sru
146515Sru  if (!document_description)
146515Sru    document_description = html_title;
146515Sru
146515Sru  add_word_args ("<meta name=\"description\" content=\"%s\">\n",
146515Sru                 document_description);
146515Sru  add_word_args ("<meta name=\"generator\" content=\"makeinfo %s\">\n",
146515Sru                 VERSION);
146515Sru
146515Sru  /* Navigation bar links.  */
146515Sru  if (!splitting)
146515Sru    add_word ("<link title=\"Top\" rel=\"top\" href=\"#Top\">\n");
146515Sru  else if (tag_table)
146515Sru    {
146515Sru      /* Always put a top link.  */
146515Sru      add_word ("<link title=\"Top\" rel=\"start\" href=\"index.html#Top\">\n");
146515Sru
146515Sru      /* We already have a top link, avoid duplication.  */
146515Sru      if (tag_table->up && !STREQ (tag_table->up, "Top"))
146515Sru        add_link (tag_table->up, "rel=\"up\"");
146515Sru
146515Sru      if (tag_table->prev)
146515Sru        add_link (tag_table->prev, "rel=\"prev\"");
146515Sru
146515Sru      if (tag_table->next)
146515Sru        add_link (tag_table->next, "rel=\"next\"");
146515Sru
146515Sru      /* fixxme: Look for a way to put links to various indices in the
146515Sru         document.  Also possible candidates to be added here are First and
146515Sru         Last links.  */
146515Sru    }
146515Sru  else
146515Sru    {
146515Sru      /* We are splitting, but we neither have a tag_table.  So this must be
146515Sru         index.html.  So put a link to Top. */
146515Sru      add_word ("<link title=\"Top\" rel=\"start\" href=\"#Top\">\n");
146515Sru    }
146515Sru
146515Sru  add_word ("<link href=\"http://www.gnu.org/software/texinfo/\" \
146515Srurel=\"generator-home\" title=\"Texinfo Homepage\">\n");
146515Sru
146515Sru  if (copying_text)
146515Sru    { /* It is not ideal that we include the html markup here within
146515Sru         <head>, so we use text_expansion.  */
146515Sru      insert_string ("<!--\n");
146515Sru      insert_string (text_expansion (copying_text));
146515Sru      insert_string ("-->\n");
146515Sru    }
146515Sru
146515Sru  /* Put the style definitions in a comment for the sake of browsers
146515Sru     that don't support <style>.  */
146515Sru  add_word ("<meta http-equiv=\"Content-Style-Type\" content=\"text/css\">\n");
146515Sru  add_word ("<style type=\"text/css\"><!--\n");
146515Sru
146515Sru  {
146515Sru    char *css_inline = NULL;
146515Sru
146515Sru    if (css_include)
146515Sru      /* This writes out any @import commands from the --css-file,
146515Sru         and returns any actual css code following the imports.  */
146515Sru      css_inline = process_css_file (css_include);
146515Sru
146515Sru    /* This seems cleaner than adding <br>'s at the end of each line for
146515Sru       these "roman" displays.  It's hardly the end of the world if the
146515Sru       browser doesn't do <style>s, in any case; they'll just come out in
146515Sru       typewriter.  */
146515Sru#define CSS_FONT_INHERIT "font-family:inherit"
146515Sru    add_word_args ("  pre.display { %s }\n", CSS_FONT_INHERIT);
146515Sru    add_word_args ("  pre.format  { %s }\n", CSS_FONT_INHERIT);
146515Sru
146515Sru    /* Alternatively, we could do <font size=-1> in insertion.c, but this
146515Sru       way makes it easier to override.  */
146515Sru#define CSS_FONT_SMALLER "font-size:smaller"
146515Sru    add_word_args ("  pre.smalldisplay { %s; %s }\n", CSS_FONT_INHERIT,
146515Sru                   CSS_FONT_SMALLER);
146515Sru    add_word_args ("  pre.smallformat  { %s; %s }\n", CSS_FONT_INHERIT,
146515Sru                   CSS_FONT_SMALLER);
146515Sru    add_word_args ("  pre.smallexample { %s }\n", CSS_FONT_SMALLER);
146515Sru    add_word_args ("  pre.smalllisp    { %s }\n", CSS_FONT_SMALLER);
146515Sru
146515Sru    /* Since HTML doesn't have a sc element, we use span with a bit of
146515Sru       CSS spice instead.  */
146515Sru#define CSS_FONT_SMALL_CAPS "font-variant:small-caps"
146515Sru    add_word_args ("  span.sc    { %s }\n", CSS_FONT_SMALL_CAPS);
146515Sru
146515Sru    /* Roman (default) font class, closest we can come.  */
146515Sru#define CSS_FONT_ROMAN "font-family:serif; font-weight:normal;"
146515Sru    add_word_args ("  span.roman { %s } \n", CSS_FONT_ROMAN);
146515Sru
146515Sru    /* Sans serif font class.  */
146515Sru#define CSS_FONT_SANSSERIF "font-family:sans-serif; font-weight:normal;"
146515Sru    add_word_args ("  span.sansserif { %s } \n", CSS_FONT_SANSSERIF);
146515Sru
146515Sru    /* Write out any css code from the user's --css-file.  */
146515Sru    if (css_inline)
146515Sru      insert_string (css_inline);
146515Sru
146515Sru    add_word ("--></style>\n");
146515Sru  }
146515Sru
146515Sru  add_word ("</head>\n<body>\n");
146515Sru
146515Sru  if (title && !html_title_written && titlepage_cmd_present)
146515Sru    {
146515Sru      add_word_args ("<h1 class=\"settitle\">%s</h1>\n", html_title);
146515Sru      html_title_written = 1;
146515Sru    }
146515Sru
146515Sru  free (encoding);
146515Sru}
116525Sru
/* Return STRING with the HTML special characters `"', `&', `<' and `>'
   replaced by `&quot;', `&amp;', `&lt;' and `&gt;'.  If STRING has none
   of them it is returned as is.  Otherwise the result is newly
   allocated and STRING itself is freed, so STRING must be heap memory
   whenever it might need escaping.  */
char *
escape_string (char *string)
{
  const char *in;
  char *escaped;
  char *out;
  int scanned = 0;  /* characters looked at, terminator included */
  int needed = 0;   /* bytes the escaped copy takes, terminator included */

  /* First pass: measure.  The terminating null goes through the loop
     as well, so both counters include it.  */
  for (in = string; ; in++)
    {
      if (*in == '"')
        needed += 6;            /* `&quot;' */
      else if (*in == '&')
        needed += 5;            /* `&amp;' */
      else if (*in == '<' || *in == '>')
        needed += 4;            /* `&lt;', `&gt;' */
      else
        needed++;

      scanned++;
      if (!*in)
        break;
    }

  /* Equal counts mean nothing has to be replaced.  */
  if (needed == scanned)
    return string;

  /* Second pass: copy, substituting entities; the terminator is copied
     by the same loop.  */
  escaped = xmalloc (needed);
  out = escaped;
  for (in = string; ; in++)
    {
      const char *entity = NULL;

      if (*in == '"')
        entity = "&quot;";
      else if (*in == '&')
        entity = "&amp;";
      else if (*in == '<')
        entity = "&lt;";
      else if (*in == '>')
        entity = "&gt;";

      if (entity)
        {
          size_t entity_len = strlen (entity);

          memcpy (out, entity, entity_len);
          out += entity_len;
        }
      else
        *out++ = *in;

      if (!*in)
        break;
    }

  free (string);
  return escaped;
}
114472Sru
114472Sru/* Save current tag.  */
146515Srustatic void
146515Srupush_tag (char *tag, char *attribs)
114472Sru{
114472Sru  HSTACK *newstack = xmalloc (sizeof (HSTACK));
56160Sru
114472Sru  newstack->tag = tag;
146515Sru  newstack->attribs = xstrdup (attribs);
114472Sru  newstack->next = htmlstack;
114472Sru  htmlstack = newstack;
114472Sru}
114472Sru
114472Sru/* Get last tag.  */
146515Srustatic void
146515Srupop_tag (void)
114472Sru{
114472Sru  HSTACK *tos = htmlstack;
114472Sru
114472Sru  if (!tos)
114472Sru    {
114472Sru      line_error (_("[unexpected] no html tag to pop"));
114472Sru      return;
114472Sru    }
114472Sru
146515Sru  free (htmlstack->attribs);
146515Sru
114472Sru  htmlstack = htmlstack->next;
114472Sru  free (tos);
114472Sru}
114472Sru
146515Sru/* Check if tag is an empty or a whitespace only element.
146515Sru   If so, remove it, keeping whitespace intact.  */
146515Sruint
146515Srurollback_empty_tag (char *tag)
146515Sru{
146515Sru  int check_position = output_paragraph_offset;
146515Sru  int taglen = strlen (tag);
146515Sru  int rollback_happened = 0;
146515Sru  char *contents = "";
146515Sru  char *contents_canon_white = "";
146515Sru
146515Sru  /* If output_paragraph is empty, we cannot rollback :-\  */
146515Sru  if (output_paragraph_offset <= 0)
146515Sru    return 0;
146515Sru
146515Sru  /* Find the end of the previous tag.  */
146515Sru  while (output_paragraph[check_position-1] != '>' && check_position > 0)
146515Sru    check_position--;
146515Sru
146515Sru  /* Save stuff between tag's end to output_paragraph's end.  */
146515Sru  if (check_position != output_paragraph_offset)
146515Sru    {
146515Sru      contents = xmalloc (output_paragraph_offset - check_position + 1);
146515Sru      memcpy (contents, output_paragraph + check_position,
146515Sru          output_paragraph_offset - check_position);
146515Sru
146515Sru      contents[output_paragraph_offset - check_position] = '\0';
146515Sru
146515Sru      contents_canon_white = xstrdup (contents);
146515Sru      canon_white (contents_canon_white);
146515Sru    }
146515Sru
146515Sru  /* Find the start of the previous tag.  */
146515Sru  while (output_paragraph[check_position-1] != '<' && check_position > 0)
146515Sru    check_position--;
146515Sru
146515Sru  /* Check to see if this is the tag.  */
146515Sru  if (strncmp ((char *) output_paragraph + check_position, tag, taglen) == 0
146515Sru      && (whitespace (output_paragraph[check_position + taglen])
146515Sru          || output_paragraph[check_position + taglen] == '>'))
146515Sru    {
146515Sru      if (!contents_canon_white || !*contents_canon_white)
146515Sru        {
146515Sru          /* Empty content after whitespace removal, so roll it back.  */
146515Sru          output_paragraph_offset = check_position - 1;
146515Sru          rollback_happened = 1;
146515Sru
146515Sru          /* Original contents may not be empty (whitespace.)  */
146515Sru          if (contents && *contents)
146515Sru            {
146515Sru              insert_string (contents);
146515Sru              free (contents);
146515Sru            }
146515Sru        }
146515Sru    }
146515Sru
146515Sru  return rollback_happened;
146515Sru}
146515Sru
56160Sru/* Open or close TAG according to START_OR_END. */
56160Sruvoid
146515Sru#if defined (VA_FPRINTF) && __STDC__
146515Sruinsert_html_tag_with_attribute (int start_or_end, char *tag, char *format, ...)
146515Sru#else
146515Sruinsert_html_tag_with_attribute (start_or_end, tag, format, va_alist)
56160Sru     int start_or_end;
56160Sru     char *tag;
146515Sru     char *format;
146515Sru     va_dcl
146515Sru#endif
56160Sru{
114472Sru  char *old_tag = NULL;
146515Sru  char *old_attribs = NULL;
146515Sru  char formatted_attribs[2000]; /* xx no fixed limits */
114472Sru  int do_return = 0;
146515Sru  extern int in_html_elt;
114472Sru
56160Sru  if (start_or_end != START)
116525Sru    pop_tag ();
114472Sru
114472Sru  if (htmlstack)
146515Sru    {
146515Sru      old_tag = htmlstack->tag;
146515Sru      old_attribs = htmlstack->attribs;
146515Sru    }
146515Sru
146515Sru  if (format)
146515Sru    {
146515Sru#ifdef VA_SPRINTF
146515Sru      va_list ap;
146515Sru#endif
114472Sru
146515Sru      VA_START (ap, format);
146515Sru#ifdef VA_SPRINTF
146515Sru      VA_SPRINTF (formatted_attribs, format, ap);
146515Sru#else
146515Sru      sprintf (formatted_attribs, format, a1, a2, a3, a4, a5, a6, a7, a8);
146515Sru#endif
146515Sru      va_end (ap);
146515Sru    }
146515Sru  else
146515Sru    formatted_attribs[0] = '\0';
146515Sru
146515Sru  /* Exception: can nest multiple spans.  */
114472Sru  if (htmlstack
146515Sru      && STREQ (htmlstack->tag, tag)
146515Sru      && !(STREQ (tag, "span") && STREQ (old_attribs, formatted_attribs)))
114472Sru    do_return = 1;
114472Sru
114472Sru  if (start_or_end == START)
146515Sru    push_tag (tag, formatted_attribs);
114472Sru
114472Sru  if (do_return)
114472Sru    return;
114472Sru
146515Sru  in_html_elt++;
146515Sru
114472Sru  /* texinfo.tex doesn't support more than one font attribute
114472Sru     at the same time.  */
146515Sru  if ((start_or_end == START) && old_tag && *old_tag
146515Sru      && !rollback_empty_tag (old_tag))
146515Sru    add_word_args ("</%s>", old_tag);
114472Sru
114472Sru  if (*tag)
114472Sru    {
146515Sru      if (start_or_end == START)
146515Sru        add_word_args (format ? "<%s %s>" : "<%s>", tag, formatted_attribs);
146515Sru      else if (!rollback_empty_tag (tag))
146515Sru        /* Insert close tag only if we didn't rollback,
146515Sru           in which case the opening tag is removed.  */
146515Sru        add_word_args ("</%s>", tag);
114472Sru    }
114472Sru
114472Sru  if ((start_or_end != START) && old_tag && *old_tag)
146515Sru    add_word_args (strlen (old_attribs) > 0 ? "<%s %s>" : "<%s>",
146515Sru        old_tag, old_attribs);
146515Sru
146515Sru  in_html_elt--;
56160Sru}
56160Sru
/* Open or close the HTML element TAG according to START_OR_END, with
   no attributes: a convenience wrapper that passes a NULL format to
   insert_html_tag_with_attribute.  */
void
insert_html_tag (int start_or_end, char *tag)
{
  insert_html_tag_with_attribute (start_or_end, tag, NULL);
}
116525Sru
/* Output an HTML <link> element whose href points at NODENAME and
   whose title is NODENAME, with the string ATTRIBUTES inserted as
   extra attributes.  Does nothing if NODENAME is NULL.

   The title is passed through escape_string so that a node name
   containing `"', `&', `<' or `>' cannot break out of the attribute
   value.  */
void
add_link (char *nodename, char *attributes)
{
  char *title;

  if (!nodename)
    return;

  add_html_elt ("<link ");
  add_word_args ("%s", attributes);
  add_word_args (" href=\"");
  add_anchor_name (nodename, 1);

  /* Copy only now, so the title sees NODENAME exactly as it is after
     add_anchor_name; escape_string may free the copy and return a new
     string, and either way the result is ours to free.  */
  title = escape_string (xstrdup (nodename));
  add_word_args ("\" title=\"%s\">\n", title);
  free (title);
}
56160Sru
/* Output NAME with characters escaped as appropriate for an anchor
   name.  NAME is first passed to canon_white, which modifies it in
   place.  Whitespace characters are always output as `-'.

   If OLD is zero, use our _00hh convention: characters that are not
   URL-safe become `_00' followed by their hexadecimal code, and `g_t'
   is output first when NAME does not begin with an ASCII letter.  (See
   the manual for details on the new scheme.)

   If OLD is nonzero, generate the node name with the 4.6-and-earlier
   convention of %hh (and more special characters output as-is, notably
   - and *).  This is only so that external references to old names can
   still work with HTML generated by the new makeinfo; the gcc folks
   needed this.  Our own HTML does not refer to these names.  */

void
add_escaped_anchor_name (char *name, int old)
{
  static const char ascii_letters[] =
    "abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ";
  char *p;

  canon_white (name);

  /* XHTML does not allow anything but an ASCII letter to start an
     identifier.  Therefore kludge in this constant string if we
     have a nonletter.  */
  if (!old && !strchr (ascii_letters, *name))
    add_word ("g_t");

  for (p = name; *p; p++)
    {
      if (cr_or_whitespace (*p))
        {
          add_char ('-');
          continue;
        }

      /* Characters that are safe under the convention in use are
         output unchanged.  */
      if (URL_SAFE_CHAR (*p) || (old && OLD_URL_SAFE_CHAR (*p)))
        {
          add_char (*p);
          continue;
        }

      /* Cast so characters with the high bit set are treated as >128,
         for example o-umlaut should be 246, not -10.  */
      if (old)
        add_word_args ("%%%x", (unsigned char) *p);
      else
        add_word_args ("_00%x", (unsigned char) *p);
    }
}
56160Sru
56160Sru/* Insert the text for the name of a reference in an HTML anchor
146515Sru   appropriate for NODENAME.
146515Sru
146515Sru   If HREF is zero, generate text for name= in the new node name
146515Sru     conversion convention.
146515Sru   If HREF is negative, generate text for name= in the old convention.
146515Sru   If HREF is positive, generate the name for an href= attribute, i.e.,
146515Sru     including the `#' if it's an internal reference.   */
56160Sruvoid
146515Sruadd_anchor_name (char *nodename, int href)
56160Sru{
146515Sru  if (href > 0)
93139Sru    {
93139Sru      if (splitting)
93139Sru	add_url_name (nodename, href);
93139Sru      add_char ('#');
93139Sru    }
93139Sru  /* Always add NODENAME, so that the reference would pinpoint the
93139Sru     exact node on its file.  This is so several nodes could share the
93139Sru     same file, in case of file-name clashes, but also for more
93139Sru     accurate browser positioning.  */
93139Sru  if (strcasecmp (nodename, "(dir)") == 0)
93139Sru    /* Strip the parens, but keep the original letter-case.  */
93139Sru    add_word_args ("%.3s", nodename + 1);
146515Sru  else if (strcasecmp (nodename, "top") == 0)
146515Sru    add_word ("Top");
93139Sru  else
146515Sru    add_escaped_anchor_name (nodename, href < 0);
93139Sru}
56160Sru
/* Insert the text for the name of a reference in an HTML url,
   appropriate for NODENAME.  This simply passes NODENAME and HREF on
   to add_nodename_to_filename.  */
void
add_url_name (char *nodename, int href)
{
  add_nodename_to_filename (nodename, href);
}
93139Sru
146515Sru/* Convert non [A-Za-z0-9] to _00xx, where xx means the hexadecimal
146515Sru   representation of the ASCII character.  Also convert spaces and
146515Sru   newlines to dashes.  */
146515Srustatic void
146515Srufix_filename (char *filename)
146515Sru{
146515Sru  int i;
146515Sru  int len = strlen (filename);
146515Sru  char *oldname = xstrdup (filename);
93139Sru
146515Sru  *filename = '\0';
93139Sru
146515Sru  for (i = 0; i < len; i++)
93139Sru    {
146515Sru      if (cr_or_whitespace (oldname[i]))
146515Sru        strcat (filename, "-");
146515Sru      else if (URL_SAFE_CHAR (oldname[i]))
146515Sru        strncat (filename, (char *) oldname + i, 1);
146515Sru      else
146515Sru        {
146515Sru          char *hexchar = xmalloc (6 * sizeof (char));
146515Sru          sprintf (hexchar, "_00%x", (unsigned char) oldname[i]);
146515Sru          strcat (filename, hexchar);
146515Sru          free (hexchar);
146515Sru        }
146515Sru
146515Sru      /* Check if we are nearing boundaries.  */
146515Sru      if (strlen (filename) >= PATH_MAX - 20)
146515Sru        break;
93139Sru    }
146515Sru
146515Sru  free (oldname);
93139Sru}
93139Sru
93139Sru/* As we can't look-up a (forward-referenced) nodes' html filename
93139Sru   from the tentry, we take the easy way out.  We assume that
93139Sru   nodenames are unique, and generate the html filename from the
93139Sru   nodename, that's always known.  */
93139Srustatic char *
146515Srunodename_to_filename_1 (char *nodename, int href)
93139Sru{
93139Sru  char *p;
93139Sru  char *filename;
93139Sru  char dirname[PATH_MAX];
93139Sru
93139Sru  if (strcasecmp (nodename, "Top") == 0)
93139Sru    {
93139Sru      /* We want to convert references to the Top node into
93139Sru	 "index.html#Top".  */
93139Sru      if (href)
93139Sru	filename = xstrdup ("index.html"); /* "#Top" is added by our callers */
93139Sru      else
93139Sru	filename = xstrdup ("Top");
93139Sru    }
93139Sru  else if (strcasecmp (nodename, "(dir)") == 0)
93139Sru    /* We want to convert references to the (dir) node into
93139Sru       "../index.html".  */
93139Sru    filename = xstrdup ("../index.html");
93139Sru  else
93139Sru    {
93139Sru      filename = xmalloc (PATH_MAX);
93139Sru      dirname[0] = '\0';
93139Sru      *filename = '\0';
93139Sru
93139Sru      /* Check for external reference: ``(info-document)node-name''
93139Sru	 Assume this node lives at: ``../info-document/node-name.html''
93139Sru
93139Sru	 We need to handle the special case (sigh): ``(info-document)'',
93139Sru	 ie, an external top-node, which should translate to:
93139Sru	 ``../info-document/info-document.html'' */
93139Sru
93139Sru      p = nodename;
93139Sru      if (*nodename == '(')
93139Sru	{
93139Sru	  int length;
93139Sru
93139Sru	  p = strchr (nodename, ')');
93139Sru	  if (p == NULL)
93139Sru	    {
114472Sru	      line_error (_("[unexpected] invalid node name: `%s'"), nodename);
114472Sru	      xexit (1);
93139Sru	    }
93139Sru
93139Sru	  length = p - nodename - 1;
93139Sru	  if (length > 5 &&
93139Sru	      FILENAME_CMPN (p - 5, ".info", 5) == 0)
93139Sru	    length -= 5;
93139Sru	  /* This is for DOS, and also for Windows and GNU/Linux
93139Sru	     systems that might have Info files copied from a DOS 8+3
93139Sru	     filesystem.  */
93139Sru	  if (length > 4 &&
93139Sru	      FILENAME_CMPN (p - 4, ".inf", 4) == 0)
93139Sru	    length -= 4;
93139Sru	  strcpy (filename, "../");
93139Sru	  strncpy (dirname, nodename + 1, length);
93139Sru	  *(dirname + length) = '\0';
93139Sru	  fix_filename (dirname);
93139Sru	  strcat (filename, dirname);
93139Sru	  strcat (filename, "/");
93139Sru	  p++;
93139Sru	}
93139Sru
93139Sru      /* In the case of just (info-document), there will be nothing
93139Sru	 remaining, and we will refer to ../info-document/, which will
93139Sru	 work fine.  */
93139Sru      strcat (filename, p);
93139Sru      if (*p)
93139Sru	{
93139Sru	  /* Hmm */
93139Sru	  fix_filename (filename + strlen (filename) - strlen (p));
93139Sru	  strcat (filename, ".html");
93139Sru	}
93139Sru    }
93139Sru
93139Sru  /* Produce a file name suitable for the underlying filesystem.  */
93139Sru  normalize_filename (filename);
93139Sru
93139Sru#if 0
93139Sru  /* We add ``#Nodified-filename'' anchor to external references to be
93139Sru     prepared for non-split HTML support.  Maybe drop this. */
93139Sru  if (href && *dirname)
93139Sru    {
93139Sru      strcat (filename, "#");
93139Sru      strcat (filename, p);
93139Sru      /* Hmm, again */
93139Sru      fix_filename (filename + strlen (filename) - strlen (p));
93139Sru    }
93139Sru#endif
93139Sru
93139Sru  return filename;
93139Sru}
93139Sru
/* Output the html file name for NODENAME.  The intent is to do so only
   if necessary, ie, if current filename != filename of node, but for
   now there is no such check: the file name is always output.  HREF is
   passed on to nodename_to_filename_1.  */
void
add_nodename_to_filename (char *nodename, int href)
{
  char *node_file = nodename_to_filename_1 (nodename, href);

  add_word (node_file);
  free (node_file);
}
93139Sru
/* Return, in newly allocated memory, the html file name for NODENAME
   as it should appear in a link.  */
char *
nodename_to_filename (char *nodename)
{
  /* The callers of nodename_to_filename use the result to produce
     <a href=, so call nodename_to_filename_1 with last arg non-zero.  */
  const int for_href = 1;

  return nodename_to_filename_1 (nodename, for_href);
}