tta/perl/Texinfo/Convert/Converter.pm - texinfo - Git at Google

 # Converter.pm: Common code for Converters modules loader and functions not
 #               in XS interface
 #
 # Copyright 2011-2026 Free Software Foundation, Inc.
 #
 # This program is free software; you can redistribute it and/or modify
 # it under the terms of the GNU General Public License as published by
 # the Free Software Foundation; either version 3 of the License,
 # or (at your option) any later version.
 #
 # This program is distributed in the hope that it will be useful,
 # but WITHOUT ANY WARRANTY; without even the implied warranty of
 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 # GNU General Public License for more details.
 #
 # You should have received a copy of the GNU General Public License
 # along with this program.  If not, see <https://www.gnu.org/licenses/>.
 #
 # Original author: Patrice Dumas <pertusus@free.fr>

 # ALTIMP C/convert/converter.c

 package Texinfo::Convert::Converter;

 use 5.006;
 use strict;

 # To check if there is no erroneous autovivification
 #no autovivification qw(fetch delete exists store strict);

 # for fileparse
 use File::Basename;
 # for file names portability
 use Encode qw(decode);
 #use Data::Dumper;

 use Carp qw(cluck confess);

 eval { require Devel::Refcount; Devel::Refcount->import(); };
 eval { require Devel::FindRef; Devel::FindRef->import(); };

 my $devel_findref_loading_error = $@;

 eval { require Devel::Cycle; Devel::Cycle->import(); };

 use Texinfo::XSLoader;

 use Texinfo::Options;
 use Texinfo::CommandsValues;
 use Texinfo::UnicodeData;

 use Texinfo::TreeElement;

 use Texinfo::Common;

 use Texinfo::ManipulateTree;

 use Texinfo::Convert::Utils;
 use Texinfo::Convert::Unicode;
 use Texinfo::Convert::Texinfo;
 use Texinfo::Convert::NodeNameNormalization;
 use Texinfo::OutputUnits;

 use Texinfo::Translations;

 require Exporter;
 our @ISA = qw(Exporter);

 our @EXPORT_OK = qw(
 xml_protect_text
 xml_comment
 xml_accent
 xml_accents
 );

 our $VERSION = '7.3dev';

 BEGIN {
   my $shared_library_name = "ConvertConverterXS";
   if (!Texinfo::XSLoader::XS_convert_enabled()) {
     undef $shared_library_name;
   }
   Texinfo::XSLoader::init (
     "Texinfo::Convert::Converter",
     "Texinfo::Convert::ConverterNonXS",
     $shared_library_name,
     undef,
     ['texinfo', 'texinfoxs', 'texinfo-convert', 'texinfo-convertxs'],
   );
 }

 # values for integer and string options in code generated from
 # Texinfo/Convert/converters_defaults.txt
 my $regular_defaults
   = Texinfo::Options::get_regular_options('converter_defaults');

 my %defaults = %$regular_defaults;

 # For translation of in document string.
 if (0) {
   my $self;
   # TRANSLATORS: expansion of @error{} as Texinfo code
   $self->cdt('error@arrow{}');
 }

 our %default_args_code_style = (
   'email' => [1],
   'anchor' => [1],
   'namedanchor' => [1],
   'uref' => [1],
   'url' => [1],
   'math' => [1],
   'inforef' => [1,undef,1],
   'image' => [1, 1, 1, undef, 1],
 # and type?
   'float' => [1],
 );

 foreach my $code_style_command (keys(%Texinfo::Commands::brace_code_commands)) {
   $default_args_code_style{$code_style_command} = [1];
 }
 foreach my $ref_cmd ('pxref', 'xref', 'ref') {
   $default_args_code_style{$ref_cmd} = [1, undef, undef, 1];
 }

 ################################################################
 # converter API

 # convert_tree() and convert() should be implemented in converters.
 # Except for very specific converters, output() should also be
 # implemented by Converters.  The simple implementation of
 # convert_output_unit() below is likely to be ok for most converters.

 # Functions that should be defined in specific converters
 sub converter_defaults($;$) {
   return \%defaults;
 }

 # should be redefined by specific converters
 sub converter_initialize($) {
 }

 sub conversion_initialization($;$) {
   my ($converter, $document) = @_;

   if (defined($document)) {
     $converter->set_document($document);
   }
 }

 sub conversion_finalization($) {
   #my $converter = shift;
 }

 sub output_internal_links($) {
   my $self = shift;

   return undef;
 }

 # this function is designed so as to be used in specific Converters
 # and not redefined.
 sub converter($;$) {
   my ($class, $conf) = @_;

   my $converter = {};

   bless $converter, $class;

   my $format_defaults = $converter->converter_defaults($conf);

   _generic_converter_init($converter, $format_defaults, $conf);

   $converter->converter_initialize();

   return $converter;
 }

 sub convert_output_unit($$) {
   my ($self, $output_unit) = @_;

   my $result = '';
   foreach my $element (@{$output_unit->{'unit_contents'}}) {
     $result .= $self->convert_tree($element);
   }
   return $result;
 }

 # should be redefined by specific converters
 sub conversion_output_begin($;$$) {
   my ($self, $output_file, $output_filename) = @_;

   return '';
 }

 sub conversion_output_end($) {
   my $self = shift;

   return '';
 }

 sub output_tree($$;$) {
   my ($self, $document, $tree_handle_only) = @_;

   $self->conversion_initialization($document);

   # to avoid passing undef to XS
   $tree_handle_only = 0 unless (defined($tree_handle_only));

   my $root = $document->tree($tree_handle_only);

   if (ref($root) eq 'HASH') {
     confess("Converter output_tree unblessed root\n");
   }

   my ($output_file, $destination_directory, $output_filename)
     = $self->determine_files_and_directory(
                               $self->get_conf('TEXINFO_OUTPUT_FORMAT'));

   my ($encoded_destination_directory, $dir_encoding)
     = $self->encoded_output_file_name($destination_directory);
   my $succeeded
     = $self->create_destination_directory($encoded_destination_directory,
                                           $destination_directory);
   unless ($succeeded) {
     $self->conversion_finalization();
     return undef;
   }

   my $fh;
   my $encoded_output_file;
   if ($output_file ne '') {
     my $path_encoding;
     ($encoded_output_file, $path_encoding)
       = $self->encoded_output_file_name($output_file);
     my $error_message;
     # the third return information, set if the file has already been used
     # in this files_information is not checked as this cannot happen.
     ($fh, $error_message) = Texinfo::Convert::Utils::output_files_open_out(
                               $self->output_files_information(),
                               $encoded_output_file, undef,
                               $self->get_conf('OUTPUT_ENCODING_NAME'));
     if (!defined($fh)) {
       $self->converter_document_error(
            sprintf(__("could not open %s for writing: %s"),
                                     $output_file, $error_message));
       $self->conversion_finalization();
       return undef;
     }
   }

   my $output_beginning
     = $self->conversion_output_begin($output_file, $output_filename);

   my $result = '';
   $result .= $self->write_or_return($output_beginning, $fh);
   $result .= $self->write_or_return($self->convert_tree($root), $fh);

   my $output_end = $self->conversion_output_end();

   $result .= $self->write_or_return($output_end, $fh);

   # Do not close STDOUT now such that the file descriptor is not reused
   # by open, which uses the lowest-numbered file descriptor not open,
   # for another filehandle.  Closing STDOUT is handled by the caller.
   if (defined($fh) and $output_file ne '-') {
     Texinfo::Convert::Utils::output_files_register_closed(
                   $self->output_files_information(), $encoded_output_file);
     if (!close ($fh)) {
       $self->converter_document_error(
             sprintf(__("error on closing %s: %s"),
                                     $output_file, $!));
     }
   }
   $self->conversion_finalization();
   return $result;
 }

 # Only called by pure Perl converters.  Allows to retrieve later on the
 # output units lists and the output units.
 # No similar C/XS code needed, as in C the units are necessarily registered
 # for memory management and available from the document or converter.
 # TODO document
 sub register_output_units_lists($$) {
   my ($self, $output_units_lists) = @_;

   return unless defined($output_units_lists);

   foreach my $output_unit_list (@$output_units_lists) {
     push @{$self->{'output_units_lists'}}, $output_unit_list
       unless(!defined($output_unit_list));
   }
 }

 # There is no XS override. The output units lists returned are the
 # output units registered by pure Perl converters.
 #
 # There should not be any need to access output units lists for output
 # units created in C and built to Perl, as all the codes for output
 # units management are available from XS and called from there.
 # (If access to those output units is nevertheless needed, for example
 # for debugging, there is a separate function that only returns output
 # units lists of output units created in C only, XS_get_output_units_lists.)
 sub get_output_units_lists($) {
   my $self = shift;

   return $self->{'output_units_lists'};
 }

 # should be redefined by converters if needed
 sub converter_release_output_units($) {
   my $self = shift;
 }

 my $output_unit_SV_target_count = 2;
 my $output_unit_object_target_count = 1;

 # ALTIMP convert/converter.c destroy_converter_output_units
 # Also called from C.
 sub perl_converter_remove_output_units($) {
   my $self = shift;

   # call format specific method
   $self->converter_release_output_units();

   # Pure Perl converters register the output units in converter, not
   # C/XS converters.
   # For a C/XS converter, we go through the C data output units lists
   # and remove references to output units Perl data for each of the output
   # units, in a separate code called through converter_remove_output_units
   # XS interface.
   my $output_units_lists = $self->get_output_units_lists();

   if (defined($output_units_lists)) {
     my $check_output_units_references = 0;
     my $test_level = $self->get_conf('TEST');
     $check_output_units_references = 1
       if (defined($test_level) and $test_level > 1);

     # need to go through all the output unit lists before checking
     # reference counts, as there could be cross references, in practice
     # associated_document_unit from associated special units
     # to output units.
     foreach my $output_units_list (@$output_units_lists) {
       Texinfo::OutputUnits::release_output_units_list($output_units_list);

       #find_cycle($output_units_list);
     }

     #if (1) {
     if ($check_output_units_references) {
       foreach my $output_units_list (@$output_units_lists) {
         foreach my $output_unit (@$output_units_list) {
           my $reference_count
            = Texinfo::ManipulateTree::SvREFCNT($output_unit,
                                                $output_unit_SV_target_count);
           my $object_count = Devel::Refcount::refcount($output_unit);
           # only one object count remaining corresponding to the last refcount
           # of the output unit.
           # Two references, the $output_unit variable and the reference in the
           # output_units_list array
           #if (1) {
           if ($reference_count != $output_unit_SV_target_count
               or $object_count != $output_unit_object_target_count) {
             my $findref_info;
             if ($devel_findref_loading_error) {
               $findref_info = '';
             } else {
               $findref_info = Devel::FindRef::track($output_unit)."\n";
             }
             my $message = "Output unit refcount ($reference_count, $object_count) != ".
                "($output_unit_SV_target_count, $output_unit_object_target_count)";
             warn "You found a bug: $message for $output_unit\n\n".$findref_info;
             # pass as warning to have t/*.t tests fail
             $self->converter_document_warn($message);
           }
         }
       }
     }

     # remove the output units lists to release the output units
     @$output_units_lists = ();
   }
 }

 # Should be redefined in converters if needed
 sub converter_destroy($) {
   my $self = shift;
 }

 # ALTIMP convert/converter.c free_converter
 # Also called from C program
 sub converter_perl_release($) {
   my $self = shift;

   # output format converter specific
   $self->converter_destroy();

   # generic
   delete $self->{'document'};
   delete $self->{'document_units'};
   delete $self->{'output_units_lists'};

   if (exists($self->{'convert_text_options'})) {
     delete $self->{'convert_text_options'}->{'converter'};
     # common translations cache
     delete $self->{'convert_text_options'}->{'current_lang_translations'};
   }

   if (exists($self->{'index_formatting_text_options'})) {
     delete $self->{'index_formatting_text_options'}->{'converter'};
   }

   # common translations cache
   delete $self->{'current_lang_translations'};
 }

 sub output_files_information($) {
   my $self = shift;

   return $self->{'output_files'};
 }


 # translations and languages

 sub cdt($$;$$) {
   my ($self, $string, $replaced_substrings, $translation_context) = @_;

   return Texinfo::Translations::gdt($string,
                                     $self->{'current_lang_translations'},
                                     $replaced_substrings,
                                     $self->get_conf('DEBUG'),
                                     $translation_context);
 }

 sub cdt_string($$;$$) {
   my ($self, $string, $replaced_substrings, $translation_context) = @_;

   return Texinfo::Translations::gdt_string($string,
                                     $self->{'current_lang_translations'},
                                     $replaced_substrings,
                                     $translation_context);
 }

 sub pcdt($$;$$) {
   my ($self, $translation_context, $string, $replaced_substrings) = @_;

   return $self->cdt($string, $replaced_substrings, $translation_context);
 }

 # TODO document
 sub converter_set_documentlanguage($$) {
   my ($self, $documentlanguage) = @_;

   my $lang_translation
     = Texinfo::Translations::set_translations_documentlanguage(
          $Texinfo::Translations::converters_translation_cache,
          $documentlanguage,
          $self->{'current_lang_translations'});

   $self->{'current_lang_translations'} = $lang_translation
          if (defined($lang_translation));
 }

 sub converter_set_documentscript($$) {
   my ($self, $documentscript) = @_;

   my $lang_translation
     = Texinfo::Translations::set_translations_documentscript(
          $Texinfo::Translations::converters_translation_cache,
          $documentscript,
          $self->{'current_lang_translations'});

   $self->{'current_lang_translations'} = $lang_translation
          if (defined($lang_translation));
 }

 sub converter_set_documentlanguagevariant($$) {
  my ($self, $documentlanguagevariant) = @_;

   my $lang_translation
     = Texinfo::Translations::set_translations_documentlanguagevariant(
          $Texinfo::Translations::converters_translation_cache,
          $documentlanguagevariant,
          $self->{'current_lang_translations'});

   $self->{'current_lang_translations'} = $lang_translation
          if (defined($lang_translation));
 }

 # language
 sub current_bcp47_locale($) {
   my $self = shift;

   if (!exists($self->{'current_lang_translations'})) {
     return '';
   }
   return $self->{'current_lang_translations'}->[0]->{'bcp47_locale'};
 }

 sub set_converter_preamble_language_commands($) {
   my $self = shift;

   # For now, the method is called at the beginning of output, so this
   # is not needed.  However, it is more consistent to do it
   # anyway
   $self->set_global_document_commands('before',
                    ['documentlanguage', 'documentscript']);

   if (exists($self->{'document'})) {
     my $document_info = $self->{'document'}->global_information();

     my $lang_translation
         = Texinfo::Translations::set_preamble_language_commands(
            $document_info->{'preamble_lang_cmd'},
            $Texinfo::Translations::converters_translation_cache,
            $self->get_conf('documentlanguage'),
            $self->get_conf('documentscript'));

     $self->{'current_lang_translations'} = $lang_translation
            if (defined($lang_translation));
   }
 }


 #####################################################################
 # Elements and output units file names
 #
 # - default file names setting for sectioning commands and nodes
 # - output units files API
 # - set_output_units_files, which uses both default file names setting
 #   and output units files API

 sub _id_to_filename($$) {
   my ($self, $id) = @_;

   my $basefilename_length = $self->get_conf('BASEFILENAME_LENGTH');
   if (defined($basefilename_length) and $basefilename_length >= 0) {
     return substr($id, 0, $basefilename_length);
   } else {
     return $id;
   }
 }

 sub normalized_sectioning_command_filename($$) {
   my ($self, $command, $no_unidecode) = @_;

   $no_unidecode = 1 if (defined($self->get_conf('USE_UNIDECODE'))
                         and !$self->get_conf('USE_UNIDECODE'));
   my $in_test;
   $in_test = 1 if ($self->get_conf('TEST'));

   my $label_element;
   if ($Texinfo::Commands::root_commands{$command->{'cmdname'}}) {
     # for root level sectioning commands, the first element is the
     # arguments_line element, it contains the label element
     $label_element = $command->{'contents'}->[0]->{'contents'}->[0];
   } else {
     # @*heading commands
     $label_element = $command->{'contents'}->[0];
   }
   my $normalized_name;
   if ($self->get_conf('TRANSLITERATE_FILE_NAMES')) {
     $normalized_name
     = Texinfo::Convert::NodeNameNormalization::normalize_transliterate_texinfo(
         Texinfo::TreeElement::new(
          {'contents' => $label_element->{'contents'}}), $in_test,
                   $no_unidecode);
   } else {
     $normalized_name
      = Texinfo::Convert::NodeNameNormalization::convert_to_identifier(
            Texinfo::TreeElement::new(
              { 'contents' => $label_element->{'contents'} }));
   }

   my $filename = $self->_id_to_filename($normalized_name);
   $filename .= '.'.$self->get_conf('EXTENSION')
     if (defined($self->get_conf('EXTENSION'))
       and $self->get_conf('EXTENSION') ne '');
   return ($normalized_name, $filename);
 }

 sub node_information_filename($$$) {
   my ($self, $normalized, $label_element) = @_;

   my $no_unidecode;
   $no_unidecode = 1 if (defined($self->get_conf('USE_UNIDECODE'))
                         and !$self->get_conf('USE_UNIDECODE'));
   my $in_test;
   $in_test = 1 if ($self->get_conf('TEST'));

   my $filename;
   if (defined($normalized)) {
     if ($self->get_conf('TRANSLITERATE_FILE_NAMES')) {
       $filename
   = Texinfo::Convert::NodeNameNormalization::normalize_transliterate_texinfo(
      Texinfo::TreeElement::new(
        {'contents' => $label_element->{'contents'}}), $in_test,
             $no_unidecode);
     } else {
       $filename = $normalized;
     }
   } elsif (defined($label_element)) {
     $filename
      = Texinfo::Convert::NodeNameNormalization::convert_to_node_identifier(
            Texinfo::TreeElement::new(
              { 'contents' => $label_element->{'contents'} }));
   } else {
     $filename = '';
   }
   $filename = $self->_id_to_filename($filename);
   return $filename;
 }

 sub top_node_filename($$) {
   my ($self, $document_name) = @_;

   if (defined($self->get_conf('TOP_FILE'))
       and $self->get_conf('TOP_FILE') ne '') {
     return $self->get_conf('TOP_FILE');
   } elsif (defined($document_name)) {
     my $top_node_filename = $document_name;
     if (defined($self->get_conf('EXTENSION'))
         and $self->get_conf('EXTENSION') ne '') {
       $top_node_filename .= '.'.$self->get_conf('EXTENSION')
     }
     return $top_node_filename
   }
   return undef;
 }

 sub initialize_output_units_files($) {
   my $self = shift;

   $self->{'out_filepaths'} = {};
   $self->{'file_counters'} = {};
   $self->{'filenames'} = {};
 }

 # If CASE_INSENSITIVE_FILENAMES is set, reuse the first
 # filename with the same name insensitive to the case.
 sub register_normalize_case_filename($$) {
   my ($self, $filename) = @_;

   if ($self->get_conf('CASE_INSENSITIVE_FILENAMES')) {
     if (exists($self->{'filenames'}->{lc($filename)})) {
       if ($self->get_conf('DEBUG')) {
         print STDERR "Reusing case-insensitive ".
                    $self->{'filenames'}->{lc($filename)}." for $filename\n";
       }
       $filename = $self->{'filenames'}->{lc($filename)};
     } else {
       $self->{'filenames'}->{lc($filename)} = $filename;
     }
   } else {
     if (exists($self->{'filenames'}->{$filename})) {
       if ($self->get_conf('DEBUG')) {
         print STDERR "Reusing ".$self->{'filenames'}->{$filename}
                      ." for $filename\n";
       }
     } else {
       $self->{'filenames'}->{$filename} = $filename;
     }
   }
   return $filename;
 }

 # Sets $output_unit->{'unit_filename'}.
 sub set_output_unit_file($$$) {
   my ($self, $output_unit, $filename) = @_;

   if (!defined($filename)) {
     cluck("set_output_unit_file: filename not defined\n");
   }
   if (!defined($output_unit)) {
     cluck("set_output_unit_file: output_unit not defined\n");
   }

   $filename = $self->register_normalize_case_filename($filename);

   # This should never happen, set_output_unit_file is called once per
   # tree unit.
   if (exists($output_unit->{'unit_filename'})) {
     if ($output_unit->{'unit_filename'} eq $filename) {
       print STDERR "set_output_unit_file: already set: $filename\n"
          if ($self->get_conf('DEBUG'));
     } else {
       print STDERR "set_output_unit_file: unit_filename reset: "
         .$output_unit->{'unit_filename'}.", $filename\n"
            if ($self->get_conf('DEBUG'));
     }
   }
   $output_unit->{'unit_filename'} = $filename;
 }

 # sets out_filepaths converter state, associating a file name
 # to a file path.
 # $FILEPATH can be given explicitly, otherwise it is based on $FILENAME
 # and $DESTINATION_DIRECTORY
 sub set_file_path($$$;$) {
   my ($self, $filename, $destination_directory, $filepath) = @_;

   if (!defined($filename)) {
     cluck("set_file_path: filename not defined\n");
   }

   $filename = $self->register_normalize_case_filename($filename);

   if (not defined($filepath)) {
     if (defined($destination_directory) and $destination_directory ne '') {
       $filepath = join('/', ($destination_directory, $filename));
     } else {
       $filepath = $filename;
     }
   }
   # the file path should be set only once per file name.  With
   # CASE_INSENSITIVE_FILENAMES the same file path can appear more
   # than once when files differ in case.
   if (defined($self->{'out_filepaths'}->{$filename})) {
     if ($self->{'out_filepaths'}->{$filename} eq $filepath) {
       print STDERR "set_file_path: filepath set: $filepath\n"
          if ($self->get_conf('DEBUG'));
     } else {
       print STDERR  "set_file_path: filepath reset: "
         .$self->{'out_filepaths'}->{$filename}.", $filepath\n"
          if ($self->get_conf('DEBUG'));
     }
   }
   $self->{'out_filepaths'}->{$filename} = $filepath;
 }

 sub _get_root_element($$) {
   my ($self, $command) = @_;

   my $current = $command;

   while (1) {
     if (exists($current->{'associated_unit'})) {
       return $current->{'associated_unit'};
     }
     if (exists($current->{'parent'})) {
       $current = $current->{'parent'};
     } else {
       return undef;
     }
   }
 }

 # TODO document?
 # Called in Texinfo::Converter::Plaintext.  The HTML converter defines its
 # own version.
 # set file_counters converter state
 sub set_output_units_files($$$$$$) {
   my ($self, $output_units, $output_file, $destination_directory,
       $output_filename, $document_name) = @_;

   # Ensure that the document has pages
   return undef if (!defined($output_units) or !scalar(@$output_units));

   $self->initialize_output_units_files();

   my $extension = '';
   $extension = '.'.$self->get_conf('EXTENSION')
             if (defined($self->get_conf('EXTENSION'))
                 and $self->get_conf('EXTENSION') ne '');

   if (!$self->get_conf('SPLIT')) {
     $self->set_file_path($output_filename, undef, $output_file);
     foreach my $output_unit (@$output_units) {
       $self->set_output_unit_file($output_unit, $output_filename);
     }
   } else {
     my $node_top;

     my $identifiers_target;
     if (exists($self->{'document'})) {
       $identifiers_target = $self->{'document'}->labels_information();
     }

     $node_top = $identifiers_target->{'Top'}
                             if (defined($identifiers_target));

     my $top_node_filename = $self->top_node_filename($document_name);
     # first determine the top node file name.
     if (defined($node_top) and defined($top_node_filename)) {
       my $node_top_unit = $self->_get_root_element($node_top);
       if (!defined($node_top_unit)) {
         print STDERR "No element for top node (".scalar(@$output_units)." units)\n"
          if ($self->get_conf('DEBUG'));
       } else {
         $self->set_file_path($top_node_filename, $destination_directory);
         $self->set_output_unit_file($node_top_unit, $top_node_filename);
       }
     }
     my $file_nr = 0;
     my $previous_page;
     foreach my $output_unit (@$output_units) {
       # For Top node.
       next if (defined($output_unit->{'unit_filename'}));
       my $file_output_unit = $output_unit->{'first_in_page'};
       if (!$file_output_unit) {
         cluck ("No first_in_page for $output_unit\n");
       }
       if (!defined($file_output_unit->{'unit_filename'})) {
         foreach my $root_command (@{$file_output_unit->{'unit_contents'}}) {
           if (exists($root_command->{'cmdname'})
               and $root_command->{'cmdname'} eq 'node') {
             my $node_filename;
             # double node are not normalized, they are handled here
             if (!defined($root_command->{'extra'}->{'identifier'})
                 or !defined($identifiers_target->{
                                $root_command->{'extra'}->{'identifier'}})) {
               $node_filename = 'unknown_node';
             } else {
               # arguments_line type element
               my $arguments_line = $root_command->{'contents'}->[0];
               $node_filename
                = $self->node_information_filename(
                                $root_command->{'extra'}->{'identifier'},
                         # node label is the first arguments_line content,
                         # the first argument on the line
                                   $arguments_line->{'contents'}->[0]);
             }
             $node_filename .= $extension;
             $self->set_file_path($node_filename,$destination_directory);
             $self->set_output_unit_file($file_output_unit, $node_filename);
             last;
           }
         }
         if (!defined($file_output_unit->{'unit_filename'})) {
           # use section to do the file name if there is no node
           my $command = $file_output_unit->{'unit_section'};
           if ($command) {
             if ($command->{'element'}->{'cmdname'} eq 'top'
                 and !defined($node_top)
                 and defined($top_node_filename)) {
               $self->set_file_path($top_node_filename, $destination_directory);
               $self->set_output_unit_file($file_output_unit, $top_node_filename);
             } else {
               my ($normalized_name, $filename)
                  = $self->normalized_sectioning_command_filename(
                                        $command->{'element'});
               $self->set_file_path($filename, $destination_directory);
               $self->set_output_unit_file($file_output_unit, $filename);
             }
           } else {
             # when everything else has failed
             if ($file_nr == 0 and !defined($node_top)
                 and defined($top_node_filename)) {
               $self->set_file_path($top_node_filename, $destination_directory);
               $self->set_output_unit_file($file_output_unit, $top_node_filename);
             } else {
               my $filename = $document_name . "_$file_nr";
               $filename .= $extension;
               $self->set_file_path($filename, $destination_directory);
               $self->set_output_unit_file($output_unit, $filename);
             }
             $file_nr++;
           }
         }
       }
       $self->set_output_unit_file($output_unit,
                     $file_output_unit->{'unit_filename'});
     }
   }

   foreach my $output_unit (@$output_units) {
     my $output_unit_filename = $output_unit->{'unit_filename'};
     $self->{'file_counters'}->{$output_unit_filename} = 0
        if (!exists($self->{'file_counters'}->{$output_unit_filename}));
     $self->{'file_counters'}->{$output_unit_filename}++;
     print STDERR 'Page '
      # uncomment for Perl object name
      #."$output_unit "
      .Texinfo::OutputUnits::output_unit_texi($output_unit)
      .": $output_unit_filename($self->{'file_counters'}->{$output_unit_filename})\n"
               if ($self->get_conf('DEBUG'));
   }
 }


 #############################################################
 # useful methods for Converters.
 # First methods are also used in this module.

 # Generic/overall document methods

 sub create_destination_directory($$$) {
   my ($self, $destination_directory_path, $destination_directory_name) = @_;

   if (defined($destination_directory_path)
       and ! -d $destination_directory_path) {
     if (!mkdir($destination_directory_path, oct(755))) {
       $self->converter_document_error(sprintf(__(
                                 "could not create directory `%s': %s"),
                                    $destination_directory_name, $!));
       return 0;
     }
   }
   return 1;
 }

 # output fo $fh if defined, otherwise return the text.
 sub write_or_return($$$) {
   my ($self, $text, $fh) = @_;

   if (defined($fh)) {
     print $fh $text;
     return '';
   } else {
     return $text;
   }
 }

 my $STDIN_DOCU_NAME = 'stdin';

 # this requires a document, and is, in general, used in output(), therefore
 # a document need to be associated with the converter, not only a tree.
 sub determine_files_and_directory($$) {
   my ($self, $output_format) = @_;

   # determine input file base name
   my $input_basefile;
   my $document_info;

   if (exists($self->{'document'})) {
     $document_info = $self->{'document'}->global_information();
   }

   if (defined($document_info) and exists($document_info->{'input_file_name'})) {
     # 'input_file_name' is not decoded, as it is derived from input
     # file which is not decoded either.  We want to return only
     # decoded character strings such that they can easily be mixed
     # with other character strings, so we decode here.
     my $input_file_name_bytes = $document_info->{'input_file_name'};
     my $encoding = $self->get_conf('COMMAND_LINE_ENCODING');
     if (defined($encoding)) {
       $input_basefile = decode($encoding, $input_file_name_bytes, sub { '?' });
       # use '?' as replacement character rather than U+FFFD in case it
       # is re-encoded to an encoding without this character
     } else {
       $input_basefile = $input_file_name_bytes;
     }
   } else {
     # This could happen if called on a piece of Texinfo and not a full manual.
     $input_basefile = '';
   }

   my $input_basename;
   if ($input_basefile eq '-') {
     $input_basename = $STDIN_DOCU_NAME;
   } else {
     $input_basename = $input_basefile;
     $input_basename =~ s/\.te?x(i|info)?$//;
   }

   my $setfilename;
   if (defined($self->get_conf('setfilename'))) {
     $setfilename = $self->get_conf('setfilename');
   } elsif (defined($document_info)
            and exists($document_info->{'setfilename'})) {
     $setfilename = $document_info->{'setfilename'};
   }

   my $input_basename_for_outfile = $input_basename;
   my $setfilename_for_outfile = $setfilename;
   # PREFIX overrides both setfilename and the input file base name
   if (defined($self->get_conf('PREFIX'))) {
     $setfilename_for_outfile = undef;
     $input_basename_for_outfile = $self->get_conf('PREFIX');
   }

   # the document path, in general the outfile without
   # extension and can be set from setfilename if outfile is not set
   my $document_path;
   # determine output file and output file name
   my $output_file;
   if (!defined($self->get_conf('OUTFILE'))) {
     if (defined($setfilename_for_outfile)) {
       $document_path = $setfilename_for_outfile;
       $document_path =~ s/\.[^\.]*$//;
       if (!$self->get_conf('USE_SETFILENAME_EXTENSION')) {
         $output_file = $document_path;
         $output_file .= '.'.$self->get_conf('EXTENSION')
           if (defined($self->get_conf('EXTENSION'))
               and $self->get_conf('EXTENSION') ne '');
       } else {
         $output_file = $setfilename_for_outfile;
       }
     } elsif ($input_basename_for_outfile ne '') {
       $output_file = $input_basename_for_outfile;
       $document_path = $input_basename_for_outfile;
       $output_file .= '.'.$self->get_conf('EXTENSION')
         if (defined($self->get_conf('EXTENSION'))
             and $self->get_conf('EXTENSION') ne '');
     } else {
       $output_file = '';
       $document_path = $output_file;
     }
     if (defined($self->get_conf('SUBDIR')) and $output_file ne '') {
       my $dir
         = Texinfo::Common::file_separator_canonpath($self->get_conf('SUBDIR'));
       $output_file = join('/', ($dir, $output_file));
     }
   } else {
     $document_path = $self->get_conf('OUTFILE');
     $document_path =~ s/\.[^\.]*$//;
     $output_file = $self->get_conf('OUTFILE');
   }

   # the output file path, in general same as the outfile but can be
   # set from setfilename if outfile is not set.
   my $output_filepath = $output_file;
   # in this case one wants to get the result in a string and there
   # is a setfilename.  The setfilename is used to get something.
   # This happens in the test suite.
   if ($output_file eq '' and defined($setfilename_for_outfile)) {
     $output_filepath = $setfilename_for_outfile;
     $document_path = $setfilename_for_outfile;
     $document_path =~ s/\.[^\.]*$//;
   }

   # $document_name is the name of the document, which is the output
   # file basename, $output_filename, without extension.
   my ($document_name, $output_filename, $directories, $suffix);
   # We may be handling setfilename there, so it is not obvious that we
   # want to use fileparse and not consider unixish separators.  However,
   # if this is setfilename, it should be a simple file name, so it
   # should hopefully be harmless to use fileparse
   ($document_name, $directories, $suffix) = fileparse($document_path);
   ($output_filename, $directories, $suffix) = fileparse($output_filepath);
   my $destination_directory;
   if ($self->get_conf('SPLIT')) {
     if (defined($self->get_conf('OUTFILE'))) {
       $destination_directory = $self->get_conf('OUTFILE');
     } elsif (defined($self->get_conf('SUBDIR'))) {
       $destination_directory = $self->get_conf('SUBDIR');
     } else {
       $destination_directory = $document_name;
       if (defined($output_format) and $output_format ne '') {
         $destination_directory .= '_'.$output_format;
       }
     }
   } else {
     # $output_file_filename is not used, but $output_filename should be
     # the same as long as $output_file is the same as $output_filepath
     # which is the case except if $output_file is ''.
     # Note that fileparse may return a string for the directory part even
     # for a relative file without directory, ie
     # myfile.html -> $output_dir = './'
     # In that case the $destination_directory will never be ''.
     my ($output_file_filename, $output_dir, $suffix) = fileparse($output_file);
     $destination_directory = $output_dir;
   }
   if ($destination_directory ne '') {
     $destination_directory
       = Texinfo::Common::file_separator_canonpath($destination_directory);
   }
   return ($output_file, $destination_directory, $output_filename,
           $document_name, $input_basefile);
 }

 # ALTIMP partial in structuring_transfo/structuring.c
 # For user-defined HTML customization, documented in the specific manual.
 # The bulk of the function could be better in Texinfo::Structuring, but since
 # it is not used internally, it is kept here.
 sub converter_node_relations_of_node($$) {
   my ($self, $node_element) = @_;

   if (!exists($self->{'document'})) {
     return undef;
   }
   if (!exists($node_element->{'extra'})
       or not $node_element->{'extra'}->{'node_number'}) {
     return undef;
   }

   my $nodes_list = $self->{'document'}->nodes_list();

   return $nodes_list->[$node_element->{'extra'}->{'node_number'} -1];
 }

 # No equivalent in C.
 # For user-defined HTML customization, documented in the specific manual.
 sub converter_section_relations_of_section($$) {
   my ($self, $element) = @_;

   if (!exists($self->{'document'})) {
     return undef;
   }
   # Note that this cannot happen if the element is actually a sectioning
   # command tree element.
   if (!exists($element->{'extra'})
       or not $element->{'extra'}->{'section_number'}) {
     return undef;
   }

   my $sections_list = $self->{'document'}->sections_list();

   return $sections_list->[$element->{'extra'}->{'section_number'} -1];
 }

 # No equivalent in C.
 # For user-defined HTML customization, documented in the specific manual.
 sub converter_heading_relations_of_heading($$) {
   my ($self, $element) = @_;

   if (!exists($self->{'document'})) {
     return undef;
   }
   # Note that this cannot happen if the element is actually a heading
   # command tree element.
   if (!exists($element->{'extra'})
       or not $element->{'extra'}->{'heading_number'}) {
     return undef;
   }

   my $headings_list = $self->{'document'}->headings_list();

   return $headings_list->[$element->{'extra'}->{'heading_number'} -1];
 }

 # Reverse the decoding of the file name from the input encoding.
 # A wrapper around Texinfo::Utils::encoded_input_file_name().
 sub encoded_input_file_name($$;$) {
   my ($self, $file_name, $input_file_encoding) = @_;

   my $input_file_name_encoding = $self->get_conf('INPUT_FILE_NAME_ENCODING');
   my $doc_encoding_for_input_file_name
     = $self->get_conf('DOC_ENCODING_FOR_INPUT_FILE_NAME');
   my $locale_encoding = $self->get_conf('LOCALE_ENCODING');

   return Texinfo::Convert::Utils::encoded_input_file_name($file_name,
                  $input_file_name_encoding,
                  $doc_encoding_for_input_file_name, $locale_encoding,
                  $self->{'document'}, $input_file_encoding);
 }

 # A wrapper around Texinfo::Utils::encoded_output_file_name().
 sub encoded_output_file_name($$) {
   my ($self, $file_name) = @_;

   my $output_file_name_encoding = $self->get_conf('OUTPUT_FILE_NAME_ENCODING');
   my $doc_encoding_for_output_file_name
     = $self->get_conf('DOC_ENCODING_FOR_OUTPUT_FILE_NAME');
   my $locale_encoding = $self->get_conf('LOCALE_ENCODING');

   return Texinfo::Convert::Utils::encoded_output_file_name($file_name,
                  $output_file_name_encoding,
                  $doc_encoding_for_output_file_name, $locale_encoding,
                  $self->{'document'});
 }

 sub translated_command_tree($$) {
   my ($converter, $cmdname) = @_;

   return Texinfo::Convert::Utils::translated_command_tree(
                                   $converter->{'translated_commands'},
                                   $cmdname, undef, undef, $converter);
 }

 # wrapper around Texinfo::Utils::expand_verbatiminclude.
 sub expand_verbatiminclude($$) {
   my ($converter, $current) = @_;

   my $input_file_name_encoding
     = $converter->get_conf('INPUT_FILE_NAME_ENCODING');
   my $doc_encoding_for_input_file_name
     = $converter->get_conf('DOC_ENCODING_FOR_INPUT_FILE_NAME');
   my $locale_encoding = $converter->get_conf('LOCALE_ENCODING');

   my $include_directories
     = $converter->get_conf('INCLUDE_DIRECTORIES');

   my $document = $converter->{'document'};

   return Texinfo::Convert::Utils::expand_verbatiminclude($current,
               $include_directories,
               $input_file_name_encoding,
               $doc_encoding_for_input_file_name, $locale_encoding,
               $document, $converter);
 }

 sub expand_today($) {
   my $converter = shift;

   my $test = $converter->get_conf('TEST');
   return Texinfo::Convert::Utils::expand_today($test, undef, undef,
                                                $converter);
 }

 # determine the default, with $INIT_CONF if set, or the default common
 # to all the converters
 sub get_command_init($$) {
   my ($global_command, $init_conf) = @_;

   # Where init_conf values are set, It should be made sure that there are only
   # Texinfo::Common::document_settable_at_commands, we do not check here.
   # If it is not the case, it should not make a difference anyway, as this
   # function should only be called with those commands in argument.
   if (exists($init_conf->{$global_command})) {
     return $init_conf->{$global_command};
   }
   return $Texinfo::Common::document_settable_at_commands{$global_command};
 }

 sub present_bug_message($$;$) {
   my ($self, $message, $current) = @_;

   my $line_message = '';
   my $current_element_message = '';
   if (defined($current)) {
     if (exists($current->{'source_info'})) {
       my $source_info = $current->{'source_info'};
       my $file = $source_info->{'file_name'};
       $line_message
         = "in: $source_info->{'file_name'}:$source_info->{'line_nr'}";
       if ($source_info->{'macro'} ne '') {
         $line_message .= " (possibly involving $source_info->{'macro'})";
       }
       $line_message .= "\n";
     }
     $current_element_message = "current: ".
       Texinfo::Common::debug_print_element($current, 1);
   }
   my $additional_information = '';
   if ($line_message.$current_element_message ne '') {
     $additional_information = "Additional information:\n".
        $line_message.$current_element_message."\n";
   }
   warn "You found a bug: $message\n\n".$additional_information;
 }

 # ALTIMP main/convert_utils.c
 # This is used when the formatted text has no comment nor new line, but
 # one want to add the comment or new line from the original arg
 sub comment_or_end_line($$) {
   my ($self, $element) = @_;

   if (exists($element->{'contents'})) {
     my $last_arg = $element->{'contents'}->[-1];
     if (exists($last_arg->{'contents'})) {
       my $last_content = $last_arg->{'contents'}->[-1];
       if (exists($last_content->{'cmdname'})
                and ($last_content->{'cmdname'} eq 'comment'
                     or $last_content->{'cmdname'} eq 'c')) {
         return ($last_content, undef);
       } elsif (exists($last_content->{'text'})) {
         my $text = $last_content->{'text'};
         if (chomp($text)) {
           return (undef, "\n");
         }
       }
     }
   }
   return (undef, '');
 }

 sub comment_end_line_end_space($$) {
   my ($self, $element) = @_;

   my $end_spaces = '';
   my $end_line = '';
   my $end_comment;

   if (exists($element->{'contents'})) {
     my $end_idx = scalar(@{$element->{'contents'}}) - 1;
     while ($end_idx >= 0) {
       my $content = $element->{'contents'}->[$end_idx];
       if (exists($content->{'type'})
           and ($content->{'type'} eq 'spaces_after_argument'
                or $content->{'type'} eq 'spaces_before_argument')) {
         my $text = $content->{'text'};
         if (chomp($text)) {
           $end_line = "\n";
         }
         $end_spaces = $text . $end_spaces;
         $end_idx--;
       } elsif (exists($content->{'cmdname'})
                and ($content->{'cmdname'} eq 'comment'
                     or $content->{'cmdname'} eq 'c')) {
         $end_comment = $content;
         $end_idx--;
       } else {
         last;
       }
     }
   }
   return ($end_spaces, $end_line, $end_comment);
 }


 # Specific elements formatting helper functions

 sub txt_image_text($$$) {
   my ($self, $element, $basefile) = @_;

   my ($text_file_name, $file_name_encoding)
     = $self->encoded_input_file_name($basefile.'.txt');

   my $txt_file = Texinfo::Common::locate_include_file($text_file_name,
                                   $self->get_conf('INCLUDE_DIRECTORIES'));
   if (!defined($txt_file)) {
     return undef, undef;
   } else {
     my $filehandle = do { local *FH };
     if (open($filehandle, $txt_file)) {
       my $encoding
           = Texinfo::Common::associated_processing_encoding($element);
       if (defined($encoding)) {
         binmode($filehandle, ":encoding($encoding)");
       }
       my $result = '';
       my $max_width = 0;
       while (<$filehandle>) {
         my $width = Texinfo::Convert::Unicode::string_width($_);
         if ($width > $max_width) {
           $max_width = $width;
         }
         $result .= $_;
       }
       if (!close ($filehandle)) {
         my $decoded_file_name = $txt_file;
         $decoded_file_name = Encode::decode($file_name_encoding, $txt_file)
           if (defined($file_name_encoding));
         $self->converter_document_warn(
            sprintf(__("error on closing image text file %s: %s"),
                                      $decoded_file_name, $!));
       }
       return $result, $max_width;
     } else {
       my $decoded_file_name = $txt_file;
       $decoded_file_name = Encode::decode($file_name_encoding, $txt_file)
         if (defined($file_name_encoding));
       $self->converter_line_warn(
                sprintf(__("\@image file `%s' unreadable: %s"),
                           $decoded_file_name, $!), $element->{'source_info'});
     }
   }
   return undef, undef;
 }

 sub float_type_number($$) {
   my ($self, $float) = @_;

   my $type_element;
   if ($float->{'extra'}->{'float_type'} ne '') {
     # first content of arguments_line type element
     $type_element = $float->{'contents'}->[0]->{'contents'}->[0];
   }
   my $float_number = $float->{'extra'}->{'float_number'};

   my $tree;
   if (defined($type_element)) {
     if (defined($float_number)) {
       $tree = $self->cdt("{float_type} {float_number}",
                          {'float_type' => $type_element,
                           'float_number' =>
                       Texinfo::TreeElement::new({'text' => $float_number})});
     } else {
       $tree = $self->cdt("{float_type}",
                          {'float_type' => $type_element});
     }
   } elsif (defined($float_number)) {
     $tree = $self->cdt("{float_number}",
                        {'float_number' =>
                     Texinfo::TreeElement::new({'text' => $float_number})});
   }
   return $tree;
 }

 sub float_name_caption($$) {
   my ($self, $element) = @_;

   my $caption_element;
   my ($caption, $shortcaption)
     = Texinfo::Common::find_float_caption_shortcaption($element);

   if (defined($caption)) {
     $caption_element = $caption;
   } elsif (defined($shortcaption)) {
     $caption_element = $shortcaption;
   }
   #if ($self->get_conf('DEBUG')) {
   #  my $caption_texi =
   #    Texinfo::Convert::Texinfo::convert_to_texinfo(
   #    Texinfo::TreeElement::new(
   #       { 'contents' => $caption_element->{'contents'}}));
   #  print STDERR "  CAPTION: $caption_texi\n";
   #}

   my $substrings = {};

   my $float_number_element;
   if (exists($element->{'extra'})
       and defined($element->{'extra'}->{'float_number'})) {
     $float_number_element = Texinfo::TreeElement::new(
        {'text' => $element->{'extra'}->{'float_number'}});
     $substrings->{'float_number'} = $float_number_element;
   }

   my $prepended;
   if (exists($element->{'extra'})
       and exists($element->{'extra'}->{'float_type'})
       and $element->{'extra'}->{'float_type'} ne '') {
     # first content of arguments_line type element.
     $substrings->{'float_type'}
        = $element->{'contents'}->[0]->{'contents'}->[0];
     if (defined($caption_element)) {
       if (defined($float_number_element)) {
         # TRANSLATORS: added before caption
         $prepended = $self->cdt('{float_type} {float_number}: ', $substrings);
       } else {
         # TRANSLATORS: added before caption, no float label
         $prepended = $self->cdt('{float_type}: ', $substrings);
       }
     } else {
       if (defined($float_number_element)) {
         $prepended = $self->cdt("{float_type} {float_number}", $substrings);
       } else {
         $prepended = $self->cdt("{float_type}", $substrings);
       }
     }
   } elsif (defined($float_number_element)) {
     if (defined($caption_element)) {
       # TRANSLATORS: added before caption, no float type
       $prepended = $self->cdt('{float_number}: ', $substrings);
     } else {
       $prepended = $self->cdt("{float_number}", $substrings);
     }
   }
   return ($caption_element, $prepended);
 }

 # $ELEMENT should be an item, itemx or headitem command element
 # No parent is set in this parallel tree, such that there is no
 # cycle and Perl can release the elements as soon as they are out of scope.
 sub table_item_content_tree($$) {
   my ($self, $element) = @_;

   # not in a @*table item/itemx.  Exemple in test with @itemx in @itemize
   # in @table
   if (!exists($element->{'parent'}->{'type'})
       or $element->{'parent'}->{'type'} ne 'table_term') {
     return undef;
   }
   my $table_command = $element->{'parent'}->{'parent'}->{'parent'};

   # table command arguments_line type element
   my $arguments_line = $table_command->{'contents'}->[0];
   my $block_line_arg = $arguments_line->{'contents'}->[0];

   my $command_as_argument
     = Texinfo::Common::block_item_line_command($block_line_arg);

   # should always be true with current code
   if (defined($command_as_argument)) {
     my $element_tree
      = Texinfo::Common::non_leading_trailing_tree($element->{'contents'}->[0]);
     if (!defined($element_tree)) {
       confess();
     }

     my $command_as_argument_cmdname = $command_as_argument->{'cmdname'};
     my $command = Texinfo::TreeElement::new(
                   {'cmdname' => $command_as_argument_cmdname,
                    'source_info' => $element->{'source_info'},});
     if (exists($table_command->{'extra'})
         and $table_command->{'extra'}->{'command_as_argument_kbd_code'}) {
       $command->{'extra'} = {'code' => 1};
     }
     # command name for the Texinfo::Commands hashes tests
     my $builtin_cmdname;
     if (exists($command_as_argument->{'type'})
         and $command_as_argument->{'type'} eq 'definfoenclose_command') {
       $command->{'type'} = $command_as_argument->{'type'};
       $command->{'extra'} = {} if (!exists($command->{'extra'}));
       $command->{'extra'}->{'begin'}
         = $command_as_argument->{'extra'}->{'begin'};
       $command->{'extra'}->{'end'} = $command_as_argument->{'extra'}->{'end'};
       $builtin_cmdname = 'definfoenclose_command';
     } else {
       $builtin_cmdname = $command_as_argument_cmdname;
     }
     my $arg;
     if ($Texinfo::Commands::brace_commands{$builtin_cmdname} eq 'context') {
       # This corresponds to a bogus @*table line with command line @footnote
       # or @math.  We do not really care about the formatting of the result
       # but we want to avoid debug messages, so we setup expected trees
       # for those @-commands.
       $arg = Texinfo::TreeElement::new({'type' => 'brace_command_context',});
       if ($Texinfo::Commands::math_commands{$builtin_cmdname}) {
         $arg->{'contents'} = [$element_tree];
       } else {
         my $paragraph
          = Texinfo::TreeElement::new({'type' => 'paragraph',
                             'contents' => [$element_tree],});
         $arg->{'contents'} = [$paragraph];
       }
     } elsif ($Texinfo::Commands::brace_commands{$builtin_cmdname}
                                                    eq 'arguments') {
       $arg = Texinfo::TreeElement::new({'type' => 'brace_arg',
                       'contents' => [$element_tree],});
     } else {
       $arg = Texinfo::TreeElement::new({'type' => 'brace_container',
                          'contents' => [$element_tree],});
     }
     $command->{'contents'} = [$arg];
     return $command;
   }
   return undef;
 }

 sub convert_accents($$$;$$) {
   my ($self, $accent, $format_accents, $output_encoded_characters,
       $in_upper_case) = @_;

   my ($contents_element, $stack)
     = Texinfo::Common::find_innermost_accent_contents($accent);
   my $arg_text = '';
   if (defined($contents_element)) {
     $arg_text = $self->convert_tree($contents_element);
   }

   if ($output_encoded_characters) {
     my $encoded = Texinfo::Convert::Unicode::encoded_accents($self,
                                        $arg_text, $stack,
                                        $self->get_conf('OUTPUT_ENCODING_NAME'),
                                        $format_accents,
                                        $in_upper_case);
     if (defined($encoded)) {
       return $encoded;
     }
   }
   my $result = $arg_text;
   for (my $i = scalar(@$stack) -1; $i >= 0; $i--) {
     my $accent_command = $stack->[$i];
     $result = &$format_accents($self, $result, $accent_command, $i,
                                $stack, $in_upper_case);
   }
   return $result;
 }


 # sort_element_counts code

 sub _count_converted_text($$) {
   my ($converted_text, $count_words) = @_;

   if ($count_words) {
     my @res = split /\W+/, $converted_text;
     return scalar(@res);
   } else {
     my @res = split /^/, $converted_text;
     return scalar(@res);
   }
 }

 # This method allows to count words in elements and returns an array
 # and a text already formatted.
 sub sort_element_counts($$;$$) {
   my ($converter, $document, $use_sections, $count_words) = @_;

   $converter->conversion_initialization($document);

   my $output_units;
   if ($use_sections) {
     $output_units = Texinfo::OutputUnits::split_by_section($document);
   } else {
     $output_units = Texinfo::OutputUnits::split_by_node($document);
   }
   $converter->register_output_units_lists([$output_units]);

   my $max_count = 0;
   my @name_counts_array;

   foreach my $output_unit (@$output_units) {
     my $name;
     my $command_relations;
     if ($use_sections) {
       $command_relations = $output_unit->{'unit_section'};
     } else {
       $command_relations = $output_unit->{'unit_node'};
     }
     if (defined($command_relations)) {
       my $command = $command_relations->{'element'};
       # arguments_line type element
       my $arguments_line = $command->{'contents'}->[0];
       my $line_arg = $arguments_line->{'contents'}->[0];
       if (!Texinfo::Common::empty_spaces_argument($line_arg)) {
         # convert contents to avoid outputting end of lines
         $name = "\@$command->{'cmdname'} "
          .Texinfo::Convert::Texinfo::convert_contents_to_texinfo(
                                                                $line_arg);
       }
     }
     $name = 'UNNAMED output unit' if (!defined($name));
     my $converted_text = $converter->convert_output_unit($output_unit);
     my $count = _count_converted_text($converted_text, $count_words);
     push @name_counts_array, [$count, $name];
     if ($count > $max_count) {
       $max_count = $count;
     }
   }
   $converter->conversion_finalization();

   my @sorted_name_counts_array = sort {$a->[0] <=> $b->[0]} @name_counts_array;
   @sorted_name_counts_array = reverse(@sorted_name_counts_array);

   my $max_length = length($max_count);
   my $result = '';
   foreach my $sorted_count (@sorted_name_counts_array) {
     $result .=  sprintf("%${max_length}d  $sorted_count->[1]\n",
                         $sorted_count->[0]);
   }
   return (\@sorted_name_counts_array, $result);
 }


 ########################################################################
 # XML related methods and variables that may be used in different
 # XML Converters.

 my $xml_numeric_entity_mdash = '&#'.hex('2014').';'; #8212
 my $xml_numeric_entity_ndash = '&#'.hex('2013').';'; #8211
 my $xml_numeric_entity_ldquo = '&#'.hex('201C').';'; #8220
 my $xml_numeric_entity_rdquo = '&#'.hex('201D').';'; #8221
 my $xml_numeric_entity_lsquo = '&#'.hex('2018').';'; #8216
 my $xml_numeric_entity_rsquo = '&#'.hex('2019').';'; #8217

 sub xml_format_text_with_numeric_entities($$) {
   my ($self, $text) = @_;

   $text =~ s/``/$xml_numeric_entity_ldquo/g;
   $text =~ s/\'\'/$xml_numeric_entity_rdquo/g;
   $text =~ s/`/$xml_numeric_entity_lsquo/g;
   $text =~ s/\'/$xml_numeric_entity_rsquo/g;
   $text =~ s/---/$xml_numeric_entity_mdash/g;
   $text =~ s/--/$xml_numeric_entity_ndash/g;

   return $text;
 }

 sub xml_protect_text($$) {
   my ($self, $text) = @_;

   if (!defined($text)) {
     confess('xml_protect_text: undef text in');
   }

   $text =~ s/&/&amp;/g;
   $text =~ s/</&lt;/g;
   $text =~ s/>/&gt;/g;
   $text =~ s/\"/&quot;/g;
   return $text;
 }

 our %xml_text_entity_no_arg_commands_formatting
   = %Texinfo::CommandsValues::xml_text_entity_no_arg_commands;

 foreach my $brace_no_arg_command
      (keys(%Texinfo::CommandsValues::text_brace_no_arg_commands)) {
   if (!exists($xml_text_entity_no_arg_commands_formatting{
                                                 $brace_no_arg_command})) {
     $xml_text_entity_no_arg_commands_formatting{$brace_no_arg_command}
       = $Texinfo::CommandsValues::text_brace_no_arg_commands{
                                                 $brace_no_arg_command};
   }
 }

 foreach my $no_brace_command
                 (keys(%Texinfo::CommandsValues::nobrace_symbol_text)) {
   if (!exists($xml_text_entity_no_arg_commands_formatting{
                                                 $no_brace_command})) {
     # some values are empty strings
     $xml_text_entity_no_arg_commands_formatting{$no_brace_command}
       = $Texinfo::CommandsValues::nobrace_symbol_text{$no_brace_command};
   }
 }

 sub xml_comment($$) {
   my ($self, $text) = @_;

   chomp $text;
   $text =~ s/--+/-/go;
   return '<!--' . $text . ' -->' . "\n";
 }

 our %xml_accent_entities = (
           '"',  'uml',
           '~',  'tilde',
           '^',  'circ',
           '`',  'grave',
           "'", 'acute',
           ",", 'cedil',
           'ringaccent', 'ring',
           'ogonek', 'ogon',
           'dotless', 'nodot',
           # HTML 5
           'dotaccent', 'dot',
           '=', 'macr',
           'u', 'breve',
           'v', 'caron',
           'H', 'dblac',
          );

 # There are more in HTML 5.0, and letters associated with other accent
 # entities.  We stick to HTML 4 entities to keep compatibility as
 # there is no clear gain to have more accent entities, numeric
 # entities used instead work well.
 # https://en.wikipedia.org/wiki/List_of_XML_and_HTML_character_entity_references
 # https://html.spec.whatwg.org/multipage/named-characters.html#named-character-references
 our %xml_accent_text_with_entities = (
       'ringaccent' => 'aA',
       "'"          => 'aeiouyAEIOUY',
       ','          => 'cC',
       '^'          => 'aeiouAEIOU',
       '`'          => 'aeiouAEIOU',
       '~'          => 'nNaoAO',
       '"'          => 'aeiouyAEIOU',
       'dotless'    => 'i',
 # HTML 5
 #      'ogonek'     => 'aeiuAEIU',
 );

 sub xml_numeric_entity_accent($$) {
   my ($accent, $text) = @_;

   if (exists($Texinfo::UnicodeData::unicode_accented_letters{$accent})
       and exists($Texinfo::UnicodeData::unicode_accented_letters{$accent}->{$text})) {
     return '&#' .
       hex($Texinfo::UnicodeData::unicode_accented_letters{$accent}->{$text}). ';';
   }
   if (exists($Texinfo::CommandsValues::unicode_diacritics{$accent})) {
     my $diacritic = '&#'
        .hex($Texinfo::CommandsValues::unicode_diacritics{$accent}). ';';
     if ($accent ne 'tieaccent') {
       return $text . $diacritic;
     } else {
       # tieaccent diacritic is naturally and correctly composed
       # between two characters
       my $remaining_text = $text;
       # we consider that letters are either characters or entities
       if ($remaining_text =~ s/^([\p{L}\d]|&[a-zA-Z0-9]+;)([\p{L}\d]|&[a-zA-Z0-9]+;)(.*)$/$3/) {
         return $1.$diacritic.$2 . $remaining_text;
       } else {
         return $text . $diacritic;
       }
     }
   }
   return undef;
 }

 sub xml_accent($$$;$$$$) {
   my ($self, $text, $command, $index_in_stack, $accents_stack,
       $in_upper_case, $use_numeric_entities) = @_;

   my $accent = $command->{'cmdname'};

   if ($in_upper_case and $text =~ /^\w$/) {
     $text = uc($text);
   }

   # do not return a dotless i or j as such if it is further composed
   # with an accented letter, return the letter as is
   if ($accent eq 'dotless'
       and exists($Texinfo::UnicodeData::unicode_accented_letters{$accent})
       and exists($Texinfo::UnicodeData::unicode_accented_letters{$accent}->{$text})
       and ($index_in_stack > 0
            and $Texinfo::UnicodeData::unicode_accented_letters{
                          $accents_stack->[$index_in_stack-1]->{'cmdname'}})) {
     return $text;
   }

   if ($use_numeric_entities) {
     my $formatted_accent = xml_numeric_entity_accent($accent, $text);
     if (defined($formatted_accent)) {
       return $formatted_accent;
     }
   } else {
     return "&${text}$xml_accent_entities{$accent};"
       if (defined($xml_accent_entities{$accent})
           and defined($xml_accent_text_with_entities{$accent})
           and ($text =~ /^[$xml_accent_text_with_entities{$accent}]$/));
     my $formatted_accent = xml_numeric_entity_accent($accent, $text);
     if (defined($formatted_accent)) {
       return $formatted_accent;
     }
   }

   # There are diacritics for every accent command except for dotless.
   # We should only get there with dotless if the argument is not recognized.
   return $text;
 }

 sub _xml_numeric_entities_accent($$$;$$$) {
   my ($self, $text, $command, $index_in_stack, $accents_stack,
       $in_upper_case) = @_;

   return xml_accent($self, $text, $command, $index_in_stack,
                     $accents_stack, $in_upper_case, 1);
 }

 sub xml_accents($$;$) {
   my ($self, $accent, $in_upper_case) = @_;

   my $format_accents;
   if ($self->get_conf('USE_NUMERIC_ENTITY')) {
     $format_accents = \&_xml_numeric_entities_accent;
   } else {
     $format_accents = \&xml_accent;
   }

   return $self->convert_accents($accent, $format_accents,
                                 $self->get_conf('OUTPUT_CHARACTERS'),
                                 $in_upper_case);
 }

 1;

 __END__

 =head1 NAME

 Texinfo::Convert::Converter - Parent class for Texinfo tree converters

 =head1 SYNOPSIS

   package Texinfo::Convert::MyConverter;

   use Texinfo::Convert::Converter;
   @ISA = qw(Texinfo::Convert::Converter);

   sub converter_defaults ($;$) {
     return \%myconverter_defaults;
   }
   sub converter_initialize($) {
     my $self = shift;
     ...
   }

   sub conversion_initialization($;$) {
     my $self = shift;
     my $document = shift;

     if ($document) {
       $self->set_document($document);
     }

     $self->set_global_document_commands('before', \@global_commands);
     ...

     $self->{'document_context'} = [{}];
     ...
   }

   sub conversion_finalization($) {
     my $self = shift;
   }

   sub convert_tree($$) {
     ...
   }

   sub convert($$) {
     my $self = shift;
     my $document = shift;

     $self->conversion_initialization($document);

     ...
     $self->conversion_finalization();
   }

   sub output($$) {
     my $self = shift;
     my $document = shift;

     $self->conversion_initialization($document);

     ...
     $self->conversion_finalization();
     ...
   }

   # if some data needs to be released explicitly
   sub converter_destroy($) {
     my $self = shift;

     ...
   }

   # end of Texinfo::Convert::MyConverter

   my $converter = Texinfo::Convert::MyConverter->converter();
   $converter->output($texinfo_parsed_document);

 =head1 NOTES

 The Texinfo Perl module main purpose is to be used in C<texi2any> to convert
 Texinfo to other formats.  There is no promise of API stability.

 =head1 DESCRIPTION

 C<Texinfo::Convert::Converter> is a super class that can be used to
 simplify converters initialization.  The class also provide some
 useful methods.  In turn, the converter should define some methods for
 conversion.  In general C<convert_tree>, C<output> and C<convert> should be
 defined.

 =over

 =item $result = $converter->convert_tree($tree)
 X<C<convert_tree>>

 The C<convert_tree> method is mandatory and should convert portions of Texinfo
 tree. Takes a I<$converter> and Texinfo tree I<$tree> in arguments.  Returns
 the converted output.

 This method should not perform converter initialization, as it should only
 be called with converter setup for immediate conversion, in general when
 conversion is already ongoing.

 =item $result = $converter->output($document)

 =item $result = $converter->output_tree($document)
 X<C<output>>X<C<output_tree>>

 The C<output> method is used by converters as entry point for conversion
 to a file with headers and so on.  This method should be implemented by
 converters.  C<output> is called from C<texi2any>.  C<output> takes a
 I<$converter> and a Texinfo parsed document C<Texinfo::Document> I<$document>
 as arguments.

 C<Texinfo::Convert::Converter> implements a generic C<output_tree>
 function suitable for conversion of the Texinfo tree, with the conversion
 result output into a file or returned from the function. C<output_tree>
 takes a I<$converter> and a Texinfo parsed document C<Texinfo::Document>
 I<$document> as arguments. In a converter that uses C<output_tree>,
 C<output> is in general defined as:

   sub output($$) {
     my $self = shift;
     my $document = shift;

     return $self->output_tree($document);
   }

 In general, C<output> and C<output_tree> output to files and return C<undef>.
 When the output file name is an empty string, however, it is customary
 for C<output> and C<output_tree> to return the output as a character string
 instead.  The output file name is obtained in C<output_tree> through a call to
 L<<< C<determine_files_and_directory>|/($output_file, $destination_directory, $output_filename, $document_name, $input_basefile) = $converter->determine_files_and_directory($output_format) >>>.
 In general C<determine_files_and_directory> is also used when C<output_tree> is not used.

 =item $result = $converter->convert($document)
 X<C<convert>>

 Entry point for the conversion of a Texinfo parsed document to an output
 format, without the headers usually done when outputting to a file.  C<convert>
 takes a I<$converter> and a Texinfo parsed document C<Texinfo::Document>
 I<$document> as arguments.  Returns the output as a character string.  Not
 mandatory, not called from C<texi2any>, but used in the C<texi2any> test suite.

 =back

 Two methods, C<converter_defaults> and C<converter_initialize> are
 used for initialization, to give information
 to C<Texinfo::Convert::Converter> and can be redefined in converters.

 To help with the conversion, the C<set_document> function associates a
 C<Texinfo::Document> to a converter.  Other methods are called in default
 implementations to be redefined to call code at specific moments of the
 conversion. C<conversion_initialization>, for instance, is generally
 called at the beginning of C<output>, C<output_tree> and C<convert>.
 C<conversion_finalization> is generally called at the end of C<output_tree>,
 C<output> and C<convert>.  C<output_tree> also calls the
 C<conversion_output_begin> method before the Texinfo tree conversion to obtain
 the beginning of the output. C<output_tree> calls the
 C<conversion_output_end> method after the Texinfo tree conversion to obtain
 the end of the output.

 For output formats based on output units conversion, the
 C<Texinfo::Convert::Plaintext> C<output> method could be a good starting
 point.  HTML and Info output are also based on output units conversion.
 Output units are not relevant for all the formats, the Texinfo tree can also be
 converted directly, in general by using C<output_tree>.  This is how the other
 Converters are implemented.

 Existing backends based on C<output_tree> may be used as examples.
 C<Texinfo::Convert::Texinfo> together with C<Texinfo::Convert::PlainTexinfo>,
 as well as C<Texinfo::Convert::TextContent> are trivial examples.
 C<Texinfo::Convert::Text> is less trivial, although still simple, while
 C<Texinfo::Convert::DocBook> is a real converter that is also not too complex.

 The documentation of L<Texinfo::Common>, L<Texinfo::OutputUnits>,
 L<Texinfo::Convert::Unicode> and L<Texinfo::Convert::Text> describes modules or
 additional function that may be useful for backends, while the parsed Texinfo
 tree is described in L<Texinfo::Parser>.


 =head1 METHODS

 =head2 Converter Initialization

 X<C<converter>>
 X<C<Texinfo::Convert::Converter> initialization>

 A module subclassing C<Texinfo::Convert::Converter> is created by calling
 the C<converter> method that should be inherited from
 C<Texinfo::Convert::Converter>.

 =over

 =item $converter = MyConverter->converter($options)
 X<C<converter>>

 The I<$options> hash reference holds options for the converter.
 These options should be Texinfo customization options.  The
 customization options are described in the Texinfo manual or in the
 customization API manual.

 The C<converter> function returns a converter object (a blessed hash
 reference) after checking the options and performing some initializations.

 =back

 To help with the initializations, the modules subclassing C<Texinfo::Convert::Converter>
 can define two methods:

 =over

 =item \%defaults = $converter_or_class->converter_defaults($options)
 X<C<converter_defaults>>

 Returns a reference on a hash with defaults for the converter module
 customization options or C<undef>.  The optional I<$options> hash reference
 holds options for the converter.  This method is called through a converter
 by L<<< C<converter>|/$converter = MyConverter->converter($options) >>>,
 but it may also be called through a converter module class.

 =item $converter->converter_initialize()
 X<C<converter_initialize>>

 This method is called at the end of the C<Texinfo::Convert::Converter>
 converter initialization.

 =back

 =head2 Conversion

 For conversion with C<output> and C<convert> a document to convert should be
 associated with the converter, in general the document passed in argument of
 C<output> or C<convert>.  The C<set_document> function associates a
 C<Texinfo::Document> to a converter.  This function is used in the default
 implementations.

 =over

 =item $converter->set_document($document)
 X<C<set_document>>

 Associate I<$document> to I<$converter>.  Also set the encoding related customization
 options based on I<$converter> customization information and information on
 document encoding, and setup converter hash C<convert_text_options> value that
 can be used to call L<C<Texinfo::Convert::Text::convert_to_text>|Texinfo::Convert::Text/$result = convert_to_text($tree, $text_options)>.

 =back

 The C<conversion_initialization>, C<conversion_finalization>,
 C<conversion_output_begin> and C<conversion_output_end> can be redefined to
 call code at diverse moments:

 =over

 =item $converter->conversion_initialization($document)

 =item $converter->conversion_finalization()
 X<C<conversion_initialization>>X<C<conversion_finalization>>

 C<conversion_initialization> is called at the beginning of C<output_tree> and
 of the default implementations of the C<output> and C<convert> functions.
 C<conversion_finalization> is called at the end of C<output_tree> and of
 the default C<output> and C<convert> methods implementations.
 These functions should be redefined to have code run before a document
 conversion and after the document conversion.

 In the default case, C<conversion_initialization> calls
 L<< set_document|/$converter->set_document($document) >> to associate the C<Texinfo::Document>
 document passed in argument to the converter.  A subclass converter redefining
 C<conversion_initialization> should in general call C<set_document> in the
 redefined function too to associate the converted document to the converter.

 For a converter to be reusable for multiple documents conversion, variables
 values corresponding to @-commands that can be set in the document
 and influence formatting should be reset at conversion initialization.
 This can be done with L<< C<set_global_document_commands>|/$converter->set_global_document_commands($commands_location, $selected_commands) >>.  If the list
 of such @-commands is C<@global_commands>, the following call would reset them
 to the values they had before starting the conversion:

   $self->set_global_document_commands('before', \@global_commands);

 =item $beginning = $converter->conversion_output_begin($output_file, $output_filename)

 =item $end = $converter->conversion_output_end()
 X<C<conversion_output_begin>>X<C<conversion_output_end>>

 C<conversion_output_begin> returned string I<$beginning> is output
 by the C<output_tree> calling method before the Texinfo tree conversion.
 The I<$output_file> argument is the output file path.
 If I<$output_file> is an empty string, it means that text will be returned by
 the converter instead of being written to an output file.
 I<$output_filename> is, in general, the file name portion of I<$output_file>
 (without directory) but can also be set based on C<@setfilename>.

 C<conversion_output_end> returned string I<$end> is output
 by the C<output_tree> calling method after the Texinfo tree conversion.

 The default methods implementations return an empty string.

 =back

 Calling C<conversion_initialization> and, if needed, C<conversion_finalization>
 in redefined C<output> and C<convert> methods is not mandated, but it is
 recommended to have similar converter codes.  In subclassed converters that do
 not need to define C<conversion_initialization>, calling the default
 C<Texinfo::Convert::Converter> C<conversion_initialization> implementation is
 also recommended to avoid having to explictely call C<set_document>.
 If C<conversion_initialization> is defined in a converter subclass it is
 recommended to call C<set_document> at the very beginning of the function to
 have the document associated with the converter.

 If a converter uses output units, the C<convert_output_unit> method can
 be used and can be redefined if needed:

 =over

 =item $result = $converter->convert_output_unit($output_unit)
 X<C<convert_output_unit>>

 Can be used for the conversion of output units by converters.
 C<convert_output_unit> takes a I<$converter> and an output unit
 I<$output_unit> as argument.  This method is not needed for all the converters.
 The implementation of
 C<convert_output_unit> of C<Texinfo::Convert::Converter> could be suitable in
 many cases.  Output units are typically returned by L<C<Texinfo::OutputUnits>
 C<split_by_section>|Texinfo::OutputUnits/$output_units = split_by_section($document)>
 or L<C<Texinfo::OutputUnits> C<split_by_node>|Texinfo::OutputUnits/$output_units =
 split_by_node($document)>.

 =back

 =head2 Output units and converter destruction

 Removing output units and destroying the converter is only needed if one
 want to be sure that the memory held is released or reused.  It is optional,
 and in general takes longer than having the memory be released at the
 end of a script.

 Output units associated with a converter are removed by calling
 the C<converter_remove_output_units> method that should be inherited from
 C<Texinfo::Convert::Converter>.

 =over

 =item $converter->converter_remove_output_units()
 X<C<destroy_converter>>

 Release the output units associated with a converter.  It does not necessarily
 means that the output units are explicitly undefined, it could be that cycles
 in output units are removed such that Perl can release or reuse the memory.

 =back

 To help with the output units release, the modules subclassing
 C<Texinfo::Convert::Converter> can define the method:

 =over

 =item $converter->converter_release_output_units()
 X<C<converter_release_output_units>>

 This method is called at the beginning of the C<Texinfo::Convert::Converter>
 converter output units removal.

 =back

 A module subclassing C<Texinfo::Convert::Converter> is destroyed by calling
 the C<destroy_converter> method that should be inherited from
 C<Texinfo::Convert::Converter>.

 =over

 =item $converter->destroy_converter()
 X<C<destroy_converter>>

 Destroy converter data.

 =back

 To help with the destruction, the modules subclassing
 C<Texinfo::Convert::Converter> can define the method:

 =over

 =item $converter->converter_destroy()
 X<C<converter_destroy>>

 This method is called at the beginning of the C<Texinfo::Convert::Converter>
 converter destruction.

 =back

 The default C<converter_release_output_units> and C<converter_destroy>
 methods do nothing.


 =head2 Getting and setting customization variables

 C<Texinfo::Convert::Converter> implements a simple interface to
 set and retrieve Texinfo customization variables.  Helper
 functions from diverse Texinfo modules needing customization
 information expect an object implementing C<get_conf> and/or
 C<set_conf>.  The converter itself can therefore be used in
 such cases.

 Customization variables are typically setup when
 initializing a converter with L<<< C<converter>|/$converter = MyConverter->converter($options) >>>
 and completed by Texinfo informative @-commands tree element values,
 for commands such as C<@frenchspacing> or C<@footnotestyle>.

 =over

 =item $converter->force_conf($variable_name, $variable_value)
 X<C<force_conf>>

 Set the Texinfo customization option I<$variable_name> to I<$variable_value>.
 This should rarely be used, but the purpose of this method is to be able
 to revert a customization that is always wrong for a given output
 format, like the splitting for example.

 =item $converter->get_conf($variable_name)
 X<C<get_conf>>

 Returns the value of the Texinfo customization variable I<$variable_name>.

 =item $status = $converter->set_conf($variable_name, $variable_value)
 X<C<set_conf>>

 Set the Texinfo customization option I<$variable_name> to I<$variable_value> if
 not set as a converter option.  Returns false if the customization options
 was not set.

 =back

 =head2 Registering error and warning messages

 C<Texinfo::Convert::Converter> implements an interface to register error and
 warning messages in the converter, that can be retrieved later on.
 Underneath, C<Texinfo::Report> is used to setup the messages data structure.

 =over

 =item $converter->converter_document_error($text, $continuation)

 =item $converter->converter_document_warn($text, $continuation)
 X<C<converter_document_error>>X<C<converter_document_warn>>

 Register a warning or an error.  The I<$text> is the text of the error or
 warning.

 The I<$continuation> optional arguments, if true, conveys that the line is a
 continuation line of a message.

 =item $converter->converter_line_error($text, $error_location_info, $continuation)

 =item $converter->converter_line_warn($text, $error_location_info, $continuation)
 X<C<converter_line_error>>X<C<converter_line_warn>>

 Register a warning or an error with a line information.  The I<$text> is the
 text of the error or warning.  The I<$error_location_info> argument holds the
 information on the error or warning location.  The I<$error_location_info>
 reference on hash may be obtained from Texinfo elements I<source_info> keys.
 It may also be setup to point to a file name, using the C<file_name> key and to
 a line number, using the C<line_nr> key.  The C<file_name> key value should be
 a binary string.

 The I<$continuation> optional arguments, if true, conveys that
 the line is a continuation line of a message.

 =item \@error_warning_messages = $converter->get_converter_errors()
 X<C<get_converter_errors>>

 Return a reference on an array containing the error or warning messages
 registered in the converter.  Error and warning messages are hash references as
 described in L<Texinfo::Report::count_errors|Texinfo::Report/$error_count
  = count_errors ($error_messages)>.

 =back

 =head2 Translations in output documents

 C<Texinfo::Convert::Converter> provides wrappers around
 L<Texinfo::Translations> methods that use the current language.  The
 current language is set by a call to C<converter_set_documentlanguage>, like:

  $converter->converter_set_documentlanguage($documentlanguage);

 The C<cdt> and C<pcdt> methods are used to translate strings to be output in
 converted documents, and return a Texinfo tree.  The C<cdt_string> is similar
 but returns a simple string, for already converted strings.

 =over

 =item $tree = $converter->cdt($string, $replaced_substrings, $translation_context)

 =item $string = $converter->cdt_string($string, $replaced_substrings, $translation_context)
 X<C<cdt>> X<C<cdt_string>>

 The I<$string> is a string to be translated.  With C<cdt>
 the function returns a Texinfo tree, as the string is interpreted
 as Texinfo code after translation.  With C<cdt_string> a string
 is returned.

 I<$replaced_substrings> is an optional hash reference specifying
 some substitution to be done after the translation.  The key of the
 I<$replaced_substrings> hash reference identifies what is to be substituted.
 In the string to be translated word in brace matching keys of
 I<$replaced_substrings> are replaced.
 For C<cdt>, the value is a Texinfo tree that is substituted in the
 resulting Texinfo tree. For C<cdt_string>, the value is a string that
 is replaced in the resulting string.

 The I<$translation_context> is optional.  If not C<undef> this is a translation
 context string for I<$string>.  It is the first argument of C<pgettext>
 in the C API of Gettext.

 =item $tree = $object->pcdt($translation_context, $string, $replaced_substrings)
 X<C<pcdt>>

 Same to C<cdt> except that the I<$translation_context> is not optional.
 This function is useful to mark strings with a translation context for
 translation.  This function is similar to pgettext in the Gettext C API.

 =back

 =head2 Index sorting

 You should call the following methods to sort indices in conversion:

 =over

 =item $sorted_indices = $converter->get_converter_indices_sorted_by_index()

 =item $sorted_indices = $converter->get_converter_indices_sorted_by_letter()
 X<C<get_converter_indices_sorted_by_index>>
 X<C<get_converter_indices_sorted_by_letter>>

 C<get_converter_indices_sorted_by_letter> returns the indices sorted by index
 and letter, while C<get_converter_indices_sorted_by_index> returns the indices
 with all entries of an index together.

 When sorting by letter, an array reference of letter hash references is
 associated with each index name.  Each letter hash reference has two
 keys, a I<letter> key with the letter, and an I<entries> key with an array
 reference of sorted index entries beginning with the letter.  The letter
 is a character string suitable for sorting letters, but is not necessarily
 the best to use for output.

 When simply sorting, the array of the sorted index entries is associated
 with the index name.

 The functions call L<< C<Texinfo::Document::sorted_indices_by_letter>|Texinfo::Document/$sorted_indices = sorted_indices_by_letter($document, $converter, $use_unicode_collation, $locale_lang) >>
 or L<< C<Texinfo::Document::sorted_indices_by_index>|Texinfo::Document/$sorted_indices = sorted_indices_by_index($document, $converter, $use_unicode_collation, $locale_lang) >>
 with arguments based on C<USE_UNICODE_COLLATION>, C<COLLATION_LANGUAGE> and
 C<DOCUMENTLANGUAGE_COLLATION> customization options, and, if relevant, current
 C<@documentlanguage>.

 =back

 =head2 Accents conversion

 Accent @-commands that take arguments can be nested in Texinfo code, as in
 C<@'{@^a}>.  To handle this situation, a user defined function can be called
 for each of the accent commands, starting by the innermost accent command.  For
 this the user-defined function and the outermost accent command tree elements
 should be given to the C<convert_accents> function:

 =over

 =item $result = $converter->convert_accents($accent_command, \&format_accents, $output_encoded_characters, $in_upper_case)
 X<C<convert_accents>>

 I<$accent_command> is an accent command tree elements, which may have other
 accent commands tree elements nested inside.  The function returns the accents
 formatted either as encoded letters if I<$output_encoded_characters> is set, or
 formatted by calling I<\&format_accents> repeatedly starting from the innermost
 accent command tree element within I<$accent_command>.  The innermost accent
 command argument (usually a letter), is also converted, by calling
 L<< C<< $converter->convert_tree >>|/$result = $converter->convert_tree($tree) >>. If I<$in_upper_case> is
 set, the result should be uppercased.

 =item $result = &$format_accents($self, $text, $accent_command, $index_in_stack, $accents_stack, $in_upper_case)

 I<$self> is the converter in the call to C<convert_accents>.
 For the innermost accent command, I<$text> is the text appearing within
 the accent command converted.  For the other accent commands,
 I<$text> is the result of the previously converted
 accent command.  I<$accent_command> the Texinfo tree element corresponding
 to the accent command being converted.  I<$index_in_stack> is the position
 in the I<$accents_stack> of the accent command being converted.  The
 I<$accents_stack> is an array holding the nested accent command
 Texinfo tree elements.  The innermost tree element command is last.
 I<$in_upper_case> is optional, and, if set, the text should be put
 in upper case.  The function should return the converted accent argument
 to be processed by the following accent command.

 =back

 =head2 Conversion to XML

 Some C<Texinfo::Convert::Converter> methods target conversion to XML.
 Most methods take a I<$converter> as argument to get some
 information and use methods for error reporting.

 =over

 =item $formatted_text = $converter->xml_format_text_with_numeric_entities($text)
 X<C<xml_format_text_with_numeric_entities>>

 Replace quotation marks and hyphens used to represent dash in
 Texinfo text with numeric XML entities.

 =item $protected_text = $converter->xml_protect_text($text)
 X<C<xml_protect_text>>

 Protect special XML characters (&, E<lt>, E<gt>, ") of I<$text>.

 =item $comment = $converter->xml_comment($text)
 X<C<xml_comment>>

 Returns an XML comment for I<$text>.

 =item $result = xml_accent($self, $text, $accent_command, $index_in_stack, $accents_stack, $in_upper_case, $use_numeric_entities)
 X<C<xml_accent>>

 I<$self> is an object, in general a converter.
 I<$text> is the text appearing within an accent command.  I<$accent_command>
 should be a Texinfo tree element corresponding to an accent command taking
 an argument.  I<$index_in_stack> is the position in the I<$accents_stack>
 of the accent command being converted.  It is optional, but if not present
 the formatting cannot take into account the position of the accent in
 the current accents group being converted.
 I<$in_upper_case> is optional, and, if set, the text is put
 in upper case.  The function returns the accented letter as XML named entity
 if possible, falling back to numeric entities if there is no named entity
 and returns the argument as last resort.  I<$use_numeric_entities>
 is optional.  If set, numerical entities are used instead of named entities
 if possible.

 This function is similar to the accent formatting function passed
 to C<convert_accents> for L<Accents conversion>.

 =item $result = $converter->xml_accents($accent_command, $in_upper_case)
 X<C<xml_accents>>

 I<$accent_command> is an accent command, which may have other accent
 commands nested.  If I<$in_upper_case> is set, the result should be
 upper cased.  The function returns the accents formatted as XML.

 =item $result = xml_numeric_entity_accent($accent_command_name, $text)
 X<C<xml_numeric_entity_accent>>

 I<$accent_command_name> is the name of an accent command.  I<$text> is the text
 appearing within the accent command.  Returns the accented letter as XML numeric
 entity, or C<undef> if there is no such entity.

 =back

 The following hashes, defined as C<our> variable are also available:

 =over

 =item %xml_text_entity_no_arg_commands_formatting
 X<C<%xml_text_entity_no_arg_commands_formatting>>

 Values are entities or, if not available, ASCII representation of
 single character non-alphabetical commands without brace such as C<*> or C<:>
 and of commands with empty braces such as C<atchar>, C<LaTeX>, C<arrow>,
 C<quoteleft> or C<AA>.

 =back

 =head2 Helper methods

 The module provides methods that may be useful for converter.
 Most methods take a I<$converter> as argument to get some
 information and use methods for error reporting, see L</Registering error and
 warning messages>.  Also to translate strings, see L</Translations in output
 documents>.  For useful methods that need a converter optionally and can be
 used in converters that do not inherit from C<Texinfo::Convert::Converter>, see
 L<Texinfo::Convert::Utils>.

 =over

 =item $succeeded = $converter->create_destination_directory($destination_directory_path, $destination_directory_name)
 X<C<create_destination_directory>>

 Create destination directory I<$destination_directory_path>.
 I<$destination_directory_path> should be a binary string, while
 I<$destination_directory_name> should be a character string, that can be used in
 error messages.  I<$succeeded> is true if the creation was successful or
 uneeded, false otherwise.

 =item ($output_file, $destination_directory, $output_filename, $document_name, $input_basefile) = $converter->determine_files_and_directory($output_format)
 X<C<determine_files_and_directory>>

 Determine output file and directory, as well as names related to files.  The
 result depends on the presence of C<@setfilename>, on the Texinfo input file
 name, and on customization options such as C<OUTPUT>, C<SUBDIR> or C<SPLIT>,
 as described in the Texinfo manual.  If I<$output_format> is defined and not an
 empty string, C<_$output_format> is prepended to the default directory name.

 I<$output_file> is mainly relevant when not split and should be used as the
 output file name.  In general, if not split and I<$output_file> is an empty
 string, it means that text should be returned by the converter instead of being
 written to an output file.  This is used in the test suite.
 I<$destination_directory> is either the directory I<$output_file> is in, or if
 split, the directory where the files should be created.  I<$output_filename>
 is, in general, the file name portion of I<$output_file> (without directory)
 but can also be set based on C<@setfilename>, in particular when
 I<$output_file> is an empty string. I<$document_name> is I<$output_filename>
 without extension.  I<$input_basefile> is based on the input Texinfo file name,
 with the file name portion only (without directory).

 The strings returned are text strings.

 =item ($encoded_name, $encoding) = $converter->encoded_input_file_name($character_string_name, $input_file_encoding)

 =item ($encoded_name, $encoding) = $converter->encoded_output_file_name($character_string_name)
 X<C<encoded_input_file_name>> X<C<encoded_output_file_name>>

 Encode I<$character_string_name> in the same way as other file names are
 encoded in the converter, based on customization variables, and possibly
 on the input file encoding.  Return the encoded name and the encoding
 used to encode the name.  The C<encoded_input_file_name> and
 C<encoded_output_file_name> functions use different customization variables to
 determine the encoding.

 The I<$input_file_encoding> argument is optional.  If set, it is used for
 the input file encoding.  It is useful if there is more precise information
 on the input file encoding where the file name appeared.

 Note that these functions are wrappers around functions from
 L<Texinfo::Convert::Utils> with the same names.

 =item $tree = $converter->expand_today()

 Expand today's date, as a Texinfo tree with translations.

 =item ($caption, $prepended) = $converter->float_name_caption($float)
 X<C<float_name_caption>>

 I<$float> is a Texinfo tree C<@float> element.  This function
 returns the caption element that should be used for the float formatting
 and the I<$prepended> Texinfo tree combining the type and label
 of the float.

 =item $tree = $converter->float_type_number($float)
 X<C<float_type_number>>

 I<$float> is a Texinfo tree C<@float> element.  This function
 returns the type and number of the float as a Texinfo tree with
 translations.

 =item $filename = $converter->node_information_filename($normalized, $label_element)
 X<C<node_information_filename>>

 Returns the normalized file name corresponding to the I<$normalized>
 node name and to the I<$label_element> node name element contents.

 =item ($normalized_name, $filename) = $converter->normalized_sectioning_command_filename($element)
 X<C<normalized_sectioning_command_filename>>

 Returns a normalized name I<$normalized_name> corresponding to a sectioning
 command tree element I<$element>, expanding the command argument using
 transliteration and characters protection.  Also returns I<$filename>
 the corresponding filename based on I<$normalized_name> taking into
 account additional constraint on file names and adding a file extension.

 =item $converter->present_bug_message($message, $element)
 X<C<present_bug_message>>

 Show a bug message using I<$message> text.  Use information on
 I<$element> tree element if given in argument.

 =item $converter->set_global_document_commands($commands_location, $selected_commands)
 X<C<set_global_document_commands>>

 Set the Texinfo customization options for @-commands.  I<$selected_commands>
 is an array reference containing the @-commands set.  I<$commands_location>
 specifies where in the document the value should be taken from. The
 possibilities are:

 =over

 =item before

 Set to the values before document conversion, from defaults and command-line.

 =item last

 Set to the last value for the command.

 =item preamble

 Set sequentially to the values in the Texinfo preamble.

 =item preamble_or_first

 Set to the first value of the command if the first command is not
 in the Texinfo preamble, else set as with I<preamble>,
 sequentially to the values in the Texinfo preamble.

 =back

 Notice that the only effect of this function is to set a customization
 variable value, no @-command side effects are run, no associated customization
 variables are set.

 For more information on the function used to set the value for each of the command, see
 L<C<Texinfo::Common> C<set_global_document_command>|Texinfo::Common/$element = set_global_document_command($customization_information, $global_commands_information, $cmdname, $command_location)>.

 =item $table_item_tree = $converter->table_item_content_tree($element)
 X<C<table_item_content_tree>>

 I<$element> should be an C<@item> or C<@itemx> tree element.
 Returns a tree in which the @-command in argument of C<@*table>
 of the I<$element> has been applied to the I<$element> line argument,
 or C<undef>.

 =item $result = $converter->top_node_filename($document_name)
 X<C<top_node_filename>>

 Returns a file name for the Top node file using either C<TOP_FILE>
 customization value, or C<EXTENSION> customization value and I<$document_name>.

 =item $tree = $converter->expand_verbatiminclude($verbatiminclude)
 X<C<expand_verbatiminclude>>

 I<$verbatiminclude> is a C<@verbatiminclude> tree element.  This function
 returns a C<@verbatim> tree elements after finding the included file and
 reading it.

 =back

 Finally, there is:

 =over

 =item $result = $converter->output_internal_links()
 X<C<output_internal_links>>

 At this level, the method just returns undef.  It is used in the HTML
 output, following the C<--internal-links> option of C<texi2any>
 specification.

 =back

 =head1 SEE ALSO

 L<Texinfo::Common>, L<Texinfo::Convert::Unicode>, L<Texinfo::Report>,
 L<Texinfo::Translations>, L<Texinfo::Convert::Utils> and L<Texinfo::Parser>.

 =head1 AUTHOR

 Patrice Dumas, E<lt>bug-texinfo@gnu.orgE<gt>

 =head1 COPYRIGHT AND LICENSE

 Copyright 2011- Free Software Foundation, Inc.  See the source file for
 all copyright years.

 This library is free software; you can redistribute it and/or modify
 it under the terms of the GNU General Public License as published by
 the Free Software Foundation; either version 3 of the License, or (at
 your option) any later version.

 =cut