gcc/ada/scng.adb - gcc - Git at Google

 ------------------------------------------------------------------------------
 --                                                                          --
 --                         GNAT COMPILER COMPONENTS                         --
 --                                                                          --
 --                                 S C N G                                  --
 --                                                                          --
 --                                 B o d y                                  --
 --                                                                          --
 --          Copyright (C) 1992-2003 Free Software Foundation, Inc.          --
 --                                                                          --
 -- GNAT is free software;  you can  redistribute it  and/or modify it under --
 -- terms of the  GNU General Public License as published  by the Free Soft- --
 -- ware  Foundation;  either version 2,  or (at your option) any later ver- --
 -- sion.  GNAT is distributed in the hope that it will be useful, but WITH- --
 -- OUT ANY WARRANTY;  without even the  implied warranty of MERCHANTABILITY --
 -- or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License --
 -- for  more details.  You should have  received  a copy of the GNU General --
 -- Public License  distributed with GNAT;  see file COPYING.  If not, write --
 -- to  the Free Software Foundation,  59 Temple Place - Suite 330,  Boston, --
 -- MA 02111-1307, USA.                                                      --
 --                                                                          --
 -- GNAT was originally developed  by the GNAT team at  New York University. --
 -- Extensive contributions were provided by Ada Core Technologies Inc.      --
 --                                                                          --
 ------------------------------------------------------------------------------

 with Csets;    use Csets;
 with Err_Vars; use Err_Vars;
 with Hostparm; use Hostparm;
 with Namet;    use Namet;
 with Opt;      use Opt;
 with Scans;    use Scans;
 with Sinput;   use Sinput;
 with Snames;   use Snames;
 with Stringt;  use Stringt;
 with Stylesw;  use Stylesw;
 with Uintp;    use Uintp;
 with Urealp;   use Urealp;
 with Widechar; use Widechar;

 with System.CRC32;
 with System.WCh_Con; use System.WCh_Con;

 package body Scng is

    use ASCII;
    --  Make control characters visible

    Special_Characters : array (Character) of Boolean := (others => False);
    --  The value is True for each character that is a Special token

    Comment_Is_Token : Boolean := False;
    --  True if comments are tokens

    End_Of_Line_Is_Token : Boolean := False;
    --  True if End_Of_Line is a token

    -----------------------
    -- Local Subprograms --
    -----------------------

    procedure Accumulate_Checksum (C : Character);
    pragma Inline (Accumulate_Checksum);
    --  This routine accumulates the checksum given character C. During the
    --  scanning of a source file, this routine is called with every character
    --  in the source, excluding blanks, and all control characters (except
    --  that ESC is included in the checksum). Upper case letters not in string
    --  literals are folded by the caller. See Sinput spec for the documentation
    --  of the checksum algorithm. Note: checksum values are only used if we
    --  generate code, so it is not necessary to worry about making the right
    --  sequence of calls in any error situation.

    procedure Accumulate_Checksum (C : Char_Code);
    pragma Inline (Accumulate_Checksum);
    --  This version is identical, except that the argument, C, is a character
    --  code value instead of a character. This is used when wide characters
    --  are scanned. We use the character code rather than the ASCII characters
    --  so that the checksum is independent of wide character encoding method.

    procedure Initialize_Checksum;
    pragma Inline (Initialize_Checksum);
    --  Initialize checksum value

    -------------------------
    -- Accumulate_Checksum --
    -------------------------

    procedure Accumulate_Checksum (C : Character) is
       package CRC renames System.CRC32;
       --  Short local name for the CRC-32 support package

    begin
       --  Fold the single character C into the running source checksum.
       --  Checksum is viewed as a CRC32 value for the duration of the call.

       CRC.Update (CRC.CRC32 (Checksum), C);
    end Accumulate_Checksum;

    procedure Accumulate_Checksum (C : Char_Code) is
       High_Byte : constant Char_Code := C / 256;
       Low_Byte  : constant Char_Code := C mod 256;
       --  The character code is split into two byte-sized pieces, which are
       --  accumulated most significant piece first.

    begin
       Accumulate_Checksum (Character'Val (High_Byte));
       Accumulate_Checksum (Character'Val (Low_Byte));
    end Accumulate_Checksum;

    ----------------------------
    -- Determine_Token_Casing --
    ----------------------------

    function Determine_Token_Casing return Casing_Type is
       Token_Last : constant Source_Ptr := Scan_Ptr - 1;
       --  Last character of the token text, i.e. the character just before
       --  the current scan position.

    begin
       --  The casing is determined from the slice of the source buffer that
       --  runs from Token_Ptr up to (but not including) Scan_Ptr.

       return Determine_Casing (Source (Token_Ptr .. Token_Last));
    end Determine_Token_Casing;

    -------------------------
    -- Initialize_Checksum --
    -------------------------

    procedure Initialize_Checksum is
       package CRC renames System.CRC32;
       --  Short local name for the CRC-32 support package

    begin
       --  Reset the running source checksum to the CRC-32 starting value

       CRC.Initialize (CRC.CRC32 (Checksum));
    end Initialize_Checksum;

    ------------------------
    -- Initialize_Scanner --
    ------------------------

    procedure Initialize_Scanner
      (Unit  : Unit_Number_Type;
       Index : Source_File_Index)
    is
       procedure Reserve (Id : Name_Id; Tok : Token_Type);
       --  Store the position number of Tok in the Names Table byte of the
       --  name Id, which marks Id as the reserved word corresponding to Tok.

       -------------
       -- Reserve --
       -------------

       procedure Reserve (Id : Name_Id; Tok : Token_Type) is
       begin
          Set_Name_Table_Byte (Id, Token_Type'Pos (Tok));
       end Reserve;

    --  Start of processing for Initialize_Scanner

    begin
       --  Set up Token_Type values in Names Table entries for the reserved
       --  keywords. The value stored is the Pos value of the Token_Type
       --  value. Note that this relies on the fact that Token_Type'Val (0)
       --  is not a reserved word!

       Reserve (Name_Abort,     Tok_Abort);
       Reserve (Name_Abs,       Tok_Abs);
       Reserve (Name_Abstract,  Tok_Abstract);
       Reserve (Name_Accept,    Tok_Accept);
       Reserve (Name_Access,    Tok_Access);
       Reserve (Name_And,       Tok_And);
       Reserve (Name_Aliased,   Tok_Aliased);
       Reserve (Name_All,       Tok_All);
       Reserve (Name_Array,     Tok_Array);
       Reserve (Name_At,        Tok_At);
       Reserve (Name_Begin,     Tok_Begin);
       Reserve (Name_Body,      Tok_Body);
       Reserve (Name_Case,      Tok_Case);
       Reserve (Name_Constant,  Tok_Constant);
       Reserve (Name_Declare,   Tok_Declare);
       Reserve (Name_Delay,     Tok_Delay);
       Reserve (Name_Delta,     Tok_Delta);
       Reserve (Name_Digits,    Tok_Digits);
       Reserve (Name_Do,        Tok_Do);
       Reserve (Name_Else,      Tok_Else);
       Reserve (Name_Elsif,     Tok_Elsif);
       Reserve (Name_End,       Tok_End);
       Reserve (Name_Entry,     Tok_Entry);
       Reserve (Name_Exception, Tok_Exception);
       Reserve (Name_Exit,      Tok_Exit);
       Reserve (Name_For,       Tok_For);
       Reserve (Name_Function,  Tok_Function);
       Reserve (Name_Generic,   Tok_Generic);
       Reserve (Name_Goto,      Tok_Goto);
       Reserve (Name_If,        Tok_If);
       Reserve (Name_In,        Tok_In);
       Reserve (Name_Is,        Tok_Is);
       Reserve (Name_Limited,   Tok_Limited);
       Reserve (Name_Loop,      Tok_Loop);
       Reserve (Name_Mod,       Tok_Mod);
       Reserve (Name_New,       Tok_New);
       Reserve (Name_Not,       Tok_Not);
       Reserve (Name_Null,      Tok_Null);
       Reserve (Name_Of,        Tok_Of);
       Reserve (Name_Or,        Tok_Or);
       Reserve (Name_Others,    Tok_Others);
       Reserve (Name_Out,       Tok_Out);
       Reserve (Name_Package,   Tok_Package);
       Reserve (Name_Pragma,    Tok_Pragma);
       Reserve (Name_Private,   Tok_Private);
       Reserve (Name_Procedure, Tok_Procedure);
       Reserve (Name_Protected, Tok_Protected);
       Reserve (Name_Raise,     Tok_Raise);
       Reserve (Name_Range,     Tok_Range);
       Reserve (Name_Record,    Tok_Record);
       Reserve (Name_Rem,       Tok_Rem);
       Reserve (Name_Renames,   Tok_Renames);
       Reserve (Name_Requeue,   Tok_Requeue);
       Reserve (Name_Return,    Tok_Return);
       Reserve (Name_Reverse,   Tok_Reverse);
       Reserve (Name_Select,    Tok_Select);
       Reserve (Name_Separate,  Tok_Separate);
       Reserve (Name_Subtype,   Tok_Subtype);
       Reserve (Name_Tagged,    Tok_Tagged);
       Reserve (Name_Task,      Tok_Task);
       Reserve (Name_Terminate, Tok_Terminate);
       Reserve (Name_Then,      Tok_Then);
       Reserve (Name_Type,      Tok_Type);
       Reserve (Name_Until,     Tok_Until);
       Reserve (Name_Use,       Tok_Use);
       Reserve (Name_When,      Tok_When);
       Reserve (Name_While,     Tok_While);
       Reserve (Name_With,      Tok_With);
       Reserve (Name_Xor,       Tok_Xor);

       --  Initialize the scan control variables. The order of these
       --  assignments is significant: Source and Scan_Ptr are derived from
       --  Current_Source_File, and the remaining pointers are copies of the
       --  freshly set Scan_Ptr.

       Current_Source_File := Index;
       Source := Source_Text (Current_Source_File);
       Current_Source_Unit := Unit;
       Scan_Ptr := Source_First (Current_Source_File);
       Token := No_Token;
       Token_Ptr := Scan_Ptr;
       Current_Line_Start := Scan_Ptr;
       Token_Node := Empty;
       Token_Name := No_Name;
       Start_Column := Set_Start_Column;
       First_Non_Blank_Location := Scan_Ptr;

       Initialize_Checksum;

       --  Scan is deliberately not called here, since otherwise the License
       --  stuff does not work in Scn.

    end Initialize_Scanner;

    ------------------------------
    -- Reset_Special_Characters --
    ------------------------------

    procedure Reset_Special_Characters is
    begin
       --  Clear the Special token flag of every character

       for Ch in Special_Characters'Range loop
          Special_Characters (Ch) := False;
       end loop;
    end Reset_Special_Characters;

    ----------
    -- Scan --
    ----------

    procedure Scan is

       Start_Of_Comment : Source_Ptr;

       procedure Check_End_Of_Line;
       --  Called when end of line encountered. Checks that line is not
       --  too long, and that other style checks for the end of line are met.

       function Double_Char_Token (C : Character) return Boolean;
       --  This function is used for double character tokens like := or <>. It
       --  checks if the character following Source (Scan_Ptr) is C, and if so
       --  bumps Scan_Ptr past the pair of characters and returns True. A space
       --  between the two characters is also recognized with an appropriate
       --  error message being issued. If C is not present, False is returned.
       --  Note that Double_Char_Token can only be used for tokens defined in
       --  the Ada syntax (its use for error cases like && is not appropriate
       --  since we do not want a junk message for a case like &-space-&).

       procedure Error_Illegal_Character;
       --  Give illegal character error, Scan_Ptr points to character.
       --  On return, Scan_Ptr is bumped past the illegal character.

       procedure Error_Illegal_Wide_Character;
       --  Give illegal wide character message. On return, Scan_Ptr is bumped
       --  past the illegal character, which may still leave us pointing to
       --  junk, not much we can do if the escape sequence is messed up!

       procedure Error_Long_Line;
       --  Signal error of excessively long line

       procedure Error_No_Double_Underline;
       --  Signal error of double underline character

       procedure Nlit;
       --  This is the procedure for scanning out numeric literals. On entry,
       --  Scan_Ptr points to the digit that starts the numeric literal (the
       --  checksum for this character has not been accumulated yet). On return
       --  Scan_Ptr points past the last character of the numeric literal, Token
       --  and Token_Node are set appropriately, and the checksum is updated.

       procedure Slit;
       --  This is the procedure for scanning out string literals. On entry,
       --  Scan_Ptr points to the opening string quote (the checksum for this
       --  character has not been accumulated yet). On return Scan_Ptr points
       --  past the closing quote of the string literal, Token and Token_Node
       --  are set appropriately, and the checksum is updated.

       -----------------------
       -- Check_End_Of_Line --
       -----------------------

       procedure Check_End_Of_Line is
          Line_Length : constant Int :=
                          Int (Scan_Ptr) - Int (Current_Line_Start);
          --  Number of characters between the start of the current line and
          --  the current scan position.

       begin
          --  When the maximum line length style check is not active, the only
          --  test made here is against the host limit on line length.

          if not (Style_Check and Style_Check_Max_Line_Length) then
             if Line_Length > Hostparm.Max_Line_Length then
                Error_Long_Line;
             end if;

          --  Otherwise the line terminator check is left to the style checker

          else
             Style.Check_Line_Terminator (Line_Length);
          end if;
       end Check_End_Of_Line;

       -----------------------
       -- Double_Char_Token --
       -----------------------

       function Double_Char_Token (C : Character) return Boolean is
          Following : constant Character := Source (Scan_Ptr + 1);
          --  Character immediately after the one at Scan_Ptr

       begin
          --  Normal case, the second character follows directly. It is added
          --  to the checksum and the scan pointer skips the pair.

          if Following = C then
             Accumulate_Checksum (C);
             Scan_Ptr := Scan_Ptr + 2;
             return True;
          end if;

          --  If there is no "first-char, blank, C" sequence either, then this
          --  is not the double character token.

          if Following /= ' ' or else Source (Scan_Ptr + 2) /= C then
             return False;
          end if;

          --  Here the two characters are separated by one blank. The error
          --  is posted on the blank, and the scan pointer then skips the
          --  blank and the second character.

          Scan_Ptr := Scan_Ptr + 1;
          Error_Msg_S ("no space allowed here");
          Scan_Ptr := Scan_Ptr + 2;
          return True;
       end Double_Char_Token;

       -----------------------------
       -- Error_Illegal_Character --
       -----------------------------

       procedure Error_Illegal_Character is
          Msg : constant String := "illegal character";

       begin
          --  The message must be posted before the scan pointer moves, since
          --  on entry Scan_Ptr designates the offending character.

          Error_Msg_S (Msg);
          Scan_Ptr := Scan_Ptr + 1;
       end Error_Illegal_Character;

       ----------------------------------
       -- Error_Illegal_Wide_Character --
       ----------------------------------

       procedure Error_Illegal_Wide_Character is
       begin
          --  The hint in the message names the wide character encoding
          --  control appropriate to the host: a switch in the usual case,
          --  a qualifier on OpenVMS.

          if not OpenVMS then
             Error_Msg_S
               ("illegal wide character, check -gnatW switch");
          else
             Error_Msg_S
               ("illegal wide character, check " &
                  "'/'W'I'D'E'_'C'H'A'R'A'C'T'E'R'_'E'N'C'O'D'I'N'G qualifier");
          end if;

          --  Step over the character at which the error was posted

          Scan_Ptr := Scan_Ptr + 1;
       end Error_Illegal_Wide_Character;

       ---------------------
       -- Error_Long_Line --
       ---------------------

       procedure Error_Long_Line is
          Flag_Location : constant Source_Ptr :=
                            Current_Line_Start + Hostparm.Max_Line_Length;
          --  The flag is placed Max_Line_Length characters past the start of
          --  the current line.

       begin
          Error_Msg ("this line is too long", Flag_Location);
       end Error_Long_Line;

       -------------------------------
       -- Error_No_Double_Underline --
       -------------------------------

       procedure Error_No_Double_Underline is
          Msg : constant String := "two consecutive underlines not permitted";

       begin
          --  Post the message at the current scan position, which is left
          --  unchanged.

          Error_Msg_S (Msg);
       end Error_No_Double_Underline;

       ----------
       -- Nlit --
       ----------

       procedure Nlit is

          --  Overview of processing: the leading decimal integer is scanned
          --  first. It is either the integer part of a decimal literal, or
          --  the base of a based literal (introduced by # or :). Digits that
          --  follow a point are accumulated into the same Uint value as the
          --  digits before it, with Scale counting (negatively) the number of
          --  digits after the point. An optional exponent is then added to
          --  (or subtracted from) the scale. On exit Token is set to either
          --  Tok_Real_Literal (a point was scanned) with Real_Literal_Value
          --  set, or Tok_Integer_Literal with Int_Literal_Value set.

          C : Character;
          --  Current source program character

          Base_Char : Character;
          --  Either # or : (character at start of based number)

          Base : Int;
          --  Value of base

          UI_Base : Uint;
          --  Value of base in Uint format

          UI_Int_Value : Uint;
          --  Value of integer scanned by Scan_Integer in Uint format

          UI_Num_Value : Uint;
          --  Value of integer in numeric value being scanned

          Scale : Int;
          --  Scale value for real literal

          UI_Scale : Uint;
          --  Scale in Uint format

          Exponent_Is_Negative : Boolean;
          --  Set true for negative exponent

          Extended_Digit_Value : Int;
          --  Extended digit value

          Point_Scanned : Boolean;
          --  Flag for decimal point scanned in numeric literal

          -----------------------
          -- Local Subprograms --
          -----------------------

          procedure Error_Digit_Expected;
          --  Signal error of bad digit, Scan_Ptr points to the location at
          --  which the digit was expected on input, and is unchanged on return.

          procedure Scan_Integer;
          --  Procedure to scan integer literal. On entry, Scan_Ptr points to
          --  a digit, on exit Scan_Ptr points past the last character of
          --  the integer.
          --  For each digit encountered, UI_Int_Value is multiplied by 10,
          --  and the value of the digit added to the result. In addition,
          --  the value in Scale is decremented by one for each actual digit
          --  scanned.

          --------------------------
          -- Error_Digit_Expected --
          --------------------------

          procedure Error_Digit_Expected is
          begin
             Error_Msg_S ("digit expected");
          end Error_Digit_Expected;

          ------------------
          -- Scan_Integer --
          ------------------

          procedure Scan_Integer is
             C : Character;
             --  Next character scanned

          begin
             C := Source (Scan_Ptr);

             --  Loop through digits (allowing underlines)

             --  Note that UI_Int_Value is not reset here, so the digits are
             --  appended to whatever value the caller left in it. Each pass
             --  through the loop starts with C being a digit.

             loop
                Accumulate_Checksum (C);
                UI_Int_Value :=
                  UI_Int_Value * 10 + (Character'Pos (C) - Character'Pos ('0'));
                Scan_Ptr := Scan_Ptr + 1;
                Scale := Scale - 1;
                C := Source (Scan_Ptr);

                if C = '_' then

                   --  Only one underline is added to the checksum, extra
                   --  consecutive underlines are flagged and skipped.

                   Accumulate_Checksum ('_');

                   loop
                      Scan_Ptr := Scan_Ptr + 1;
                      C := Source (Scan_Ptr);
                      exit when C /= '_';
                      Error_No_Double_Underline;
                   end loop;

                   --  An underline must be followed by a digit

                   if C not in '0' .. '9' then
                      Error_Digit_Expected;
                      exit;
                   end if;

                else
                   exit when C not in '0' .. '9';
                end if;
             end loop;

          end Scan_Integer;

          ----------------------------------
          -- Start of Processing for Nlit --
          ----------------------------------

       begin
          Base := 10;
          UI_Base := Uint_10;
          UI_Int_Value := Uint_0;
          Scale := 0;
          Scan_Integer;

          --  Scan_Integer decremented Scale for each digit of the leading
          --  integer. These digits precede any point, so Scale is set back
          --  to zero.

          Scale := 0;
          Point_Scanned := False;
          UI_Num_Value := UI_Int_Value;

          --  Various possibilities now for continuing the literal are
          --  period, E/e (for exponent), or :/# (for based literal).

          Scale := 0;
          C := Source (Scan_Ptr);

          if C = '.' then

             --  Scan out point, but do not scan past .. which is a range
             --  sequence, and must not be eaten up scanning a numeric literal.

             while C = '.' and then Source (Scan_Ptr + 1) /= '.' loop
                Accumulate_Checksum ('.');

                if Point_Scanned then
                   Error_Msg_S ("duplicate point ignored");
                end if;

                Point_Scanned := True;
                Scan_Ptr := Scan_Ptr + 1;
                C := Source (Scan_Ptr);

                if C not in '0' .. '9' then
                   Error_Msg
                     ("real literal cannot end with point", Scan_Ptr - 1);
                else
                   --  The fraction digits are appended to the integer part
                   --  already held in UI_Int_Value, and Scale goes negative
                   --  by the number of fraction digits.

                   Scan_Integer;
                   UI_Num_Value := UI_Int_Value;
                end if;
             end loop;

             --  Based literal case. The base is the value we already scanned.
             --  In the case of colon, we insist that the following character
             --  is indeed an extended digit or a period. This catches a number
             --  of common errors, as well as catching the well known tricky
             --  bug otherwise arising from "x : integer range 1 .. 10:= 6;"

          elsif C = '#'
            or else (C = ':' and then
                       (Source (Scan_Ptr + 1) = '.'
                          or else
                        Source (Scan_Ptr + 1) in '0' .. '9'
                          or else
                        Source (Scan_Ptr + 1) in 'A' .. 'Z'
                          or else
                        Source (Scan_Ptr + 1) in 'a' .. 'z'))
          then
             if C = ':' and then Warn_On_Obsolescent_Feature then
                Error_Msg_S
                  ("use of "":"" is an obsolescent feature ('R'M 'J.2(3))?");
                Error_Msg_S
                  ("\use ""'#"" instead?");
             end if;

             Accumulate_Checksum (C);
             Base_Char := C;
             UI_Base := UI_Int_Value;

             --  An out of range base is flagged, and scanning then continues
             --  as though the base were 16.

             if UI_Base < 2 or else UI_Base > 16 then
                Error_Msg_SC ("base not 2-16");
                UI_Base := Uint_16;
             end if;

             Base := UI_To_Int (UI_Base);
             Scan_Ptr := Scan_Ptr + 1;

             --  Scan out extended integer [. integer]

             C := Source (Scan_Ptr);
             UI_Int_Value := Uint_0;
             Scale := 0;

             loop
                if C in '0' .. '9' then
                   Accumulate_Checksum (C);
                   Extended_Digit_Value :=
                     Int'(Character'Pos (C)) - Int'(Character'Pos ('0'));

                elsif C in 'A' .. 'F' then

                   --  Adding 32 to the position of an upper case letter gives
                   --  the corresponding lower case letter, so the checksum
                   --  does not depend on the casing of extended digits.

                   Accumulate_Checksum (Character'Val (Character'Pos (C) + 32));
                   Extended_Digit_Value :=
                     Int'(Character'Pos (C)) - Int'(Character'Pos ('A')) + 10;

                elsif C in 'a' .. 'f' then
                   Accumulate_Checksum (C);
                   Extended_Digit_Value :=
                     Int'(Character'Pos (C)) - Int'(Character'Pos ('a')) + 10;

                else
                   Error_Msg_S ("extended digit expected");
                   exit;
                end if;

                --  A digit that is too large for the base is flagged, but is
                --  still accumulated into the value below.

                if Extended_Digit_Value >= Base then
                   Error_Msg_S ("digit '>= base");
                end if;

                UI_Int_Value := UI_Int_Value * UI_Base + Extended_Digit_Value;
                Scale := Scale - 1;
                Scan_Ptr := Scan_Ptr + 1;
                C := Source (Scan_Ptr);

                if C = '_' then
                   loop
                      Accumulate_Checksum ('_');
                      Scan_Ptr := Scan_Ptr + 1;
                      C := Source (Scan_Ptr);
                      exit when C /= '_';
                      Error_No_Double_Underline;
                   end loop;

                elsif C = '.' then
                   Accumulate_Checksum ('.');

                   if Point_Scanned then
                      Error_Msg_S ("duplicate point ignored");
                   end if;

                   Scan_Ptr := Scan_Ptr + 1;
                   C := Source (Scan_Ptr);
                   Point_Scanned := True;

                   --  Digits scanned from here on are after the point, so
                   --  restart the count of digits held in Scale.

                   Scale := 0;

                elsif C = Base_Char then

                   --  Closing delimiter matching the opening one

                   Accumulate_Checksum (C);
                   Scan_Ptr := Scan_Ptr + 1;
                   exit;

                elsif C = '#' or else C = ':' then
                   Error_Msg_S ("based number delimiters must match");
                   Scan_Ptr := Scan_Ptr + 1;
                   exit;

                elsif not Identifier_Char (C) then
                   if Base_Char = '#' then
                      Error_Msg_S ("missing '#");
                   else
                      Error_Msg_S ("missing ':");
                   end if;

                   exit;
                end if;

             end loop;

             UI_Num_Value := UI_Int_Value;
          end if;

          --  Scan out exponent

          --  Scale is only meaningful if a point was scanned, in the integer
          --  case it is discarded.

          if not Point_Scanned then
             Scale := 0;
             UI_Scale := Uint_0;
          else
             UI_Scale := UI_From_Int (Scale);
          end if;

          if Source (Scan_Ptr) = 'e' or else Source (Scan_Ptr) = 'E' then

             --  Lower case e is always used for the checksum, whatever the
             --  casing of the exponent letter in the source.

             Accumulate_Checksum ('e');
             Scan_Ptr := Scan_Ptr + 1;
             Exponent_Is_Negative := False;

             if Source (Scan_Ptr) = '+' then
                Accumulate_Checksum ('+');
                Scan_Ptr := Scan_Ptr + 1;

             elsif Source (Scan_Ptr) = '-' then
                Accumulate_Checksum ('-');

                if not Point_Scanned then
                   Error_Msg_S
                     ("negative exponent not allowed for integer literal");
                else
                   Exponent_Is_Negative := True;
                end if;

                Scan_Ptr := Scan_Ptr + 1;
             end if;

             --  The exponent digits are scanned into a fresh UI_Int_Value.
             --  The mantissa has already been saved in UI_Num_Value.

             UI_Int_Value := Uint_0;

             if Source (Scan_Ptr) in '0' .. '9' then
                Scan_Integer;
             else
                Error_Digit_Expected;
             end if;

             if Exponent_Is_Negative then
                UI_Scale := UI_Scale - UI_Int_Value;
             else
                UI_Scale := UI_Scale + UI_Int_Value;
             end if;
          end if;

          --  Case of real literal to be returned

          if Point_Scanned then
             Token := Tok_Real_Literal;
             Real_Literal_Value :=
               UR_From_Components (
                                   Num   => UI_Num_Value,
                                   Den   => -UI_Scale,
                                   Rbase => Base);

             --  Case of integer literal to be returned

          else
             Token := Tok_Integer_Literal;

             if UI_Scale = 0 then
                Int_Literal_Value := UI_Num_Value;

                --  Avoid doing possibly expensive calculations in cases like
                --  parsing 163E800_000# when semantics will not be done anyway.
                --  This is especially useful when parsing garbled input.

             elsif Operating_Mode /= Check_Syntax
               and then (Serious_Errors_Detected = 0 or else Try_Semantics)
             then
                Int_Literal_Value := UI_Num_Value * UI_Base ** UI_Scale;

             else
                Int_Literal_Value := No_Uint;

             end if;

          end if;

          return;

       end Nlit;

       ----------
       -- Slit --
       ----------

       procedure Slit is

          Delimiter : Character;
          --  Delimiter (first character of string)

          C : Character;
          --  Current source program character

          Code : Char_Code;
          --  Current character code value

          Err : Boolean;
          --  Error flag for Scan_Wide call

          procedure Error_Bad_String_Char;
          --  Signal bad character in string/character literal. On entry
          --  Scan_Ptr points to the improper character encountered during
          --  the scan. Scan_Ptr is not modified, so it still points to the bad
          --  character on return.

          procedure Error_Unterminated_String;
          --  Procedure called if a line terminator character is encountered
          --  during scanning a string, meaning that the string is not properly
          --  terminated.

          procedure Set_String;
          --  Procedure used to distinguish between string and operator symbol.
          --  On entry the string has been scanned out, and its characters start
          --  at Token_Ptr and end one character before Scan_Ptr. On exit Token
          --  is set to Tok_String_Literal or Tok_Operator_Symbol as
          --  appropriate, and Token_Node is appropriately initialized.
          --  In addition, in the operator symbol case, Token_Name is
          --  appropriately set.

          ---------------------------
          -- Error_Bad_String_Char --
          ---------------------------

          procedure Error_Bad_String_Char is
             Bad_Char : constant Character := Source (Scan_Ptr);
             --  The offending character, which the scan pointer designates

          begin
             --  Select the message according to the kind of character found.
             --  The scan pointer is not moved.

             case Bad_Char is
                when HT =>
                   Error_Msg_S ("horizontal tab not allowed in string");

                when VT | FF =>
                   Error_Msg_S ("format effector not allowed in string");

                when Upper_Half_Character =>
                   Error_Msg_S ("(Ada 83) upper half character not allowed");

                when others =>
                   Error_Msg_S ("control character not allowed in string");
             end case;
          end Error_Bad_String_Char;

          -------------------------------
          -- Error_Unterminated_String --
          -------------------------------

          procedure Error_Unterminated_String is
          begin
             --  The placement of the error flag is refined for lines such as:

             --     A := "this is an unterminated string;
             --     A := "this is an unterminated string &
             --     P(A, "this is a parameter that didn't get terminated);

             --  Trailing blanks and ampersands are backed over first, so that
             --  the flag goes at the start of such a trailing sequence rather
             --  than at its end. Only blanks need testing for white space,
             --  because a tab inside the string has already been diagnosed.
             --  Every source character backed over is also removed from the
             --  string being stored.

             --  The scan pointer itself is moved back to the flag position,
             --  since that is the better guess at what was intended.

             loop
                exit when Source (Scan_Ptr - 1) /= ' '
                  and then Source (Scan_Ptr - 1) /= '&';

                Scan_Ptr := Scan_Ptr - 1;
                Unstore_String_Char;
             end loop;

             --  Wrong terminator case, for lines such as:

             --     A := "this string uses the wrong terminator'
             --     A := "this string uses the wrong terminator' &

             --  A distinct message is given for these. A trailing single
             --  quote is not treated this way when the string was opened
             --  with a single quote, since that misuse has already been
             --  reported.

             if Delimiter /= '''
               and then Source (Scan_Ptr - 1) = '''
             then
                Unstore_String_Char;
                Error_Msg
                  ("incorrect string terminator character", Scan_Ptr - 1);
                return;
             end if;

             --  Back over a trailing semicolon, and over a right paren that
             --  immediately precedes that semicolon.

             if Source (Scan_Ptr - 1) = ';' then
                Scan_Ptr := Scan_Ptr - 1;
                Unstore_String_Char;

                if Source (Scan_Ptr - 1) = ')' then
                   Scan_Ptr := Scan_Ptr - 1;
                   Unstore_String_Char;
                end if;
             end if;

             Error_Msg_S ("missing string quote");
          end Error_Unterminated_String;

          ----------------
          -- Set_String --
          ----------------

          procedure Set_String is
             Op_Len : constant Int := Int (Scan_Ptr - Token_Ptr - 2);
             --  Distance from Token_Ptr to Scan_Ptr, less two. This is the
             --  source length of the literal without its delimiters, assuming
             --  Token_Ptr is at the opening delimiter and Scan_Ptr is just
             --  past the closing one (to be confirmed against the caller).

             function Upcase (C : Character) return Character;
             --  Returns the upper case letter corresponding to C if C is in
             --  'a' .. 'z', and C itself for any other character.

             ------------
             -- Upcase --
             ------------

             function Upcase (C : Character) return Character is
             begin
                if C in 'a' .. 'z' then
                   return Character'Val (Character'Pos (C) - 32);
                else
                   return C;
                end if;
             end Upcase;

          --  Start of processing for Set_String

          begin
             --  On entry Token_Name holds Error_Name. If the text between the
             --  delimiters spells an operator symbol, Token_Name is replaced
             --  by the matching Name_Op_xx value below. In every other case
             --  it is left untouched.

             case Op_Len is

                --  Single character operators

                when 1 =>
                   case Source (Token_Ptr + 1) is
                      when '=' => Token_Name := Name_Op_Eq;
                      when '>' => Token_Name := Name_Op_Gt;
                      when '<' => Token_Name := Name_Op_Lt;
                      when '+' => Token_Name := Name_Op_Add;
                      when '-' => Token_Name := Name_Op_Subtract;
                      when '&' => Token_Name := Name_Op_Concat;
                      when '*' => Token_Name := Name_Op_Multiply;
                      when '/' => Token_Name := Name_Op_Divide;
                      when others => null;
                   end case;

                --  Two character operators: **, /=, <=, >= and OR

                when 2 =>
                   declare
                      First  : constant Character := Source (Token_Ptr + 1);
                      Second : constant Character := Source (Token_Ptr + 2);

                   begin
                      case Second is
                         when '*' =>
                            if First = '*' then
                               Token_Name := Name_Op_Expon;
                            end if;

                         when '=' =>
                            case First is
                               when '/' => Token_Name := Name_Op_Ne;
                               when '<' => Token_Name := Name_Op_Le;
                               when '>' => Token_Name := Name_Op_Ge;
                               when others => null;
                            end case;

                         when 'R' | 'r' =>
                            if First = 'O' or else First = 'o' then
                               Token_Name := Name_Op_Or;
                            end if;

                         when others =>
                            null;
                      end case;
                   end;

                --  Three letter operators, matched without regard to case

                when 3 =>
                   declare
                      Word : constant String (1 .. 3) :=
                               (Upcase (Source (Token_Ptr + 1)),
                                Upcase (Source (Token_Ptr + 2)),
                                Upcase (Source (Token_Ptr + 3)));

                   begin
                      if Word = "AND" then
                         Token_Name := Name_Op_And;

                      elsif Word = "ABS" then
                         Token_Name := Name_Op_Abs;

                      elsif Word = "MOD" then
                         Token_Name := Name_Op_Mod;

                      elsif Word = "NOT" then
                         Token_Name := Name_Op_Not;

                      elsif Word = "REM" then
                         Token_Name := Name_Op_Rem;

                      elsif Word = "XOR" then
                         Token_Name := Name_Op_Xor;
                      end if;
                   end;

                --  No operator symbol has any other length

                when others =>
                   null;
             end case;

             --  Token_Name has changed only if an operator symbol was
             --  recognized. Anything else is an ordinary string literal.

             if Token_Name /= Error_Name then
                Token := Tok_Operator_Symbol;
             else
                Token := Tok_String_Literal;
             end if;

          end Set_String;

          ----------
          -- Slit --
          ----------

       begin
          --  On entry, Scan_Ptr points to the opening character of the string
          --  which is either a percent, double quote, or apostrophe
          --  (single quote). The latter case is an error detected by
          --  the character literal circuit.

          Delimiter := Source (Scan_Ptr);
          Accumulate_Checksum (Delimiter);
          Start_String;
          Scan_Ptr := Scan_Ptr + 1;

          --  Loop to scan out characters of string literal

          loop
             C := Source (Scan_Ptr);

             if C = Delimiter then
                Accumulate_Checksum (C);
                Scan_Ptr := Scan_Ptr + 1;
                exit when Source (Scan_Ptr) /= Delimiter;
                Code := Get_Char_Code (C);
                Accumulate_Checksum (C);
                Scan_Ptr := Scan_Ptr + 1;

             else
                if C = '"' and then Delimiter = '%' then
                   Error_Msg_S
                     ("quote not allowed in percent delimited string");
                   Code := Get_Char_Code (C);
                   Scan_Ptr := Scan_Ptr + 1;

                elsif (C = ESC
                         and then
                         Wide_Character_Encoding_Method
                                              in WC_ESC_Encoding_Method)
                  or else
                  (C in Upper_Half_Character
                     and then
                     Upper_Half_Encoding)
                  or else
                  (C = '['
                     and then
                     Source (Scan_Ptr + 1) = '"'
                     and then
                     Identifier_Char (Source (Scan_Ptr + 2)))
                then
                   Scan_Wide (Source, Scan_Ptr, Code, Err);
                   Accumulate_Checksum (Code);

                   if Err then
                      Error_Illegal_Wide_Character;
                      Code := Get_Char_Code (' ');
                   end if;

                else
                   Accumulate_Checksum (C);

                   if C not in Graphic_Character then
                      if C in Line_Terminator then
                         Error_Unterminated_String;
                         exit;

                      elsif C in Upper_Half_Character then
                         if Ada_83 then
                            Error_Bad_String_Char;
                         end if;

                      else
                         Error_Bad_String_Char;
                      end if;
                   end if;

                   Code := Get_Char_Code (C);
                   Scan_Ptr := Scan_Ptr + 1;
                end if;
             end if;

             Store_String_Char (Code);

             if not In_Character_Range (Code) then
                Wide_Character_Found := True;
             end if;
          end loop;

          String_Literal_Id := End_String;
          Set_String;
          return;

       end Slit;

    --  Start of body of Scan

    begin
       Prev_Token := Token;
       Prev_Token_Ptr := Token_Ptr;
       Token_Name := Error_Name;

       --  The following loop runs more than once only if a format effector
       --  (tab, vertical tab, form feed, line feed, carriage return) is
       --  encountered and skipped, or some error situation, such as an
       --  illegal character, is encountered.

       loop
          --  Skip past blanks, loop is opened up for speed

          while Source (Scan_Ptr) = ' ' loop

             if Source (Scan_Ptr + 1) /= ' ' then
                Scan_Ptr := Scan_Ptr + 1;
                exit;
             end if;

             if Source (Scan_Ptr + 2) /= ' ' then
                Scan_Ptr := Scan_Ptr + 2;
                exit;
             end if;

             if Source (Scan_Ptr + 3) /= ' ' then
                Scan_Ptr := Scan_Ptr + 3;
                exit;
             end if;

             if Source (Scan_Ptr + 4) /= ' ' then
                Scan_Ptr := Scan_Ptr + 4;
                exit;
             end if;

             if Source (Scan_Ptr + 5) /= ' ' then
                Scan_Ptr := Scan_Ptr + 5;
                exit;
             end if;

             if Source (Scan_Ptr + 6) /= ' ' then
                Scan_Ptr := Scan_Ptr + 6;
                exit;
             end if;

             if Source (Scan_Ptr + 7) /= ' ' then
                Scan_Ptr := Scan_Ptr + 7;
                exit;
             end if;

             Scan_Ptr := Scan_Ptr + 8;
          end loop;

          --  We are now at a non-blank character, which is the first character
          --  of the token we will scan, and hence the value of Token_Ptr.

          Token_Ptr := Scan_Ptr;

          --  Here begins the main case statement which transfers control on
          --  the basis of the non-blank character we have encountered.

          case Source (Scan_Ptr) is

          --  Line terminator characters

          when CR | LF | FF | VT => Line_Terminator_Case : begin

             --  Check line too long

             Check_End_Of_Line;

             --  Set Token_Ptr, if End_Of_Line is a token, for the case when
             --  it is a physical line.

             if End_Of_Line_Is_Token then
                Token_Ptr := Scan_Ptr;
             end if;

             declare
                Physical : Boolean;

             begin
                Skip_Line_Terminators (Scan_Ptr, Physical);

                --  If we are at start of physical line, update scan pointers
                --  to reflect the start of the new line.

                if Physical then
                   Current_Line_Start       := Scan_Ptr;
                   Start_Column             := Set_Start_Column;
                   First_Non_Blank_Location := Scan_Ptr;

                   --  If End_Of_Line is a token, we return it as it is
                   --  a physical line.

                   if End_Of_Line_Is_Token then
                      Token := Tok_End_Of_Line;
                      return;
                   end if;
                end if;
             end;
          end Line_Terminator_Case;

          --  Horizontal tab, just skip past it

          when HT =>
             if Style_Check then Style.Check_HT; end if;
             Scan_Ptr := Scan_Ptr + 1;

          --  End of file character, treated as an end of file only if it
          --  is the last character in the buffer, otherwise it is ignored.

          when EOF =>
             if Scan_Ptr = Source_Last (Current_Source_File) then
                Check_End_Of_Line;
                Token := Tok_EOF;
                return;

             else
                Scan_Ptr := Scan_Ptr + 1;
             end if;

          --  Ampersand

          when '&' =>
             Accumulate_Checksum ('&');

             if Source (Scan_Ptr + 1) = '&' then
                Error_Msg_S ("'&'& should be `AND THEN`");
                Scan_Ptr := Scan_Ptr + 2;
                Token := Tok_And;
                return;

             else
                Scan_Ptr := Scan_Ptr + 1;
                Token := Tok_Ampersand;
                return;
             end if;

          --  Asterisk (can be multiplication operator or double asterisk
          --  which is the exponentiation compound delimiter).

          when '*' =>
             Accumulate_Checksum ('*');

             if Source (Scan_Ptr + 1) = '*' then
                Accumulate_Checksum ('*');
                Scan_Ptr := Scan_Ptr + 2;
                Token := Tok_Double_Asterisk;
                return;

             else
                Scan_Ptr := Scan_Ptr + 1;
                Token := Tok_Asterisk;
                return;
             end if;

          --  Colon, which can either be an isolated colon, or part of an
          --  assignment compound delimiter.

          when ':' =>
             Accumulate_Checksum (':');

             if Double_Char_Token ('=') then
                Token := Tok_Colon_Equal;
                if Style_Check then Style.Check_Colon_Equal; end if;
                return;

             elsif Source (Scan_Ptr + 1) = '-'
               and then Source (Scan_Ptr + 2) /= '-'
             then
                Token := Tok_Colon_Equal;
                Error_Msg (":- should be :=", Scan_Ptr);
                Scan_Ptr := Scan_Ptr + 2;
                return;

             else
                Scan_Ptr := Scan_Ptr + 1;
                Token := Tok_Colon;
                if Style_Check then Style.Check_Colon; end if;
                return;
             end if;

          --  Left parenthesis

          when '(' =>
             Accumulate_Checksum ('(');
             Scan_Ptr := Scan_Ptr + 1;
             Token := Tok_Left_Paren;
             if Style_Check then Style.Check_Left_Paren; end if;
             return;

          --  Left bracket

          when '[' =>
             if Source (Scan_Ptr + 1) = '"' then
                Name_Len := 0;
                goto Scan_Identifier;

             else
                Error_Msg_S ("illegal character, replaced by ""(""");
                Scan_Ptr := Scan_Ptr + 1;
                Token := Tok_Left_Paren;
                return;
             end if;

          --  Left brace

          when '{' =>
             Error_Msg_S ("illegal character, replaced by ""(""");
             Scan_Ptr := Scan_Ptr + 1;
             Token := Tok_Left_Paren;
             return;

          --  Comma

          when ',' =>
             Accumulate_Checksum (',');
             Scan_Ptr := Scan_Ptr + 1;
             Token := Tok_Comma;
             if Style_Check then Style.Check_Comma; end if;
             return;

          --  Dot, which is either an isolated period, or part of a double
          --  dot compound delimiter sequence. We also check for the case of
          --  a digit following the period, to give a better error message.

          when '.' =>
             Accumulate_Checksum ('.');

             if Double_Char_Token ('.') then
                Token := Tok_Dot_Dot;
                if Style_Check then Style.Check_Dot_Dot; end if;
                return;

             elsif Source (Scan_Ptr + 1) in '0' .. '9' then
                Error_Msg_S ("numeric literal cannot start with point");
                Scan_Ptr := Scan_Ptr + 1;

             else
                Scan_Ptr := Scan_Ptr + 1;
                Token := Tok_Dot;
                return;
             end if;

          --  Equal, which can either be an equality operator, or part of the
          --  arrow (=>) compound delimiter.

          when '=' =>
             Accumulate_Checksum ('=');

             if Double_Char_Token ('>') then
                Token := Tok_Arrow;
                if Style_Check then Style.Check_Arrow; end if;
                return;

             elsif Source (Scan_Ptr + 1) = '=' then
                Error_Msg_S ("== should be =");
                Scan_Ptr := Scan_Ptr + 1;
             end if;

             Scan_Ptr := Scan_Ptr + 1;
             Token := Tok_Equal;
             return;

          --  Greater than, which can be a greater than operator, greater than
          --  or equal operator, or first character of a right label bracket.

          when '>' =>
             Accumulate_Checksum ('>');

             if Double_Char_Token ('=') then
                Token := Tok_Greater_Equal;
                return;

             elsif Double_Char_Token ('>') then
                Token := Tok_Greater_Greater;
                return;

             else
                Scan_Ptr := Scan_Ptr + 1;
                Token := Tok_Greater;
                return;
             end if;

          --  Less than, which can be a less than operator, less than or equal
          --  operator, or the first character of a left label bracket, or the
          --  first character of a box (<>) compound delimiter.

          when '<' =>
             Accumulate_Checksum ('<');

             if Double_Char_Token ('=') then
                Token := Tok_Less_Equal;
                return;

             elsif Double_Char_Token ('>') then
                Token := Tok_Box;
                if Style_Check then Style.Check_Box; end if;
                return;

             elsif Double_Char_Token ('<') then
                Token := Tok_Less_Less;
                return;

             else
                Scan_Ptr := Scan_Ptr + 1;
                Token := Tok_Less;
                return;
             end if;

          --  Minus, which is either a subtraction operator, or the first
          --  character of double minus starting a comment

          when '-' => Minus_Case : begin
             if Source (Scan_Ptr + 1) = '>' then
                Error_Msg_S ("invalid token");
                Scan_Ptr := Scan_Ptr + 2;
                Token := Tok_Arrow;
                return;

             elsif Source (Scan_Ptr + 1) /= '-' then
                Accumulate_Checksum ('-');
                Scan_Ptr := Scan_Ptr + 1;
                Token := Tok_Minus;
                return;

             --  Comment

             else -- Source (Scan_Ptr + 1) = '-' then
                if Style_Check then Style.Check_Comment; end if;
                Scan_Ptr := Scan_Ptr + 2;
                Start_Of_Comment := Scan_Ptr;

                --  Loop to scan comment (this loop runs more than once only if
                --  a horizontal tab or other non-graphic character is scanned)

                loop
                   --  Scan to non graphic character (opened up for speed)

                   loop
                      exit when Source (Scan_Ptr) not in Graphic_Character;
                      Scan_Ptr := Scan_Ptr + 1;
                      exit when Source (Scan_Ptr) not in Graphic_Character;
                      Scan_Ptr := Scan_Ptr + 1;
                      exit when Source (Scan_Ptr) not in Graphic_Character;
                      Scan_Ptr := Scan_Ptr + 1;
                      exit when Source (Scan_Ptr) not in Graphic_Character;
                      Scan_Ptr := Scan_Ptr + 1;
                      exit when Source (Scan_Ptr) not in Graphic_Character;
                      Scan_Ptr := Scan_Ptr + 1;
                   end loop;

                   --  Keep going if horizontal tab

                   if Source (Scan_Ptr) = HT then
                      if Style_Check then Style.Check_HT; end if;
                      Scan_Ptr := Scan_Ptr + 1;

                   --  Terminate scan of comment if line terminator

                   elsif Source (Scan_Ptr) in Line_Terminator then
                      exit;

                   --  Terminate scan of comment if end of file encountered
                   --  (embedded EOF character or real last character in file)

                   elsif Source (Scan_Ptr) = EOF then
                      exit;

                   --  Keep going if character in 80-FF range, or is ESC. These
                   --  characters are allowed in comments by RM-2.1(1), 2.7(2).
                   --  They are allowed even in Ada 83 mode according to the
                   --  approved AI. ESC was added to the AI in June 93.

                   elsif Source (Scan_Ptr) in Upper_Half_Character
                     or else Source (Scan_Ptr) = ESC
                   then
                      Scan_Ptr := Scan_Ptr + 1;

                   --  Otherwise we have an illegal comment character

                   else
                      Error_Illegal_Character;
                   end if;

                end loop;

                --  Note that, except when comments are tokens, we do NOT
                --  execute a return here, instead we fall through to reexecute
                --  the scan loop to look for a token.

                if Comment_Is_Token then
                   Name_Len := Integer (Scan_Ptr - Start_Of_Comment);
                   Name_Buffer (1 .. Name_Len) :=
                     String (Source (Start_Of_Comment .. Scan_Ptr - 1));
                   Comment_Id := Name_Find;
                   Token := Tok_Comment;
                   return;
                end if;
             end if;
          end Minus_Case;

          --  Double quote starting a string literal

          when '"' =>
             Slit;
             Post_Scan;
             return;

          --  Percent starting a string literal

          when '%' =>
             if Warn_On_Obsolescent_Feature then
                Error_Msg_S
                  ("use of ""'%"" is an obsolescent feature ('R'M 'J.2(4))?");
                Error_Msg_S
                  ("\use """""" instead?");
             end if;

             Slit;
             Post_Scan;
             return;

          --  Apostrophe. This can either be the start of a character literal,
          --  or an isolated apostrophe used in a qualified expression or an
          --  attribute. We treat it as a character literal if it does not
          --  follow a right parenthesis, identifier, the keyword ALL or
          --  a literal. This means that we correctly treat constructs like:

          --    A := CHARACTER'('A');

          --  Note that RM-2.2(7) does not require a separator between
          --  "CHARACTER" and "'" in the above.

          when ''' => Char_Literal_Case : declare
             Code : Char_Code;
             Err  : Boolean;

          begin
             Accumulate_Checksum (''');
             Scan_Ptr := Scan_Ptr + 1;

             --  Here is where we make the test to distinguish the cases. Treat
             --  as apostrophe if previous token is an identifier, right paren
             --  or the reserved word "all" (latter case as in A.all'Address)
             --  (or the reserved word "project" in project files).
             --  Also treat it as apostrophe after a literal (this catches
             --  some legitimate cases, like A."abs"'Address, and also gives
             --  better error behavior for impossible cases like 123'xxx).

             if Prev_Token = Tok_Identifier
                or else Prev_Token = Tok_Right_Paren
                or else Prev_Token = Tok_All
                or else Prev_Token = Tok_Project
                or else Prev_Token in Token_Class_Literal
             then
                Token := Tok_Apostrophe;
                if Style_Check then Style.Check_Apostrophe; end if;
                return;

             --  Otherwise the apostrophe starts a character literal

             else
                --  Case of wide character literal with ESC or [ encoding

                if (Source (Scan_Ptr) = ESC
                      and then
                     Wide_Character_Encoding_Method in WC_ESC_Encoding_Method)
                  or else
                    (Source (Scan_Ptr) in Upper_Half_Character
                      and then
                     Upper_Half_Encoding)
                  or else
                    (Source (Scan_Ptr) = '['
                      and then
                     Source (Scan_Ptr + 1) = '"')
                then
                   Scan_Wide (Source, Scan_Ptr, Code, Err);
                   Accumulate_Checksum (Code);

                   if Err then
                      Error_Illegal_Wide_Character;
                   end if;

                   if Source (Scan_Ptr) /= ''' then
                      Error_Msg_S ("missing apostrophe");
                   else
                      Scan_Ptr := Scan_Ptr + 1;
                   end if;

                --  If we do not find a closing quote in the expected place then
                --  assume that we have a misguided attempt at a string literal.

                --  However, if previous token is RANGE, then we return an
                --  apostrophe instead since this gives better error recovery

                elsif Source (Scan_Ptr + 1) /= ''' then

                   if Prev_Token = Tok_Range then
                      Token := Tok_Apostrophe;
                      return;

                   else
                      Scan_Ptr := Scan_Ptr - 1;
                      Error_Msg_S
                        ("strings are delimited by double quote character");
                      Slit;
                      Post_Scan;
                      return;
                   end if;

                --  Otherwise we have a (non-wide) character literal

                else
                   Accumulate_Checksum (Source (Scan_Ptr));

                   if Source (Scan_Ptr) not in Graphic_Character then
                      if Source (Scan_Ptr) in Upper_Half_Character then
                         if Ada_83 then
                            Error_Illegal_Character;
                         end if;

                      else
                         Error_Illegal_Character;
                      end if;
                   end if;

                   Code := Get_Char_Code (Source (Scan_Ptr));
                   Scan_Ptr := Scan_Ptr + 2;
                end if;

                --  Fall through here with Scan_Ptr updated past the closing
                --  quote, and Code set to the Char_Code value for the literal

                Accumulate_Checksum (''');
                Token := Tok_Char_Literal;
                Set_Character_Literal_Name (Code);
                Token_Name := Name_Find;
                Character_Code := Code;
                Post_Scan;
                return;
             end if;
          end Char_Literal_Case;

          --  Right parenthesis

          when ')' =>
             Accumulate_Checksum (')');
             Scan_Ptr := Scan_Ptr + 1;
             Token := Tok_Right_Paren;
             if Style_Check then Style.Check_Right_Paren; end if;
             return;

          --  Right bracket or right brace, treated as right paren

          when ']' | '}' =>
             Error_Msg_S ("illegal character, replaced by "")""");
             Scan_Ptr := Scan_Ptr + 1;
             Token := Tok_Right_Paren;
             return;

          --  Slash (can be division operator or first character of not equal)

          when '/' =>
             Accumulate_Checksum ('/');

             if Double_Char_Token ('=') then
                Token := Tok_Not_Equal;
                return;
             else
                Scan_Ptr := Scan_Ptr + 1;
                Token := Tok_Slash;
                return;
             end if;

          --  Semicolon

          when ';' =>
             Accumulate_Checksum (';');
             Scan_Ptr := Scan_Ptr + 1;
             Token := Tok_Semicolon;
             if Style_Check then Style.Check_Semicolon; end if;
             return;

          --  Vertical bar

          when '|' => Vertical_Bar_Case : begin
             Accumulate_Checksum ('|');

             --  Special check for || to give nice message

             if Source (Scan_Ptr + 1) = '|' then
                Error_Msg_S ("""'|'|"" should be `OR ELSE`");
                Scan_Ptr := Scan_Ptr + 2;
                Token := Tok_Or;
                return;

             else
                Scan_Ptr := Scan_Ptr + 1;
                Token := Tok_Vertical_Bar;
                if Style_Check then Style.Check_Vertical_Bar; end if;
                return;
             end if;
          end Vertical_Bar_Case;

          --  Exclamation, replacement character for vertical bar

          when '!' => Exclamation_Case : begin
             Accumulate_Checksum ('!');

             if Warn_On_Obsolescent_Feature then
                Error_Msg_S
                  ("use of ""'!"" is an obsolescent feature ('R'M 'J.2(2))?");
                Error_Msg_S
                  ("\use ""'|"" instead?");
             end if;

             if Source (Scan_Ptr + 1) = '=' then
                Error_Msg_S ("'!= should be /=");
                Scan_Ptr := Scan_Ptr + 2;
                Token := Tok_Not_Equal;
                return;

             else
                Scan_Ptr := Scan_Ptr + 1;
                Token := Tok_Vertical_Bar;
                return;
             end if;

          end Exclamation_Case;

          --  Plus

          when '+' => Plus_Case : begin
             Accumulate_Checksum ('+');
             Scan_Ptr := Scan_Ptr + 1;
             Token := Tok_Plus;
             return;
          end Plus_Case;

          --  Digits starting a numeric literal

          when '0' .. '9' =>
             Nlit;

             if Identifier_Char (Source (Scan_Ptr)) then
                Error_Msg_S
                  ("delimiter required between literal and identifier");
             end if;
             Post_Scan;
             return;

          --  Lower case letters

          when 'a' .. 'z' =>
             Name_Len := 1;
             Name_Buffer (1) := Source (Scan_Ptr);
             Accumulate_Checksum (Name_Buffer (1));
             Scan_Ptr := Scan_Ptr + 1;
             goto Scan_Identifier;

          --  Upper case letters

          when 'A' .. 'Z' =>
             Name_Len := 1;
             Name_Buffer (1) :=
               Character'Val (Character'Pos (Source (Scan_Ptr)) + 32);
             Accumulate_Checksum (Name_Buffer (1));
             Scan_Ptr := Scan_Ptr + 1;
             goto Scan_Identifier;

          --  Underline character

          when '_' =>
             if Special_Characters ('_') then
                Token_Ptr := Scan_Ptr;
                Scan_Ptr := Scan_Ptr + 1;
                Token := Tok_Special;
                Special_Character := '_';
                return;
             end if;

             Error_Msg_S ("identifier cannot start with underline");
             Name_Len := 1;
             Name_Buffer (1) := '_';
             Scan_Ptr := Scan_Ptr + 1;
             goto Scan_Identifier;

          --  Space (not possible, because we scanned past blanks)

          when ' ' =>
             raise Program_Error;

          --  Characters in top half of ASCII 8-bit chart

          when Upper_Half_Character =>

             --  Wide character case. Note that Scan_Identifier will issue
             --  an appropriate message if wide characters are not allowed
             --  in identifiers.

             if Upper_Half_Encoding then
                Name_Len := 0;
                goto Scan_Identifier;

             --  Otherwise we have OK Latin-1 character

             else
                --  Upper half characters may possibly be identifier letters
                --  but can never be digits, so Identifier_Char can be used
                --  to test for a valid start of identifier character.

                if Identifier_Char (Source (Scan_Ptr)) then
                   Name_Len := 0;
                   goto Scan_Identifier;
                else
                   Error_Illegal_Character;
                end if;
             end if;

          when ESC =>

             --  ESC character, possible start of identifier if wide characters
             --  using ESC encoding are allowed in identifiers, which we can
             --  tell by looking at the Identifier_Char flag for ESC, which is
             --  only true if these conditions are met.

             if Identifier_Char (ESC) then
                Name_Len := 0;
                goto Scan_Identifier;
             else
                Error_Illegal_Wide_Character;
             end if;

          --  Invalid control characters

          when NUL | SOH | STX | ETX | EOT | ENQ | ACK | BEL | BS  | SO  |
               SI  | DLE | DC1 | DC2 | DC3 | DC4 | NAK | SYN | ETB | CAN |
               EM  | FS  | GS  | RS  | US  | DEL
          =>
             Error_Illegal_Character;

          --  Invalid graphic characters

          when '#' | '$' | '?' | '@' | '`' | '\' | '^' | '~' =>
             --  If Set_Special_Character has been called for this character,
             --  set Scans.Special_Character and return a Special token.

             if Special_Characters (Source (Scan_Ptr)) then
                Token_Ptr := Scan_Ptr;
                Token := Tok_Special;
                Special_Character := Source (Scan_Ptr);
                Scan_Ptr := Scan_Ptr + 1;
                return;

             --  Otherwise, this is an illegal character

             else
                Error_Illegal_Character;
             end if;

          --  End switch on non-blank character

          end case;

       --  End loop past format effectors. The exit from this loop is by
       --  executing a return statement following completion of token scan
       --  (control never falls out of this loop to the code which follows)

       end loop;

       --  Identifier scanning routine. On entry, some initial characters
       --  of the identifier may have already been stored in Name_Buffer.
       --  If so, Name_Len has the number of characters stored. Otherwise
       --  Name_Len is set to zero on entry.

       <<Scan_Identifier>>

          --  This loop scans as fast as possible past lower half letters
          --  and digits, which we expect to be the most common characters.

          loop
             if Source (Scan_Ptr) in 'a' .. 'z'
               or else Source (Scan_Ptr) in '0' .. '9'
             then
                Name_Buffer (Name_Len + 1) := Source (Scan_Ptr);
                Accumulate_Checksum (Source (Scan_Ptr));

             elsif Source (Scan_Ptr) in 'A' .. 'Z' then
                Name_Buffer (Name_Len + 1) :=
                  Character'Val (Character'Pos (Source (Scan_Ptr)) + 32);
                Accumulate_Checksum (Name_Buffer (Name_Len + 1));
             else
                exit;
             end if;

             --  Open out the loop a couple of times for speed

             if Source (Scan_Ptr + 1) in 'a' .. 'z'
               or else Source (Scan_Ptr + 1) in '0' .. '9'
             then
                Name_Buffer (Name_Len + 2) := Source (Scan_Ptr + 1);
                Accumulate_Checksum (Source (Scan_Ptr + 1));

             elsif Source (Scan_Ptr + 1) in 'A' .. 'Z' then
                Name_Buffer (Name_Len + 2) :=
                  Character'Val (Character'Pos (Source (Scan_Ptr + 1)) + 32);
                Accumulate_Checksum (Name_Buffer (Name_Len + 2));

             else
                Scan_Ptr := Scan_Ptr + 1;
                Name_Len := Name_Len + 1;
                exit;
             end if;

             if Source (Scan_Ptr + 2) in 'a' .. 'z'
               or else Source (Scan_Ptr + 2) in '0' .. '9'
             then
                Name_Buffer (Name_Len + 3) := Source (Scan_Ptr + 2);
                Accumulate_Checksum (Source (Scan_Ptr + 2));

             elsif Source (Scan_Ptr + 2) in 'A' .. 'Z' then
                Name_Buffer (Name_Len + 3) :=
                  Character'Val (Character'Pos (Source (Scan_Ptr + 2)) + 32);
                Accumulate_Checksum (Name_Buffer (Name_Len + 3));
             else
                Scan_Ptr := Scan_Ptr + 2;
                Name_Len := Name_Len + 2;
                exit;
             end if;

             if Source (Scan_Ptr + 3) in 'a' .. 'z'
               or else Source (Scan_Ptr + 3) in '0' .. '9'
             then
                Name_Buffer (Name_Len + 4) := Source (Scan_Ptr + 3);
                Accumulate_Checksum (Source (Scan_Ptr + 3));

             elsif Source (Scan_Ptr + 3) in 'A' .. 'Z' then
                Name_Buffer (Name_Len + 4) :=
                  Character'Val (Character'Pos (Source (Scan_Ptr + 3)) + 32);
                Accumulate_Checksum (Name_Buffer (Name_Len + 4));

             else
                Scan_Ptr := Scan_Ptr + 3;
                Name_Len := Name_Len + 3;
                exit;
             end if;

             Scan_Ptr := Scan_Ptr + 4;
             Name_Len := Name_Len + 4;
          end loop;

          --  If we fall through, then we have encountered either an underline
          --  character, or an extended identifier character (i.e. one from the
          --  upper half), or a wide character, or an identifier terminator.
          --  The initial test speeds us up in the most common case where we
          --  have an identifier terminator. Note that ESC is an identifier
          --  character only if a wide character encoding method that uses
          --  ESC encoding is active, so if we find an ESC character we know
          --  that we have a wide character.

          if Identifier_Char (Source (Scan_Ptr)) then

             --  Case of underline

             if Source (Scan_Ptr) = '_' then
                Accumulate_Checksum ('_');

                --  Check error case of identifier ending with underscore
                --  In this case we ignore the underscore and do not store it.

                if not Identifier_Char (Source (Scan_Ptr + 1)) then
                   Error_Msg_S ("identifier cannot end with underline");
                   Scan_Ptr := Scan_Ptr + 1;

                --  Check error case of two underscores. In this case we do
                --  not store the first underscore (we will store the second)

                elsif Source (Scan_Ptr + 1) = '_' then
                      Error_No_Double_Underline;

                --  Normal case of legal underscore

                else
                   Name_Len := Name_Len + 1;
                   Name_Buffer (Name_Len) := '_';
                end if;

                Scan_Ptr := Scan_Ptr + 1;
                goto Scan_Identifier;

             --  Upper half character

             elsif Source (Scan_Ptr) in Upper_Half_Character
               and then not Upper_Half_Encoding
             then
                Accumulate_Checksum (Source (Scan_Ptr));
                Store_Encoded_Character
                  (Get_Char_Code (Fold_Lower (Source (Scan_Ptr))));
                Scan_Ptr := Scan_Ptr + 1;
                goto Scan_Identifier;

             --  Left bracket not followed by a quote terminates an identifier.
             --  This is an error, but we don't want to give a junk error msg
             --  about wide characters in this case!

             elsif Source (Scan_Ptr) = '['
               and then Source (Scan_Ptr + 1) /= '"'
             then
                null;

             --  We know we have a wide character encoding here (the current
             --  character is either ESC, left bracket, or an upper half
             --  character depending on the encoding method).

             else
                --  Scan out the wide character and insert the appropriate
                --  encoding into the name table entry for the identifier.

                declare
                   Sptr : constant Source_Ptr := Scan_Ptr;
                   Code : Char_Code;
                   Err  : Boolean;
                   Chr  : Character;

                begin
                   Scan_Wide (Source, Scan_Ptr, Code, Err);

                   --  If error, signal error

                   if Err then
                      Error_Illegal_Wide_Character;

                   --  If the character scanned is a normal identifier
                   --  character, then we treat it that way.

                   elsif In_Character_Range (Code)
                     and then Identifier_Char (Get_Character (Code))
                   then
                      Chr := Get_Character (Code);
                      Accumulate_Checksum (Chr);
                      Store_Encoded_Character
                        (Get_Char_Code (Fold_Lower (Chr)));

                   --  Character is not normal identifier character, store
                   --  it in encoded form.

                   else
                      Accumulate_Checksum (Code);
                      Store_Encoded_Character (Code);

                      --  Make sure we are allowing wide characters in
                      --  identifiers. Note that we allow wide character
                      --  notation for an OK identifier character. This
                      --  in particular allows bracket or other notation
                      --  to be used for upper half letters.

                      if Identifier_Character_Set /= 'w' then
                         Error_Msg
                           ("wide character not allowed in identifier", Sptr);
                      end if;
                   end if;
                end;

                goto Scan_Identifier;
             end if;
          end if;

          --  Scan of identifier is complete. The identifier is stored in
          --  Name_Buffer, and Scan_Ptr points past the last character.

          Token_Name := Name_Find;

          --  Here is where we check if it was a keyword

          if Get_Name_Table_Byte (Token_Name) /= 0
            and then (Ada_95 or else Token_Name not in Ada_95_Reserved_Words)
          then
             Token := Token_Type'Val (Get_Name_Table_Byte (Token_Name));

             --  Deal with possible style check for non-lower case keyword,
             --  but we don't treat ACCESS, DELTA, DIGITS, RANGE as keywords
             --  for this purpose if they appear as attribute designators.
             --  Actually we only check the first character for speed.

             if Style_Check
               and then Source (Token_Ptr) <= 'Z'
               and then (Prev_Token /= Tok_Apostrophe
                           or else
                             (Token /= Tok_Access
                                and then Token /= Tok_Delta
                                and then Token /= Tok_Digits
                                and then Token /= Tok_Range))
             then
                Style.Non_Lower_Case_Keyword;
             end if;

             --  We must reset Token_Name since this is not an identifier
             --  and if we leave Token_Name set, the parser gets confused
             --  because it thinks it is dealing with an identifier instead
             --  of the corresponding keyword.

             Token_Name := No_Name;
             return;

          --  It is an identifier after all

          else
             Token := Tok_Identifier;
             Post_Scan;
             return;
          end if;
    end Scan;
    --------------------------
    -- Set_Comment_As_Token --
    --------------------------

    procedure Set_Comment_As_Token (Value : Boolean) is
    begin
       --  Store the requested setting in Comment_Is_Token. Nothing else is
       --  done here; the flag is only recorded for later use.
       --  NOTE(review): judging by its name, the flag makes Scan return
       --  comments as tokens rather than skipping them. The code that reads
       --  it is not in this part of the file, so confirm there.

       Comment_Is_Token := Value;
    end Set_Comment_As_Token;

    ------------------------------
    -- Set_End_Of_Line_As_Token --
    ------------------------------

    procedure Set_End_Of_Line_As_Token (Value : Boolean) is
    begin
       --  Store the requested setting in End_Of_Line_Is_Token. Nothing else
       --  is done here; the flag is only recorded for later use.
       --  NOTE(review): judging by its name, the flag makes Scan return line
       --  terminators as tokens rather than skipping them. The code that
       --  reads it is not in this part of the file, so confirm there.

       End_Of_Line_Is_Token := Value;
    end Set_End_Of_Line_As_Token;

    ---------------------------
    -- Set_Special_Character --
    ---------------------------

    procedure Set_Special_Character (C : Character) is
    begin
       --  Only the characters tested below may be registered as special.
       --  These are the ones Scan would otherwise reject as an illegal
       --  character or, in the case of '_', as an identifier starting with
       --  an underline. Once the Special_Characters entry is set, Scan
       --  returns Tok_Special for that character instead. A request for any
       --  other character is silently ignored.

       if C = '#'
         or else C = '$'
         or else C = '_'
         or else C = '?'
         or else C = '@'
         or else C = '`'
         or else C = '\'
         or else C = '^'
         or else C = '~'
       then
          Special_Characters (C) := True;
       end if;
    end Set_Special_Character;

    ----------------------
    -- Set_Start_Column --
    ----------------------

    --  Note: it seems at first glance a little expensive to compute this value
    --  for every source line (since it is certainly not used for all source
    --  lines). On the other hand, it doesn't take much more work to skip past
    --  the initial white space on the line counting the columns than it would
    --  to scan past the white space using the standard scanning circuits.

    function Set_Start_Column return Column_Number is
       Start_Column : Column_Number := 0;
       --  Zero origin column reached so far. This is the function result.

    begin
       --  On entry Scan_Ptr is expected to designate the first character of
       --  a source line. On return Scan_Ptr designates the first character
       --  that is neither a blank nor a horizontal tab, and the result is
       --  the zero origin column of that character, with tab stops taken to
       --  be every eight columns.

       --  Outer loop scans past horizontal tab characters

       Tabs_Loop : loop

          --  Inner loop scans past blanks as fast as possible, bumping
          --  Scan_Ptr past the blanks and adjusting Start_Column to account
          --  for them. Up to seven characters are probed per iteration. The
          --  first probe that finds a non-blank tells us how many blanks to
          --  step over before leaving the loop. Only when all seven probes
          --  find blanks do we step over them and go round again.

          Blanks_Loop : loop
             if Source (Scan_Ptr) /= ' ' then
                exit Blanks_Loop;

             elsif Source (Scan_Ptr + 1) /= ' ' then
                Scan_Ptr := Scan_Ptr + 1;
                Start_Column := Start_Column + 1;
                exit Blanks_Loop;

             elsif Source (Scan_Ptr + 2) /= ' ' then
                Scan_Ptr := Scan_Ptr + 2;
                Start_Column := Start_Column + 2;
                exit Blanks_Loop;

             elsif Source (Scan_Ptr + 3) /= ' ' then
                Scan_Ptr := Scan_Ptr + 3;
                Start_Column := Start_Column + 3;
                exit Blanks_Loop;

             elsif Source (Scan_Ptr + 4) /= ' ' then
                Scan_Ptr := Scan_Ptr + 4;
                Start_Column := Start_Column + 4;
                exit Blanks_Loop;

             elsif Source (Scan_Ptr + 5) /= ' ' then
                Scan_Ptr := Scan_Ptr + 5;
                Start_Column := Start_Column + 5;
                exit Blanks_Loop;

             elsif Source (Scan_Ptr + 6) /= ' ' then
                Scan_Ptr := Scan_Ptr + 6;
                Start_Column := Start_Column + 6;
                exit Blanks_Loop;

             --  Seven blanks in a row, step over them and keep scanning

             else
                Scan_Ptr := Scan_Ptr + 7;
                Start_Column := Start_Column + 7;
             end if;
          end loop Blanks_Loop;

          --  Outer loop keeps going only if a horizontal tab follows. A tab
          --  moves the column to the next multiple of eight.

          if Source (Scan_Ptr) = HT then
             if Style_Check then
                Style.Check_HT;
             end if;

             Scan_Ptr := Scan_Ptr + 1;
             Start_Column := (Start_Column / 8) * 8 + 8;
          else
             exit Tabs_Loop;
          end if;
       end loop Tabs_Loop;

       return Start_Column;

    --  A constraint error can arise here only if checks are enabled and the
    --  line starts with so many blanks or tabs that the column no longer
    --  fits in Column_Number. The exact value is of no interest in such a
    --  case, so return the last value that was successfully computed rather
    --  than letting the exception escape from the scanner.

    exception
       when Constraint_Error =>
          return Start_Column;
    end Set_Start_Column;

 end Scng;