Support hexadecimal floating-point constants.

2024-05-29 04:41:27 +00:00 · 2021-10-17 18:19:29 -05:00 · 2021-10-17 18:19:29 -05:00 · ad5063a9a3
commit ad5063a9a3
parent ba944e5675
3 changed files with 322 additions and 5 deletions
--- a/Scanner.asm
+++ b/Scanner.asm
@ -1,5 +1,305 @@
         mcopy scanner.macros
         datachk off
 ****************************************************************
 *
 *  ConvertHexFloat - Parse a hexadecimal floating-point constant
 *
 *  Inputs:
 *        str - pointer to the string (p-string)
 *
 *  Outputs:
 *        Returns the extended value (or a NAN on error).
 *
 ****************************************************************
 *
 ConvertHexFloat start scanner
         subroutine (4:str),26
 end_idx  equ   0                        index one past end of string
 got_period equ end_idx+2                flag: have we encountered a period?
 full     equ   got_period+2             flag: is mantissa full?
 mantissa equ   full+2                   mantissa
 extrabits equ  mantissa+8               extra bits that do not fit in mantissa
 exp_adjust equ extrabits+2              exponent adjustment
 negate_exp equ exp_adjust+2             flag: is exponent negative?
 exp      equ   negate_exp+2             exponent
 nonzero  equ   exp+2                    flag: is mantissa non-zero?
 got_digit equ  nonzero+2                flag: got any digit yet?
         stz   got_period               no period yet
         stz   full                     not full yet
         stz   negate_exp               assume positive exponent
         stz   got_digit                no digit yet
         stz   exp                      exponent value = 0
         stz   mantissa                 mantissa = 0.0
         stz   mantissa+2
         stz   mantissa+4
         stz   mantissa+6
         stz   extrabits                extrabits = 0
         lda   #63                      exponent adjustment = 63
         sta   exp_adjust
         lda   [str]                    end_idx = string length + 1 
         and   #$00FF
         inc   a
         sta   end_idx
         ldy   #1                       string index = 1
         jsr   nextch                   check for 0x or 0X prefix
         cmp   #'0'
         beq   check_x
         brl   error
 check_x  jsr   nextch
         and   #$df
         cmp   #'X'
         beq   digitlp
         brl   error
 digitlp  jsr   nextch                   get a character
         ldx   got_period               if there was no period yet
         bne   check_p
         cmp   #'.'                       if character is '.'
         bne   check_p
         dec   got_period                   flag that we got a period
         bra   digitlp                      loop for another digit
 check_p  cmp   #'p'                     if character is 'p' or 'P'
         beq   normal                     mantissa is done: normalize it
         cmp   #'P'
         beq   normal
         sta   got_digit                flag that we (presumably) got a digit
         jsr   hexdigit                 must be a hex digit: get value
         ldx   full                     if mantissa is full
         beq   donibble
         ora   extrabits                  record extra bits for rounding
         sta   extrabits
         lda   got_period                 if we are not past the period
         bne   digitlp
         lda   #4                           exp_adjust += 4
         clc
         adc   exp_adjust
 ;        bvs   error                        no overflow with p-string input
         sta   exp_adjust
         bra   digitlp                    loop for another digit
 donibble xba                            get nibble value in high bits
         asl   a
         asl   a
         asl   a
         asl   a
         ldx   #4                       for each bit in nibble:
 bitloop  bit   mantissa+6                 if mantissa is now full
         bpl   notfull
         inc   full                         full = true
         sta   extrabits                    record next bit(s) for rounding
         lda   got_period                   if we are not past the period
         bne   digitlp
         txa                                  exp_adjust += number of extra bits
         clc
         adc   exp_adjust
         sta   exp_adjust
         bra   digitlp                      loop for another digit
 notfull  asl   a                          shift bit into mantissa
         rol   mantissa
         rol   mantissa+2
         rol   mantissa+4
         rol   mantissa+6
         bit   got_period                 if we are past the period
         bpl   nextbit
         dec   exp_adjust                   exp_adjust-- (no overflow w/ p-str)
 nextbit  dex
         bne   bitloop
         bra   digitlp
 normal   lda   got_digit                check that there was a mantissa digit
         bne   chkzero
         brl   error
 chkzero  lda   mantissa                 check if mantissa is nonzero
         ora   mantissa+2
         ora   mantissa+4
         ora   mantissa+6
         sta   nonzero                  set nonzero flag as appropriate
         beq   do_exp                   if mantissa is nonzero, normalize:
         lda   mantissa+6                 if high bit of mantissa is not 1:
         bmi   do_exp                       do    
 normallp dec   exp_adjust                     exp_adjust--
         asl   mantissa                       shift mantissa left one bit
         rol   mantissa+2
         rol   mantissa+4
         rol   mantissa+6
         bpl   normallp                     while high bit of mantissa is not 1
 do_exp   jsr   nextch                   get next character
         cmp   #'+'                     if it is '+'
         bne   chkminus
         jsr   nextch                     ignore it and get next char
         bra   exploop
 chkminus cmp   #'-'                     else if it is '-'
         bne   exploop
         jsr   nextch                     get next character
         inc   negate_exp                 flag that exponent is negative
 exploop  jsr   decdigit                 for each exponent digit
         asl   exp                        exp = exp*10 + digit
         pei   exp
         bcs   bigexp
         bmi   bigexp
         asl   exp
         asl   exp
         bcs   bigexp
         bmi   bigexp
         adc   1,s
         bvs   bigexp
         clc
         adc   exp
         bvs   bigexp
         sta   exp
         pla
         jsr   nextch
         bpl   exploop
         bra   neg_exp
 bigexp   pla
         lda   #$7fff                   if exponent value overflows
         sta   exp                        exp = INT_MAX
 bigexplp jsr   nextch
         bpl   bigexplp
 neg_exp  lda   negate_exp               if exponent is negative
         beq   finalexp
         lda   exp                        negate exp
         eor   #$ffff
         inc   a
         sta   exp
 finalexp lda   exp                      add in exponent adjustment
         clc
         adc   exp_adjust
         bvc   expdone                  if addition overflows
         lda   #$7fff                     positive exponent -> INT_MAX
         ldx   negate_exp
         beq   expdone
         inc   a                          negative exponent -> INT_MIN
 expdone  ldx   nonzero                  if value is zero
         bne   bias
         txa                              exponent field = 0
         bra   storeexp
 bias     clc                            else
         adc   #16383                     compute biased exp. [-16385..49150]
 storeexp sta   exp
         cmp   #32767                   if it is [0..32766], it is valid
         blt   round
         cmp   #32767+16383+1           if it is larger, generate an infinity
         blt   inf                      otherwise, denormalize:
 denormlp lsr   mantissa+6               while biased exponent is negative:
         ror   mantissa+4                 shift mantissa left one bit
         ror   mantissa+2
         ror   mantissa
         ror   extrabits                  adjust extrabits
         bcc   dn_next
         lda   extrabits
         ora   #1
         sta   extrabits
 dn_next  inc   exp                        exp++
         bmi   denormlp
 round    lda   extrabits                implement SANE/IEEE round-to-nearest:
         cmp   #$8000                   if less than halfway to next number
         blt   done                       return value as-is
         bne   roundup                  if more than halfway to next: round up
         lda   mantissa                 if exactly halfway to next number
         lsr   a                          if least significant bit is 0
         bcc   done                         return value as-is
 roundup  inc   mantissa                 otherwise, round up to next number:
         bne   done                       increment mantissa
         inc   mantissa+2
         bne   done
         inc   mantissa+4
         bne   done
         inc   mantissa+6
         bne   done
         lda   #$8000                     if mantissa overflowed:
         sta   mantissa+6                   mantissa = 1.0
         inc   exp                          exp++ (could generate an infinity)
 done     jsr   nextch                   if we have not consumed the full input
         bpl   error                      flag an error
         lda   mantissa                 done: store return value
         sta   >retval
         lda   mantissa+2
         sta   >retval+2
         lda   mantissa+4
         sta   >retval+4
         lda   mantissa+6
         sta   >retval+6
         lda   exp
         sta   >retval+8
         bra   ret
 inf      lda   #32767                   infinity: exponent field = 32767
         sta   >retval+8                mantissa = 1.0
         inc   a
         sta   >retval+6
         asl   a
         sta   >retval+4
         sta   >retval+2
         sta   >retval+0
         bra   ret
 error    lda   #32767                   bad input: return NANASCBIN
         sta   >retval+8
         lda   #$C011
         sta   >retval+6
         lda   #0
         sta   >retval+4
         sta   >retval+2
         sta   >retval
 ret      lda   #retval
         sta   str
         lda   #^retval
         sta   str+2
         return 4:str
 ;get next character of string, or -1 if none (nz flags also set based on value)
 nextch   cpy   end_idx
         bge   no_ch
         lda   [str],y
         iny
         and   #$00FF
         rts
 no_ch    lda   #-1
         rts
 ;get value of A, taken as a hex digit
 ;branches to error if it is not a valid digit
 hexdigit cmp   #'0'
         blt   baddigit
         cmp   #'9'+1
         bge   letter
         and   #$000F
         rts
 letter   and   #$df
         cmp   #'A'
         blt   baddigit
         cmp   #'F'+1
         bge   baddigit
         and   #$000F
         adc   #9
         rts
 ;get value of A, taken as a decimal digit
 ;branches to error if it is not a valid digit
 decdigit cmp   #'0'
         blt   baddigit
         cmp   #'9'+1
         bge   baddigit
         and   #$000F
         rts
 baddigit pla
         brl   error
 retval   ds    10
         end
 ****************************************************************
 *
 *  Convertsl - Convert a string to a long integer
--- a/Scanner.pas
+++ b/Scanner.pas
@ -449,6 +449,10 @@ procedure Convertsll(var qval: longlong; var str: pString); extern;
 { Save the integer equivalent of the string to qval.  Assumes a }
 { valid 8-byte integer string; supports unsigned values.        }
 function ConvertHexFloat(var str: pString): extended; extern;
 { Return the extended equivalent of the hexadecimal floating-   }
 { point string.                                                 }
 procedure SetDateTime; extern;
@ -735,6 +739,7 @@ if list or (numErr <> 0) then begin
        165: msg := @'''\p'' may not be used in a prefixed string';
        166: msg := @'string literals with these prefixes may not be merged';
        167: msg := @'''L''-prefixed character or string constants are not supported by ORCA/C';
        168: msg := @'malformed hexadecimal floating constant';
         otherwise: Error(57);
         end; {case}
       writeln(msg^);
@ -3544,7 +3549,8 @@ else begin
            if c2 = 'B' then isBin := true;
            NextChar;
            GetDigits;
-            goto 1;
+            if not isHex or not (c2 in ['.','p','P']) then
               goto 1;
            end; {if}
   end;
 if c2 = '.' then begin                  {handle a decimal}
@ -3552,16 +3558,18 @@ if c2 = '.' then begin                  {handle a decimal}
   numString[stringIndex] := '.';
   NextChar;
   isReal := true;
-   if charKinds[ord(c2)] = digit then
+   if (charKinds[ord(c2)] = digit) or
      (isHex and (c2 in ['a'..'f','A'..'F'])) then
      GetDigits
   else if stringIndex = 2 then begin
      numString[3] := '0';
      stringIndex := 3;
      end; {else}
   end; {if}
-if c2 in ['e','E'] then begin           {handle an exponent}
+if (not isHex and (c2 in ['e','E']))    {handle an exponent}
   or (isHex and (c2 in ['p','P'])) then begin           
   stringIndex := stringIndex+1;
-   numString[stringIndex] := 'e';
+   numString[stringIndex] := c2;
   NextChar;
   isReal := true;
   if c2 in ['+','-'] then begin
@ -3622,7 +3630,12 @@ if isReal then begin                    {convert a real constant}
   else
      token.kind := doubleConst;
   token.class := realConstant;
-   if stringIndex > 80 then begin
+   if isHex then begin
      token.rval := ConvertHexFloat(numString);
      if token.rval <> token.rval then  {NAN => invalid format}
         FlagError(168);
      end {if}
   else if stringIndex > 80 then begin
      FlagError(131);
      token.rval := 0.0;
      end {if}
--- a/cc.notes
+++ b/cc.notes
@ -132,6 +132,8 @@ The discussion of escape sequences states that hexadecimal numeric escape sequen
 The value of an octal or hexadecimal escape sequence must be within the range of representable values in the relevant type (0-255 for char).  Also, \ may not be followed by a character other than one of the ones described as forming an escape sequence.  ORCA/C now gives an error in these cases.  Accordingly, the examples of "\410" and '\g' mentioned in the manual are now treated as errors.
 Floating-point constants may now be written in a new hexadecimal format.  See "New Language Features," below. 
 p. 241
 The 'f', 'F', 'l', or 'L' suffixes on floating-point constants do now affect the semantic type of those constants, although they do not change the constant's precision or range (which are always those of the SANE extended format).
@ -436,6 +438,8 @@ Generic selection expressions are primarily useful within macros, which can give
 23. (C11) Character constants and string literals may now have prefixes indicating they should use Unicode encodings.  The prefixes u8, u, and U indicate UTF-8, UTF-16, and UTF-32 encodings, respectively.  The u8 prefix may only be used on string literals.  The U and u prefixes may be used on string literals or character constants.  U- and u-prefixed character constants have the types char32_t and char16_t (as defined in <uchar.h>); U- and u-prefixed string literals are treated as arrays of those types.  For example, the string literal U"abc" designates an array with four members of type char32_t: the three letters encoded in UTF-32, plus a null terminator.
 24. (C99) Floating-point constants may now be expressed in a hexadecimal format.  These consist of a leading 0X or 0x, followed by a sequence of hexadecimal digits optionally containing a period, then P or p, then an exponent expressed as a sequence of decimal digits optionally preceded by + or -.  These designate the number given by the hexadecimal digit sequence (with any digits after the period being the fractional part) multiplied by 2 raised to the specified exponent.  For example, the constant 0xF.8p-1 is equivalent to 7.75. 
 Multi-Character Character Constants
 -----------------------------------