[Git][cmucl/cmucl][arm64-dev-1] 2 commits: Document integer-with-a-bite-out

24 Mar 2026


      Raymond Toy pushed to branch arm64-dev-1 at cmucl / cmucl


Commits:
f7324a79 by Raymond Toy at 2026-03-24T15:03:35-07:00
Document integer-with-a-bite-out

Not used in arm64, but let's just document what it does for posterity.
I always wondered what it did.

- - - - -
8555c8f4 by Raymond Toy at 2026-03-24T15:31:33-07:00
Update and fix positive-fixnum-bits.

Used Claude to update this.  The only major change is that fixnums are
currently only 30 bits long (not wider), to match the current 32-bit
lisps.  (Hopefully that will change some day.)

Documented the fpcr/fpsr layout which is pretty helpful.

And we're little-endian, not big-endian.

[skip-ci]

- - - - -


2 changed files:

- src/compiler/arm64/arith.lisp
- src/compiler/arm64/parms.lisp


Changes:

=====================================
src/compiler/arm64/arith.lisp
=====================================
@@ -772,6 +772,14 @@
   (:affected)
   (:policy :fast-safe))
 
+;;; INTEGER-WITH-A-BITE-OUT -- the full signed S-bit range with the top BITE
+;;; values removed from the upper end.  That is:
+;;;   (integer -(2^(s-1))  (2^(s-1) - bite - 1))
+;;;
+;;; Useful for immediate constants where the maximum positive value must be
+;;; avoided to prevent overflow in subsequent arithmetic.  Examples:
+;;;   (integer-with-a-bite-out 14 4) => (integer -8192 8187)  ; 14-bit signed, top 4 missing
+;;;   (integer-with-a-bite-out  8 1) => (integer -128   126)  ; 8-bit signed, top 1 missing
 (deftype integer-with-a-bite-out (s bite)
   (cond ((eq s '*) 'integer)
         ((and (integerp s) (> s 1))


=====================================
src/compiler/arm64/parms.lisp
=====================================
@@ -1,4 +1,4 @@
-;;; -*- Package: SPARC -*-
+;;; -*- Package: ARM64 -*-
 ;;;
 ;;; **********************************************************************
 ;;; This code was written as part of the CMU Common Lisp project at
@@ -10,49 +10,53 @@
 ;;; **********************************************************************
 ;;;
 ;;;    This file contains some parameterizations of various VM
-;;; attributes for ARM.  This file is separate from other stuff so 
-;;; that it can be compiled and loaded earlier. 
+;;; attributes for the ARM64 (AArch64) architecture.  This file is
+;;; separate from other stuff so that it can be compiled and loaded
+;;; earlier.
 ;;;
-;;; Converted from SPARC to ARM.
+;;; Written by Rob MacLachlan (original SPARC version).
+;;; Converted to ARM64 by [ARM64 port contributors].
+;;; Derived from the SPARC and PPC ports.
 ;;;
 
 (in-package "ARM64")
-;;(intl:textdomain "cmucl-sparc-vm")
+(intl:textdomain "cmucl-arm64-vm")
 (use-package "C")
 
-
+
 ;;;; Compiler constants.
 
 (eval-when (compile eval load)
 
-(adjoin :linux (backend-features *target-backend*))
 (setf (backend-name *target-backend*) "ARM64")
-(setf (backend-version *target-backend*)
-      "ARM64/Linux")
-
+(setf (backend-version *target-backend*) "ARM64/AArch64")
 (setf (backend-fasl-file-type *target-backend*) "arm64f")
 (setf (backend-fasl-file-implementation *target-backend*)
-      arm-fasl-file-implementation)
+      arm64-fasl-file-implementation)
 (setf (backend-fasl-file-version *target-backend*) byte-fasl-file-version)
 (setf (backend-register-save-penalty *target-backend*) 3)
-
-;; Only supporting little-endian ARM for now.
+;; AArch64 normally runs little-endian (big-endian data accesses can be
+;; enabled, but that is uncommon and not targeted here).
 (setf (backend-byte-order *target-backend*) :little-endian)
 (setf (backend-page-size *target-backend*) 4096)
 
+;;; Foreign linkage space.  The start address must match arm64-validate.h
+;;; and the entry size must agree with arm64-arch.c.  Each entry is an
+;;; ADRP + ADD + BR sequence (3 instructions = 12 bytes), rounded up to
+;;; 16 bytes for alignment.
 (setf (c::backend-foreign-linkage-space-start *target-backend*)
-      #x0f000000
+      #x0f800000
       (c::backend-foreign-linkage-entry-size *target-backend*)
-      ;; FIXME: Update this when we figure out how to do
-      ;; linkage-tables on ARM.
       16)
+
 ); eval-when
 
 (pushnew :new-assembler *features*)
 
-
+
 ;;;; Machine Architecture parameters:
 
+(eval-when (:compile-toplevel :load-toplevel :execute)
 (export '(word-bits byte-bits char-bits word-shift word-bytes char-bytes
 	  fixnum-tag-bits fixnum-tag-mask positive-fixnum-bits
 
@@ -76,10 +80,13 @@
 
 #+double-double
 (export '(double-double-float-digits))
-	  
+) ; eval-when
+
 
 (eval-when (compile load eval)
 
+;;; AArch64 is a 64-bit architecture: one Lisp descriptor occupies one
+;;; 64-bit word.
 (defconstant word-bits 64
   "Number of bits per word where a word holds one lisp descriptor.")
 
@@ -92,21 +99,22 @@
 (defconstant char-bytes (truncate char-bits byte-bits)
   "Number of bytes needed to represent a character")
 
+;;; word-shift = log2(word-bytes) = log2(8) = 3
 (defconstant word-shift (1- (integer-length (/ word-bits byte-bits)))
   "Number of bits to shift between word addresses and byte addresses.")
 
 (defconstant word-bytes (/ word-bits byte-bits)
   "Number of bytes in a word.")
 
+;;; AArch64 uses the same 3-bit lowtag scheme as SPARC/PPC.
 (defconstant lowtag-bits 3
   "Number of bits at the low end of a pointer used for type information.")
 
 (defconstant lowtag-mask (1- (ash 1 lowtag-bits))
   "Mask to extract the low tag bits from a pointer.")
-  
+
 (defconstant lowtag-limit (ash 1 lowtag-bits)
-  "Exclusive upper bound on the value of the low tag bits from a
-  pointer.")
+  "Exclusive upper bound on the value of the low tag bits from a pointer.")
 
 (defconstant fixnum-tag-bits (1- lowtag-bits)
   "Number of tag bits used for a fixnum")
@@ -114,15 +122,20 @@
 (defconstant fixnum-tag-mask (1- (ash 1 fixnum-tag-bits))
   "Mask to get the fixnum tag")
 
-(defconstant positive-fixnum-bits (- word-bits fixnum-tag-bits 1)
-  "Maximum number of bits in a positive fixnum")
+(defconstant positive-fixnum-bits (- 32 fixnum-tag-bits 1)
+  "Maximum number of bits in a positive fixnum.
+  Although the machine word is 64 bits, fixnums are kept within a
+  signed 32-bit range for compatibility with the rest of CMU CL.")
 
-;; FIXME: All of the IEEE-754 float parms should probably be split
-;; into a separate file to be shared by all platforms using standard
-;; IEEE-754 single and double precision floats.
+;;; Float layout constants.  The IEEE 754 formats are the same on every
+;;; architecture.  FLOAT-SIGN-SHIFT is the sign-bit position within a
+;;; 32-bit word: bit 31 of a single-float's encoding and, presumably,
+;;; bit 31 of the high 32-bit word of a double-float (bit 63 of the full
+;;; 64-bit encoding), as the high-word byte specs below suggest.
 (defconstant float-sign-shift 31)
 
-(defconstant single-float-bytes 4)	; Bytes to hold a single-float
+;;; Single-float (32-bit IEEE 754 binary32).  Identical to SPARC/PPC.
+(defconstant single-float-bytes 4)
 (defconstant single-float-bias 126)
 (defconstant single-float-exponent-byte (byte 8 23))
 (defconstant single-float-significand-byte (byte 23 0))
@@ -131,7 +144,8 @@
 (defconstant single-float-hidden-bit (ash 1 23))
 (defconstant single-float-trapping-nan-bit (ash 1 22))
 
-(defconstant double-float-bytes 8)	; Bytes to hold a double-float
+;;; Double-float (64-bit IEEE 754 binary64).  Identical to SPARC/PPC.
+(defconstant double-float-bytes 8)
 (defconstant double-float-bias 1022)
 (defconstant double-float-exponent-byte (byte 11 20))
 (defconstant double-float-significand-byte (byte 20 0))
@@ -143,63 +157,101 @@
 (defconstant single-float-digits
   (+ (byte-size single-float-significand-byte) 1))
 
+;;; double-float-digits = 20 + 32 + 1 = 53 (IEEE 754 binary64).
+;;; The literal 32 matches the SPARC formula; word-bits cannot be used
+;;; here because on ARM64 word-bits is 64, which would give the wrong answer.
 (defconstant double-float-digits
-  (+ (byte-size double-float-significand-byte) word-bits 1))
+  (+ (byte-size double-float-significand-byte) 32 1))
 
 #+double-double
 (defconstant double-double-float-digits
   (* 2 double-float-digits))
 
-;; ARM specific information
-;; See B6.1.39: FPSCR, Floating-point Status and Control Regiser, PMSA
-(defconstant float-denormal-trap-bit (ash 1 15))         ; IDE bit[15]
-(defconstant float-inexact-trap-bit (ash 1 12))          ; IXE bit[12]
-(defconstant float-underflow-trap-bit (ash 1 11))        ; UFE bit[11]
-(defconstant float-overflow-trap-bit (ash 1 10))         ; OFE bit[10]
-(defconstant float-divide-by-zero-trap-bit (ash 1 9))    ; DZE bit[9]
-(defconstant float-invalid-trap-bit (ash 1 8))           ; IOE bit[8]
-
-(defconstant float-round-to-nearest 0)  ; #b00 Round to Nearest
-(defconstant float-round-to-positive 1) ; #b01 Round towards Plus Infinity
-(defconstant float-round-to-negative 2) ; #b10 Round towards Minus Infinity
-(defconstant float-round-to-zero 3)     ; #b11 Round towards Zero
-
-(defconstant float-rounding-mode (byte 2 22))	  ; RMode bits[23:22]
-
-;; The trap enable bits are split with the IDE bit separate from the
-;; rest of the enable bits.  We're ignoring the IDE bit for now until
-;; float-traps support it.
-(defconstant float-traps-byte (byte 5 8))	  ; Trap enable bits
-;; There doesn't appear to be separate accrued (sticky) and current
-;; exceptions.  We also ignore the IDC bit.
-(defconstant float-sticky-bits (byte 5 0))	  ; Cumulative excection bits Bits[4:0]
-(defconstant float-exceptions-byte (byte 5 0))	  ; Same as cumulative
-
-;; Flush-to-zero bit
-(defconstant float-fast-bit (ash 1 24))
+;;; AArch64 FPCR/FPSR trap and rounding-mode bits.
+;;;
+;;; FPCR layout (Floating-Point Control Register):
+;;;   [23:22] RMode – Rounding mode
+;;;   [15]    IDE   – Input Denormal exception trap enable
+;;;   [12]    IXE   – Inexact trap enable
+;;;   [11]    UFE   – Underflow trap enable
+;;;   [10]    OFE   – Overflow trap enable
+;;;   [9]     DZE   – Divide-by-Zero trap enable
+;;;   [8]     IOE   – Invalid Operation trap enable
+;;;
+;;; FPSR layout (Floating-Point Status Register):
+;;;   [27]   QC   – Cumulative saturation (SIMD)
+;;;   [7]    IDC  – Input Denormal cumulative
+;;;   [6:5]  –    (reserved)
+;;;   Bits 0-4 of the low byte carry the IEEE exception sticky flags:
+;;;   [4]    IXC  – Inexact
+;;;   [3]    UFC  – Underflow
+;;;   [2]    OFC  – Overflow
+;;;   [1]    DZC  – Divide-by-Zero
+;;;   [0]    IOC  – Invalid Operation
+;;;
+;;; The trap-enable bits in FPCR use the same bit positions as FPSR
+;;; sticky flags, offset by 8.  We follow the SPARC convention and
+;;; name the FPCR trap-enable fields here; the runtime uses them when
+;;; installing/querying the floating-point environment.
+
+;;; Exception / trap-enable bit positions, relative to the start of the
+;;; FPCR trap-enable field (bit 8) and the FPSR flag field (bit 0).
+(defconstant float-inexact-trap-bit        (ash 1 4))  ; IXE / IXC
+(defconstant float-underflow-trap-bit      (ash 1 3))  ; UFE / UFC
+(defconstant float-overflow-trap-bit       (ash 1 2))  ; OFE / OFC
+(defconstant float-divide-by-zero-trap-bit (ash 1 1))  ; DZE / DZC
+(defconstant float-invalid-trap-bit        (ash 1 0))  ; IOE / IOC
+(defconstant float-imprecise-trap-bit float-inexact-trap-bit)
+
+;;; Rounding mode encoding in FPCR bits [23:22].
+(defconstant float-round-to-nearest  0)   ; RN  (ties to even)
+(defconstant float-round-to-positive 1)   ; RP
+(defconstant float-round-to-negative 2)   ; RM
+(defconstant float-round-to-zero     3)   ; RZ
+
+;;; Byte descriptors for fields within the 32-bit FPCR value.
+(defconstant float-rounding-mode   (byte 2 22))  ; RMode field
+(defconstant float-traps-byte      (byte 6  8))  ; trap-enable bits 8..13
+(defconstant float-exceptions-byte (byte 6  0))  ; FPSR sticky bits 0..5
+(defconstant float-sticky-bits     (byte 6  0))  ; alias for exceptions
+
+;;; Flush-to-zero / fast mode bit in FPCR.
+;;; When set, AArch64 flushes denormal inputs/outputs to zero
+;;; (comparable to the SPARC FSR NS, non-standard FP mode, bit).
+(defconstant float-fast-bit (ash 1 24))    ; FZ bit in FPCR
 
 ); eval-when
 
 ;;; NUMBER-STACK-DISPLACEMENT
 ;;;
 ;;; The number of bytes reserved above the number stack pointer.
-;;;
-;;; FIXME: Use the right value!
+;;; AArch64 does not have SPARC-style register windows, so no window-
+;;; spill area is needed.  One word (8 bytes) is reserved here; note that
+;;; AAPCS64 requires 16-byte SP alignment -- TODO confirm this value.
 (defconstant number-stack-displacement
-  0)
-
+  (* 1 vm:word-bytes))
+
+
 ;;;; Description of the target address space.
 
+(eval-when (:compile-toplevel :load-toplevel :execute)
 (export '(target-read-only-space-start
 	  target-static-space-start
 	  target-dynamic-space-start
 	  target-foreign-linkage-space-start
 	  target-foreign-linkage-entry-size))
+)
 
-;;; Where to put the different spaces.  Must match the C code!
-;;; 
+;;; Where to put the different spaces.  Must match the C code (arm64-validate.h)!
+;;;
+;;; AArch64 virtual address space is typically 48 bits (256 TiB) with the
+;;; low half available to user-space processes.  We place the Lisp spaces
+;;; at low addresses (dynamic space starts at 1 GiB), mirroring the SPARC
+;;; layout.  With 48-bit addressing the upper 16 bits of a 64-bit address
+;;; must all equal bit 47, so user-space addresses are in the range
+;;; 0x0000_0000_0000_0000 – 0x0000_7FFF_FFFF_FFFF.
 (defconstant target-read-only-space-start #x10000000)
-(defconstant target-static-space-start    #x30000000)
+(defconstant target-static-space-start    #x28000000)
 (defconstant target-dynamic-space-start   #x40000000)
 
 (defconstant target-foreign-linkage-space-start
@@ -207,12 +259,12 @@
 (defconstant target-foreign-linkage-entry-size
   (c:backend-foreign-linkage-entry-size *target-backend*))
 
-
+
 ;;;; Other random constants.
 
+(eval-when (:compile-toplevel :load-toplevel :execute)
 (export '(halt-trap pending-interrupt-trap error-trap cerror-trap
 	  breakpoint-trap function-end-breakpoint-trap
-	  not-implemented-trap
 	  after-breakpoint-trap allocation-trap
 	  pseudo-atomic-trap
 	  object-not-list-trap object-not-instance-trap
@@ -222,12 +274,15 @@
 #+heap-overflow-check
 (export '(dynamic-space-overflow-error-trap
 	  dynamic-space-overflow-warning-trap))
+)
 
-;; These values are used as the immediate value in a UDF instruction.
-;; Note that Linux on arm appears to use udf 16 as its trace/breakpoint
-;; trap, so we shouldn't use this for Lisp.
-(defenum (:suffix -trap :start 4)
-  function-header			; This value must be a multiple of 4!
+;;; Trap codes are encoded as the immediate operand of the UDF (Undefined
+;;; instruction) used to signal synchronous traps to the runtime.  The
+;;; encoding must match arm64-arch.c.
+;;;
+;;; We start at 8 (same as SPARC) to leave room for low values that may
+;;; be used by the OS or debugger.
+(defenum (:suffix -trap :start 8)
   halt
   pending-interrupt
   error
@@ -239,14 +294,10 @@
   dynamic-space-overflow-warning
   #+heap-overflow-check
   dynamic-space-overflow-error
-  not-implemented
-  ;; This is the trap number to use when a pseudo-atomic section has
-  ;; been interrupted.
-  pseudo-atomic
   )
 
 ;; Make sure this starts AFTER the last element of the above enum!
-(defenum (:prefix object-not- :suffix -trap :start 20)
+(defenum (:prefix object-not- :suffix -trap :start 16)
   list
   instance)
 
@@ -256,10 +307,12 @@
   function-prologue
   function-epilogue)
 
-
+
 ;;;; Static symbols.
 
+(eval-when (:compile-toplevel :load-toplevel :execute)
 (export '(static-symbols static-functions))
+)
 
 ;;; These symbols are loaded into static space directly after NIL so
 ;;; that the system can compute their address by adding a constant
@@ -303,8 +356,6 @@
     lisp::*free-interrupt-context-index*
     unix::*interrupts-enabled*
     unix::*interrupt-pending*
-    lisp::*pseudo-atomic-atomic*
-    lisp::*pseudo-atomic-interrupted*
 
     ;; Foreign linkage stuff
     #+linkage-table
@@ -314,22 +365,11 @@
     lisp::*cmucl-lib*
     lisp::*cmucl-core-path*
 
-    *binding-stack-pointer*
-
-    ;; The real C stack pointer
-    *number-stack-pointer*
-
-    ;; The number frame pointer (aka NFP)
-    *number-frame-pointer*
-
-    ;; Gc
-    #-gencgc
-    lisp::*allocation-pointer*
-    
     ;; Gencgc
-    ;;
     #+gencgc
     *current-region-free-pointer*
+    ;; current-region-end-addr holds a 64-bit (virtual) address; when read
+    ;; back from Lisp it is a fixnum shifted left by fixnum-tag-bits.
     #+gencgc
     *current-region-end-addr*
 
@@ -342,9 +382,13 @@
     :key-and-value
     :key-or-value
 
+    ;; FP constants
+    *fp-constant-0d0*
+    *fp-constant-0f0*
+
     lisp::*unidata-path*
     lisp::*lisp-implementation-version*
-    
+
     ;; Some spare static symbols.  Useful for adding another static
     ;; symbol without having to do a cross-compile.  Just rename one
     ;; of these to the desired name.
@@ -368,31 +412,51 @@
     ))
 
 
-
 ;;;; Assembler parameters:
 
-;;; The number of bits per element in the assemblers code vector.
-;;;
+;;; The number of bits per element in the assembler's code vector.
+;;; AArch64 instructions are always 32 bits wide (4 bytes), but the
+;;; assembler code-vector element unit is still 8-bit bytes, matching
+;;; every other CMU CL port.
 (defparameter *assembly-unit-length* 8)
 
-
-(export '(pseudo-atomic-trap
+
+(eval-when (:compile-toplevel :load-toplevel :execute)
+(export '(pseudo-atomic-trap allocation-trap
 	  pseudo-atomic-value pseudo-atomic-interrupted-value))
+)
+
+;;;; Pseudo-atomic trap number.
+;;;;
+;;;; On AArch64 we encode synchronous traps with UDF (permanently
+;;;; undefined instruction), whose 16-bit immediate is the trap code.
+;;;; There is no software-trap instruction analogous to SPARC's TRAP,
+;;;; so pseudo-atomic-trap is an alias for the pending-interrupt-trap
+;;;; UDF code.  The value must match arm64-arch.c.
+(defconstant pseudo-atomic-trap pending-interrupt-trap)
+
+;;;; Allocation trap number.
+;;;;
+;;;; This is the UDF immediate used when inline allocation overflows
+;;;; the current region.  Must match arm64-arch.c.
+(defconstant allocation-trap
+  ;; allocation-trap is encoded as the UDF immediate in macros.lisp.
+  ;; Re-export the value used there so C code and Lisp agree.
+  ;;
+  ;; The numeric value 31 (same as SPARC) is chosen to be distinct from
+  ;; all values in the halt..after-breakpoint range (8..14) and the
+  ;; object-not-*-trap range (16..17).
+  31)
+
 ;;;; Pseudo-atomic flag
 ;;;;
-;;;; This value is added to *pseudo-atomic-atomic* to indicate a
-;;;; pseudo-atomic section.
+;;;; This value is ORed into ALLOC-TN (X14) to mark a pseudo-atomic
+;;;; section, matching the SPARC and PPC convention of using the
+;;;; most-significant bit of the lowtag field (bit 2, value 4).
 (defconstant pseudo-atomic-value (ash 1 (1- vm::lowtag-bits)))
 
 ;;;; Pseudo-atomic-interrupted-mask
 ;;;;
-;;;; This is a mask used to check if a pseudo-atomic section was
-;;;; interrupted.  This is indicated by least-significant bit of
-;;;; *pseudo-atomic-atomic* being 1.
-;;;;
-;;;; FIXME: This is based on the sparc port where the pseudo-atomic
-;;;; stuff is implemented as bits on the alloc-tn.  We don't have an
-;;;; alloc-tn on ARM.  So should we emulate that using
-;;;; *pseudo-atomic-atomic* or use *pseudo-atomic-interrupted* as on
-;;;; x86?
+;;;; AArch64 (like SPARC) signals a pseudo-atomic interrupt via the
+;;;; least-significant bit of ALLOC-TN.
 (defconstant pseudo-atomic-interrupted-value 1)



View it on GitLab: https://gitlab.common-lisp.net/cmucl/cmucl/-/compare/ba1a3d4c081ff5f3765baa6...

-- 
View it on GitLab: https://gitlab.common-lisp.net/cmucl/cmucl/-/compare/ba1a3d4c081ff5f3765baa6...
You're receiving this email because of your account on gitlab.common-lisp.net. Manage all notifications: https://gitlab.common-lisp.net/-/profile/notifications | Help: https://gitlab.common-lisp.net/help

    

[Git][cmucl/cmucl][arm64-dev-1] 2 commits: Document integer-with-a-bite-out

Raymond Toy (＠rtoy)