Add AArch64 instructions: FCVTZU, UCVTF, SQXTN, UQXTN.

woess · woess · commit d257b7dc6c69 · 2025-06-16T12:07:14.000+02:00
diff --git a/compiler/src/jdk.graal.compiler/src/jdk/graal/compiler/asm/aarch64/AArch64ASIMDAssembler.java b/compiler/src/jdk.graal.compiler/src/jdk/graal/compiler/asm/aarch64/AArch64ASIMDAssembler.java
@@ -625,16 +625,20 @@ public enum ASIMDInstruction {
         CMLT_ZERO(0b01010 << 12),
         ABS(0b01011 << 12),
         XTN(0b10010 << 12),
+        SQXTN(0b10100 << 12),
+        UQXTN(UBit | 0b10100 << 12),
         /* size 0x */
         FCVTN(0b10110 << 12),
         FCVTL(0b10111 << 12),
         SCVTF(0b11101 << 12),
+        UCVTF(UBit | 0b11101 << 12),
         /* size 1x */
         FCMGT_ZERO(0b01100 << 12),
         FCMEQ_ZERO(0b01101 << 12),
         FCMLT_ZERO(0b01110 << 12),
         FABS(0b01111 << 12),
         FCVTZS(0b11011 << 12),
+        FCVTZU(UBit | 0b11011 << 12),
         /* UBit 1, size xx */
         REV32(UBit | 0b00000 << 12),
         CMGE_ZERO(UBit | 0b01000 << 12),
@@ -1979,6 +1983,25 @@ public void fcvtzsVV(ASIMDSize size, ElementSize eSize, Register dst, Register s
         twoRegMiscEncoding(ASIMDInstruction.FCVTZS, size, elemSize1X(eSize), dst, src);
     }
 
+    /**
+     * Floating-point convert to unsigned integer, rounding toward zero (vector).<br>
+     * Unsigned counterpart of {@code fcvtzsVV}: same encoding path with FCVTZU as the opcode.
+     *
+     * @param size register size.
+     * @param eSize source element size. Must be ElementSize.Word or ElementSize.DoubleWord;
+     *            DoubleWord is only applicable when size is 128 (more than one element).
+     * @param dst SIMD register.
+     * @param src SIMD register.
+     */
+    public void fcvtzuVV(ASIMDSize size, ElementSize eSize, Register dst, Register src) {
+        assert usesMultipleLanes(size, eSize) : "Must use multiple lanes " + size + " " + eSize;
+        assert dst.getRegisterCategory().equals(SIMD) : dst;
+        assert src.getRegisterCategory().equals(SIMD) : src;
+        assert eSize == ElementSize.Word || eSize == ElementSize.DoubleWord : eSize;
+
+        twoRegMiscEncoding(ASIMDInstruction.FCVTZU, size, elemSize1X(eSize), dst, src);
+    }
+
     /**
      * C7.2.97 floating point divide vector.<br>
      *
@@ -2734,6 +2757,25 @@ public void scvtfVV(ASIMDSize size, ElementSize eSize, Register dst, Register sr
         twoRegMiscEncoding(ASIMDInstruction.SCVTF, size, elemSize0X(eSize), dst, src);
     }
 
+    /**
+     * Unsigned integer convert to floating-point (vector).<br>
+     * Unsigned counterpart of {@code scvtfVV}: same encoding path with UCVTF as the opcode.
+     *
+     * @param size register size.
+     * @param eSize source element size. Must be ElementSize.Word or ElementSize.DoubleWord;
+     *            DoubleWord is only applicable when size is 128 (more than one element).
+     * @param dst SIMD register.
+     * @param src SIMD register.
+     */
+    public void ucvtfVV(ASIMDSize size, ElementSize eSize, Register dst, Register src) {
+        assert usesMultipleLanes(size, eSize) : "Must use multiple lanes " + size + " " + eSize;
+        assert dst.getRegisterCategory().equals(SIMD) : dst;
+        assert src.getRegisterCategory().equals(SIMD) : src;
+        assert eSize == ElementSize.Word || eSize == ElementSize.DoubleWord : eSize;
+
+        twoRegMiscEncoding(ASIMDInstruction.UCVTF, size, elemSize0X(eSize), dst, src);
+    }
+
     /**
      * C7.2.239 SHA1 hash update.<br>
      *
@@ -4096,6 +4138,48 @@ public void xtn2VV(ElementSize dstESize, Register dst, Register src) {
         twoRegMiscEncoding(ASIMDInstruction.XTN, true, elemSizeXX(dstESize), dst, src);
     }
 
+    /**
+     * Signed saturating extract Narrow.<br>
+     * <p>
+     * From the manual: "This instruction reads each vector element from the source SIMD register,
+     * saturates each value to half the original width, places the result into a vector, and writes
+     * the vector to the destination SIMD register. All the values in this instruction are signed
+     * integer values."
+     *
+     * @param dstESize destination element size. Cannot be ElementSize.DoubleWord. The source
+     *            element size is twice this width.
+     * @param dst SIMD register that receives the narrowed elements.
+     * @param src SIMD register holding the elements to narrow.
+     */
+    public void sqxtnVV(ElementSize dstESize, Register dst, Register src) {
+        assert dst.getRegisterCategory().equals(SIMD) : dst;
+        assert src.getRegisterCategory().equals(SIMD) : src;
+        assert dstESize != ElementSize.DoubleWord : dstESize;
+        // NOTE(review): 'false' here vs. 'true' in xtn2VV; presumably selects the non-"2" form.
+        twoRegMiscEncoding(ASIMDInstruction.SQXTN, false, elemSizeXX(dstESize), dst, src);
+    }
+
+    /**
+     * Unsigned saturating extract Narrow.<br>
+     * <p>
+     * From the manual: "This instruction reads each vector element from the source SIMD register,
+     * saturates each value to half the original width, places the result into a vector, and writes
+     * the vector to the destination SIMD register. All the values in this instruction are unsigned
+     * integer values."
+     *
+     * @param dstESize destination element size. Cannot be ElementSize.DoubleWord. The source
+     *            element size is twice this width.
+     * @param dst SIMD register that receives the narrowed elements.
+     * @param src SIMD register holding the elements to narrow.
+     */
+    public void uqxtnVV(ElementSize dstESize, Register dst, Register src) {
+        assert dst.getRegisterCategory().equals(SIMD) : dst;
+        assert src.getRegisterCategory().equals(SIMD) : src;
+        assert dstESize != ElementSize.DoubleWord : dstESize;
+        // NOTE(review): 'false' here vs. 'true' in xtn2VV; presumably selects the non-"2" form.
+        twoRegMiscEncoding(ASIMDInstruction.UQXTN, false, elemSizeXX(dstESize), dst, src);
+    }
+
     /**
      * C7.2.403 Zip vectors (primary).
      * <p>
diff --git a/compiler/src/jdk.graal.compiler/src/jdk/graal/compiler/asm/aarch64/AArch64Assembler.java b/compiler/src/jdk.graal.compiler/src/jdk/graal/compiler/asm/aarch64/AArch64Assembler.java
@@ -97,6 +97,7 @@
 import static jdk.graal.compiler.asm.aarch64.AArch64Assembler.Instruction.FCVTAS;
 import static jdk.graal.compiler.asm.aarch64.AArch64Assembler.Instruction.FCVTMS;
 import static jdk.graal.compiler.asm.aarch64.AArch64Assembler.Instruction.FCVTZS;
+import static jdk.graal.compiler.asm.aarch64.AArch64Assembler.Instruction.FCVTZU;
 import static jdk.graal.compiler.asm.aarch64.AArch64Assembler.Instruction.FDIV;
 import static jdk.graal.compiler.asm.aarch64.AArch64Assembler.Instruction.FMADD;
 import static jdk.graal.compiler.asm.aarch64.AArch64Assembler.Instruction.FMAX;
@@ -151,6 +152,7 @@
 import static jdk.graal.compiler.asm.aarch64.AArch64Assembler.Instruction.TBNZ;
 import static jdk.graal.compiler.asm.aarch64.AArch64Assembler.Instruction.TBZ;
 import static jdk.graal.compiler.asm.aarch64.AArch64Assembler.Instruction.UBFM;
+import static jdk.graal.compiler.asm.aarch64.AArch64Assembler.Instruction.UCVTF;
 import static jdk.graal.compiler.asm.aarch64.AArch64Assembler.Instruction.UDIV;
 import static jdk.graal.compiler.asm.aarch64.AArch64Assembler.InstructionType.FP32;
 import static jdk.graal.compiler.asm.aarch64.AArch64Assembler.InstructionType.FP64;
@@ -1013,7 +1015,9 @@ public enum Instruction {
         FCVTMS(0x00100000),
 
         FCVTZS(0x00180000),
+        FCVTZU(0x00190000),
         SCVTF(0x00020000),
+        UCVTF(0x00030000),
 
         FABS(0x00008000),
         FSQRT(0x00018000),
@@ -3524,6 +3528,20 @@ public void fcvtzs(int dstSize, int srcSize, Register dst, Register src) {
         fcvtCpuFpuInstruction(FCVTZS, dst, src, generalFromSize(dstSize), floatFromSize(srcSize));
     }
 
+    /**
+     * Floating-point Convert to Unsigned integer, rounding toward Zero (scalar).
+     *
+     * @param dstSize size of integer register. 32 or 64.
+     * @param srcSize size of floating point register. 32 or 64.
+     * @param dst general purpose register. May not be null, the zero-register or the stackpointer.
+     * @param src floating point register. May not be null.
+     */
+    public void fcvtzu(int dstSize, int srcSize, Register dst, Register src) {
+        assert verifySizesAndRegistersRF(dstSize, srcSize, dst, src);
+        // Same operand order as fcvtzs: integer destination type first, FP source type second.
+        fcvtCpuFpuInstruction(FCVTZU, dst, src, generalFromSize(dstSize), floatFromSize(srcSize));
+    }
+
     /* Convert from Integer (5.7.4.2) */
     /**
      * C7.2.236 Signed integer Convert to Floating-point (scalar).
@@ -3539,6 +3557,20 @@ public void scvtf(int dstSize, int srcSize, Register dst, Register src) {
         fcvtCpuFpuInstruction(SCVTF, dst, src, floatFromSize(dstSize), generalFromSize(srcSize));
     }
 
+    /**
+     * Unsigned integer Convert to Floating-point (scalar); unsigned counterpart of {@code scvtf}.
+     *
+     * @param dstSize size of floating point register. 32 or 64.
+     * @param srcSize size of integer register. 32 or 64.
+     * @param dst floating point register. May not be null.
+     * @param src general purpose register. May not be null or the stackpointer.
+     */
+    public void ucvtf(int dstSize, int srcSize, Register dst, Register src) {
+        assert verifySizesAndRegistersFZ(dstSize, srcSize, dst, src);
+        // Same operand order as scvtf: FP destination type first, integer source type second.
+        fcvtCpuFpuInstruction(UCVTF, dst, src, floatFromSize(dstSize), generalFromSize(srcSize));
+    }
+
     private void fcvtCpuFpuInstruction(Instruction instr, Register dst, Register src, InstructionType type1, InstructionType type2) {
         emitInt(type1.encoding | type2.encoding | instr.encoding | FpConvertOp | rd(dst) | rs1(src));
     }