mirror of
https://github.com/yuzu-mirror/oaknut.git
synced 2026-02-21 04:24:41 +01:00
oaknut: Add ARMv8.2 instructions
This commit is contained in:
parent
9eb7cca885
commit
7470c76117
27
README.md
27
README.md
|
|
@ -1,6 +1,6 @@
|
|||
# Oaknut
|
||||
|
||||
*A C++20 assembler for AArch64 (ARMv8.1)*
|
||||
*A C++20 assembler for AArch64 (ARMv8.0 to ARMv8.2)*
|
||||
|
||||
Oaknut is a header-only library that allows one to dynamically assemble code in-memory at runtime.
|
||||
|
||||
|
|
@ -51,6 +51,7 @@ int main()
|
|||
Each AArch64 instruction corresponds to one emitter function. For a list of emitter functions see:
|
||||
* ARMv8.0: [general instructions](include/oaknut/impl/mnemonics_generic_v8.0.inc.hpp), [FP & SIMD instructions](include/oaknut/impl/mnemonics_fpsimd_v8.0.inc.hpp)
|
||||
* ARMv8.1: [general instructions](include/oaknut/impl/mnemonics_generic_v8.1.inc.hpp), [FP & SIMD instructions](include/oaknut/impl/mnemonics_fpsimd_v8.1.inc.hpp)
|
||||
* ARMv8.2: [general instructions](include/oaknut/impl/mnemonics_generic_v8.2.inc.hpp), [FP & SIMD instructions](include/oaknut/impl/mnemonics_fpsimd_v8.2.inc.hpp)
|
||||
|
||||
### Operands
|
||||
|
||||
|
|
@ -60,10 +61,10 @@ The `oaknut::util` namespace provides convenient names for operands for instruct
|
|||
|----|----|----|
|
||||
|W0, W1, ..., W30|`WReg`|32-bit general purpose registers|
|
||||
|X0, X1, ..., X30|`XReg`|64-bit general purpose registers|
|
||||
|WZR|WzrReg (convertable to `WReg`)|32-bit zero register|
|
||||
|XZR|ZrReg (convertable to `XReg`)|64-bit zero register|
|
||||
|WSP|WspReg (convertable to `WRegSp`)|32-bit stack pointer|
|
||||
|SP|SpReg (convertable to `XRegSp`)|64-bit stack pointer|
|
||||
|WZR|`WzrReg` (convertable to `WReg`)|32-bit zero register|
|
||||
|XZR|`ZrReg` (convertable to `XReg`)|64-bit zero register|
|
||||
|WSP|`WspReg` (convertable to `WRegSp`)|32-bit stack pointer|
|
||||
|SP|`SpReg` (convertable to `XRegSp`)|64-bit stack pointer|
|
||||
|B0, B1, ..., B31|`BReg`|8-bit scalar SIMD register|
|
||||
|H0, H1, ..., H31|`HReg`|16-bit scalar SIMD register|
|
||||
|S0, S1, ..., S31|`SReg`|32-bit scalar SIMD register|
|
||||
|
|
@ -74,14 +75,14 @@ For vector operations, you can specify registers like so:
|
|||
|
||||
|Name|Class| |
|
||||
|----|----|----|
|
||||
|V0.B8(), ...|`VReg_B8`|8 elements each 8 bits in size|
|
||||
|V0.B16(), ...|`VReg_B16`|16 elements each 8 bits in size|
|
||||
|V0.H4(), ...|`VReg_H4`|4 elements each 16 bits in size|
|
||||
|V0.H8(), ...|`VReg_H8`|8 elements each 16 bits in size|
|
||||
|V0.S2(), ...|`VReg_S2`|2 elements each 32 bits in size|
|
||||
|V0.S4(), ...|`VReg_S4`|4 elements each 32 bits in size|
|
||||
|V0.D1(), ...|`VReg_D1`|1 elements each 64 bits in size|
|
||||
|V0.D2(), ...|`VReg_D2`|2 elements each 64 bits in size|
|
||||
|V0.B8(), ...|`VReg_8B`|8 elements each 8 bits in size|
|
||||
|V0.B16(), ...|`VReg_16B`|16 elements each 8 bits in size|
|
||||
|V0.H4(), ...|`VReg_4H`|4 elements each 16 bits in size|
|
||||
|V0.H8(), ...|`VReg_8H`|8 elements each 16 bits in size|
|
||||
|V0.S2(), ...|`VReg_2S`|2 elements each 32 bits in size|
|
||||
|V0.S4(), ...|`VReg_4S`|4 elements each 32 bits in size|
|
||||
|V0.D1(), ...|`VReg_1D`|1 elements each 64 bits in size|
|
||||
|V0.D2(), ...|`VReg_2D`|2 elements each 64 bits in size|
|
||||
|
||||
And you can specify elements like so:
|
||||
|
||||
|
|
|
|||
855
include/oaknut/impl/mnemonics_fpsimd_v8.2.inc.hpp
Normal file
855
include/oaknut/impl/mnemonics_fpsimd_v8.2.inc.hpp
Normal file
|
|
@ -0,0 +1,855 @@
|
|||
// SPDX-FileCopyrightText: Copyright (c) 2022 merryhime <https://mary.rs>
|
||||
// SPDX-License-Identifier: MIT
|
||||
|
||||
void BCAX(VReg_16B rd, VReg_16B rn, VReg_16B rm, VReg_16B ra)
|
||||
{
|
||||
emit<"11001110001mmmmm0aaaaannnnnddddd", "d", "n", "m", "a">(rd, rn, rm, ra);
|
||||
}
|
||||
void EOR3(VReg_16B rd, VReg_16B rn, VReg_16B rm, VReg_16B ra)
|
||||
{
|
||||
emit<"11001110000mmmmm0aaaaannnnnddddd", "d", "n", "m", "a">(rd, rn, rm, ra);
|
||||
}
|
||||
void FABD(HReg rd, HReg rn, HReg rm)
|
||||
{
|
||||
emit<"01111110110mmmmm000101nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FABD(VReg_4H rd, VReg_4H rn, VReg_4H rm)
|
||||
{
|
||||
emit<"00101110110mmmmm000101nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FABD(VReg_8H rd, VReg_8H rn, VReg_8H rm)
|
||||
{
|
||||
emit<"01101110110mmmmm000101nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FABS(VReg_4H rd, VReg_4H rn)
|
||||
{
|
||||
emit<"0000111011111000111110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FABS(VReg_8H rd, VReg_8H rn)
|
||||
{
|
||||
emit<"0100111011111000111110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FACGE(HReg rd, HReg rn, HReg rm)
|
||||
{
|
||||
emit<"01111110010mmmmm001011nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FACGE(VReg_4H rd, VReg_4H rn, VReg_4H rm)
|
||||
{
|
||||
emit<"00101110010mmmmm001011nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FACGE(VReg_8H rd, VReg_8H rn, VReg_8H rm)
|
||||
{
|
||||
emit<"01101110010mmmmm001011nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FACGT(HReg rd, HReg rn, HReg rm)
|
||||
{
|
||||
emit<"01111110110mmmmm001011nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FACGT(VReg_4H rd, VReg_4H rn, VReg_4H rm)
|
||||
{
|
||||
emit<"00101110110mmmmm001011nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FACGT(VReg_8H rd, VReg_8H rn, VReg_8H rm)
|
||||
{
|
||||
emit<"01101110110mmmmm001011nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FADD(VReg_4H rd, VReg_4H rn, VReg_4H rm)
|
||||
{
|
||||
emit<"00001110010mmmmm000101nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FADD(VReg_8H rd, VReg_8H rn, VReg_8H rm)
|
||||
{
|
||||
emit<"01001110010mmmmm000101nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FADDP(HReg rd, VReg_2H rn)
|
||||
{
|
||||
emit<"0101111000110000110110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FADDP(VReg_4H rd, VReg_4H rn, VReg_4H rm)
|
||||
{
|
||||
emit<"00101110010mmmmm000101nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FADDP(VReg_8H rd, VReg_8H rn, VReg_8H rm)
|
||||
{
|
||||
emit<"01101110010mmmmm000101nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FCMEQ(HReg rd, HReg rn, HReg rm)
|
||||
{
|
||||
emit<"01011110010mmmmm001001nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FCMEQ(VReg_4H rd, VReg_4H rn, VReg_4H rm)
|
||||
{
|
||||
emit<"00001110010mmmmm001001nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FCMEQ(VReg_8H rd, VReg_8H rn, VReg_8H rm)
|
||||
{
|
||||
emit<"01001110010mmmmm001001nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FCMEQ(HReg rd, HReg rn, ImmConstFZero)
|
||||
{
|
||||
emit<"0101111011111000110110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCMEQ(VReg_4H rd, VReg_4H rn, ImmConstFZero)
|
||||
{
|
||||
emit<"0000111011111000110110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCMEQ(VReg_8H rd, VReg_8H rn, ImmConstFZero)
|
||||
{
|
||||
emit<"0100111011111000110110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCMGE(HReg rd, HReg rn, HReg rm)
|
||||
{
|
||||
emit<"01111110010mmmmm001001nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FCMGE(VReg_4H rd, VReg_4H rn, VReg_4H rm)
|
||||
{
|
||||
emit<"00101110010mmmmm001001nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FCMGE(VReg_8H rd, VReg_8H rn, VReg_8H rm)
|
||||
{
|
||||
emit<"01101110010mmmmm001001nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FCMGE(HReg rd, HReg rn, ImmConstFZero)
|
||||
{
|
||||
emit<"0111111011111000110010nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCMGE(VReg_4H rd, VReg_4H rn, ImmConstFZero)
|
||||
{
|
||||
emit<"0010111011111000110010nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCMGE(VReg_8H rd, VReg_8H rn, ImmConstFZero)
|
||||
{
|
||||
emit<"0110111011111000110010nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCMGT(HReg rd, HReg rn, HReg rm)
|
||||
{
|
||||
emit<"01111110110mmmmm001001nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FCMGT(VReg_4H rd, VReg_4H rn, VReg_4H rm)
|
||||
{
|
||||
emit<"00101110110mmmmm001001nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FCMGT(VReg_8H rd, VReg_8H rn, VReg_8H rm)
|
||||
{
|
||||
emit<"01101110110mmmmm001001nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FCMGT(HReg rd, HReg rn, ImmConstFZero)
|
||||
{
|
||||
emit<"0101111011111000110010nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCMGT(VReg_4H rd, VReg_4H rn, ImmConstFZero)
|
||||
{
|
||||
emit<"0000111011111000110010nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCMGT(VReg_8H rd, VReg_8H rn, ImmConstFZero)
|
||||
{
|
||||
emit<"0100111011111000110010nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCMLE(HReg rd, HReg rn, ImmConstFZero)
|
||||
{
|
||||
emit<"0111111011111000110110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCMLE(VReg_4H rd, VReg_4H rn, ImmConstFZero)
|
||||
{
|
||||
emit<"0010111011111000110110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCMLE(VReg_8H rd, VReg_8H rn, ImmConstFZero)
|
||||
{
|
||||
emit<"0110111011111000110110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCMLT(HReg rd, HReg rn, ImmConstFZero)
|
||||
{
|
||||
emit<"0101111011111000111010nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCMLT(VReg_4H rd, VReg_4H rn, ImmConstFZero)
|
||||
{
|
||||
emit<"0000111011111000111010nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCMLT(VReg_8H rd, VReg_8H rn, ImmConstFZero)
|
||||
{
|
||||
emit<"0100111011111000111010nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCVTAS(HReg rd, HReg rn)
|
||||
{
|
||||
emit<"0101111001111001110010nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCVTAS(VReg_4H rd, VReg_4H rn)
|
||||
{
|
||||
emit<"0000111001111001110010nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCVTAS(VReg_8H rd, VReg_8H rn)
|
||||
{
|
||||
emit<"0100111001111001110010nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCVTAU(HReg rd, HReg rn)
|
||||
{
|
||||
emit<"0111111001111001110010nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCVTAU(VReg_4H rd, VReg_4H rn)
|
||||
{
|
||||
emit<"0010111001111001110010nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCVTAU(VReg_8H rd, VReg_8H rn)
|
||||
{
|
||||
emit<"0110111001111001110010nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCVTMS(HReg rd, HReg rn)
|
||||
{
|
||||
emit<"0101111001111001101110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCVTMS(VReg_4H rd, VReg_4H rn)
|
||||
{
|
||||
emit<"0000111001111001101110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCVTMS(VReg_8H rd, VReg_8H rn)
|
||||
{
|
||||
emit<"0100111001111001101110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCVTMU(HReg rd, HReg rn)
|
||||
{
|
||||
emit<"0111111001111001101110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCVTMU(VReg_4H rd, VReg_4H rn)
|
||||
{
|
||||
emit<"0010111001111001101110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCVTMU(VReg_8H rd, VReg_8H rn)
|
||||
{
|
||||
emit<"0110111001111001101110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCVTNS(HReg rd, HReg rn)
|
||||
{
|
||||
emit<"0101111001111001101010nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCVTNS(VReg_4H rd, VReg_4H rn)
|
||||
{
|
||||
emit<"0000111001111001101010nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCVTNS(VReg_8H rd, VReg_8H rn)
|
||||
{
|
||||
emit<"0100111001111001101010nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCVTNU(HReg rd, HReg rn)
|
||||
{
|
||||
emit<"0111111001111001101010nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCVTNU(VReg_4H rd, VReg_4H rn)
|
||||
{
|
||||
emit<"0010111001111001101010nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCVTNU(VReg_8H rd, VReg_8H rn)
|
||||
{
|
||||
emit<"0110111001111001101010nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCVTPS(HReg rd, HReg rn)
|
||||
{
|
||||
emit<"0101111011111001101010nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCVTPS(VReg_4H rd, VReg_4H rn)
|
||||
{
|
||||
emit<"0000111011111001101010nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCVTPS(VReg_8H rd, VReg_8H rn)
|
||||
{
|
||||
emit<"0100111011111001101010nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCVTPU(HReg rd, HReg rn)
|
||||
{
|
||||
emit<"0111111011111001101010nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCVTPU(VReg_4H rd, VReg_4H rn)
|
||||
{
|
||||
emit<"0010111011111001101010nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCVTPU(VReg_8H rd, VReg_8H rn)
|
||||
{
|
||||
emit<"0110111011111001101010nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCVTZS(HReg rd, HReg rn)
|
||||
{
|
||||
emit<"0101111011111001101110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCVTZS(VReg_4H rd, VReg_4H rn)
|
||||
{
|
||||
emit<"0000111011111001101110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCVTZS(VReg_8H rd, VReg_8H rn)
|
||||
{
|
||||
emit<"0100111011111001101110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCVTZU(HReg rd, HReg rn)
|
||||
{
|
||||
emit<"0111111011111001101110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCVTZU(VReg_4H rd, VReg_4H rn)
|
||||
{
|
||||
emit<"0010111011111001101110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FCVTZU(VReg_8H rd, VReg_8H rn)
|
||||
{
|
||||
emit<"0110111011111001101110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FDIV(VReg_4H rd, VReg_4H rn, VReg_4H rm)
|
||||
{
|
||||
emit<"00101110010mmmmm001111nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FDIV(VReg_8H rd, VReg_8H rn, VReg_8H rm)
|
||||
{
|
||||
emit<"01101110010mmmmm001111nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FMAX(VReg_4H rd, VReg_4H rn, VReg_4H rm)
|
||||
{
|
||||
emit<"00001110010mmmmm001101nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FMAX(VReg_8H rd, VReg_8H rn, VReg_8H rm)
|
||||
{
|
||||
emit<"01001110010mmmmm001101nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FMAXNM(VReg_4H rd, VReg_4H rn, VReg_4H rm)
|
||||
{
|
||||
emit<"00001110010mmmmm000001nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FMAXNM(VReg_8H rd, VReg_8H rn, VReg_8H rm)
|
||||
{
|
||||
emit<"01001110010mmmmm000001nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FMAXNMP(HReg rd, VReg_2H rn)
|
||||
{
|
||||
emit<"0101111000110000110010nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FMAXNMP(VReg_4H rd, VReg_4H rn, VReg_4H rm)
|
||||
{
|
||||
emit<"00101110010mmmmm000001nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FMAXNMP(VReg_8H rd, VReg_8H rn, VReg_8H rm)
|
||||
{
|
||||
emit<"01101110010mmmmm000001nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FMAXNMV(HReg rd, VReg_4H rn)
|
||||
{
|
||||
emit<"0000111000110000110010nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FMAXNMV(HReg rd, VReg_8H rn)
|
||||
{
|
||||
emit<"0100111000110000110010nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FMAXP(HReg rd, VReg_2H rn)
|
||||
{
|
||||
emit<"0101111000110000111110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FMAXP(VReg_4H rd, VReg_4H rn, VReg_4H rm)
|
||||
{
|
||||
emit<"00101110010mmmmm001101nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FMAXP(VReg_8H rd, VReg_8H rn, VReg_8H rm)
|
||||
{
|
||||
emit<"01101110010mmmmm001101nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FMAXV(HReg rd, VReg_4H rn)
|
||||
{
|
||||
emit<"0000111000110000111110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FMAXV(HReg rd, VReg_8H rn)
|
||||
{
|
||||
emit<"0100111000110000111110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FMIN(VReg_4H rd, VReg_4H rn, VReg_4H rm)
|
||||
{
|
||||
emit<"00001110110mmmmm001101nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FMIN(VReg_8H rd, VReg_8H rn, VReg_8H rm)
|
||||
{
|
||||
emit<"01001110110mmmmm001101nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FMINNM(VReg_4H rd, VReg_4H rn, VReg_4H rm)
|
||||
{
|
||||
emit<"00001110110mmmmm000001nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FMINNM(VReg_8H rd, VReg_8H rn, VReg_8H rm)
|
||||
{
|
||||
emit<"01001110110mmmmm000001nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FMINNMP(HReg rd, VReg_2H rn)
|
||||
{
|
||||
emit<"0101111010110000110010nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FMINNMP(VReg_4H rd, VReg_4H rn, VReg_4H rm)
|
||||
{
|
||||
emit<"00101110110mmmmm000001nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FMINNMP(VReg_8H rd, VReg_8H rn, VReg_8H rm)
|
||||
{
|
||||
emit<"01101110110mmmmm000001nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FMINNMV(HReg rd, VReg_4H rn)
|
||||
{
|
||||
emit<"0000111010110000110010nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FMINNMV(HReg rd, VReg_8H rn)
|
||||
{
|
||||
emit<"0100111010110000110010nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FMINP(HReg rd, VReg_2H rn)
|
||||
{
|
||||
emit<"0101111010110000111110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FMINP(VReg_4H rd, VReg_4H rn, VReg_4H rm)
|
||||
{
|
||||
emit<"00101110110mmmmm001101nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FMINP(VReg_8H rd, VReg_8H rn, VReg_8H rm)
|
||||
{
|
||||
emit<"01101110110mmmmm001101nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FMINV(HReg rd, VReg_4H rn)
|
||||
{
|
||||
emit<"0000111010110000111110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FMINV(HReg rd, VReg_8H rn)
|
||||
{
|
||||
emit<"0100111010110000111110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FMLA(HReg rd, HReg rn, HElem em)
|
||||
{
|
||||
if (em.reg_index() >= 16)
|
||||
throw "InvalidCombination";
|
||||
emit<"0101111100LMmmmm0001H0nnnnnddddd", "d", "n", "m", "H", "L", "M">(rd, rn, em.reg_index(), em.elem_index() >> 2, (em.elem_index() >> 1) & 1, em.elem_index() & 1);
|
||||
}
|
||||
void FMLA(VReg_8B rd, VReg_8B rn, HElem em)
|
||||
{
|
||||
if (em.reg_index() >= 16)
|
||||
throw "InvalidCombination";
|
||||
emit<"0000111100LMmmmm0001H0nnnnnddddd", "d", "n", "m", "H", "L", "M">(rd, rn, em.reg_index(), em.elem_index() >> 2, (em.elem_index() >> 1) & 1, em.elem_index() & 1);
|
||||
}
|
||||
void FMLA(VReg_16B rd, VReg_16B rn, HElem em)
|
||||
{
|
||||
if (em.reg_index() >= 16)
|
||||
throw "InvalidCombination";
|
||||
emit<"0100111100LMmmmm0001H0nnnnnddddd", "d", "n", "m", "H", "L", "M">(rd, rn, em.reg_index(), em.elem_index() >> 2, (em.elem_index() >> 1) & 1, em.elem_index() & 1);
|
||||
}
|
||||
void FMLA(VReg_4H rd, VReg_4H rn, VReg_4H rm)
|
||||
{
|
||||
emit<"00001110010mmmmm000011nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FMLA(VReg_8H rd, VReg_8H rn, VReg_8H rm)
|
||||
{
|
||||
emit<"01001110010mmmmm000011nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FMLAL(VReg_2S rd, VReg_2H rn, HElem em)
|
||||
{
|
||||
if (em.reg_index() >= 16)
|
||||
throw "InvalidCombination";
|
||||
emit<"0000111110LMmmmm0000H0nnnnnddddd", "d", "n", "m", "H", "L", "M">(rd, rn, em.reg_index(), em.elem_index() >> 2, (em.elem_index() >> 1) & 1, em.elem_index() & 1);
|
||||
}
|
||||
void FMLAL(VReg_4S rd, VReg_4H rn, HElem em)
|
||||
{
|
||||
if (em.reg_index() >= 16)
|
||||
throw "InvalidCombination";
|
||||
emit<"0100111110LMmmmm0000H0nnnnnddddd", "d", "n", "m", "H", "L", "M">(rd, rn, em.reg_index(), em.elem_index() >> 2, (em.elem_index() >> 1) & 1, em.elem_index() & 1);
|
||||
}
|
||||
void FMLAL2(VReg_2S rd, VReg_2H rn, HElem em)
|
||||
{
|
||||
if (em.reg_index() >= 16)
|
||||
throw "InvalidCombination";
|
||||
emit<"0010111110LMmmmm1000H0nnnnnddddd", "d", "n", "m", "H", "L", "M">(rd, rn, em.reg_index(), em.elem_index() >> 2, (em.elem_index() >> 1) & 1, em.elem_index() & 1);
|
||||
}
|
||||
void FMLAL2(VReg_4S rd, VReg_4H rn, HElem em)
|
||||
{
|
||||
if (em.reg_index() >= 16)
|
||||
throw "InvalidCombination";
|
||||
emit<"0110111110LMmmmm1000H0nnnnnddddd", "d", "n", "m", "H", "L", "M">(rd, rn, em.reg_index(), em.elem_index() >> 2, (em.elem_index() >> 1) & 1, em.elem_index() & 1);
|
||||
}
|
||||
void FMLAL(VReg_2S rd, VReg_2H rn, VReg_2H rm)
|
||||
{
|
||||
emit<"00001110001mmmmm111011nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FMLAL(VReg_4S rd, VReg_4H rn, VReg_4H rm)
|
||||
{
|
||||
emit<"01001110001mmmmm111011nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FMLAL2(VReg_2S rd, VReg_2H rn, VReg_2H rm)
|
||||
{
|
||||
emit<"00101110001mmmmm110011nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FMLAL2(VReg_4S rd, VReg_4H rn, VReg_4H rm)
|
||||
{
|
||||
emit<"01101110001mmmmm110011nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FMLS(HReg rd, HReg rn, HElem em)
|
||||
{
|
||||
if (em.reg_index() >= 16)
|
||||
throw "InvalidCombination";
|
||||
emit<"0101111100LMmmmm0101H0nnnnnddddd", "d", "n", "m", "H", "L", "M">(rd, rn, em.reg_index(), em.elem_index() >> 2, (em.elem_index() >> 1) & 1, em.elem_index() & 1);
|
||||
}
|
||||
void FMLS(VReg_8B rd, VReg_8B rn, HElem em)
|
||||
{
|
||||
if (em.reg_index() >= 16)
|
||||
throw "InvalidCombination";
|
||||
emit<"0000111100LMmmmm0101H0nnnnnddddd", "d", "n", "m", "H", "L", "M">(rd, rn, em.reg_index(), em.elem_index() >> 2, (em.elem_index() >> 1) & 1, em.elem_index() & 1);
|
||||
}
|
||||
void FMLS(VReg_16B rd, VReg_16B rn, HElem em)
|
||||
{
|
||||
if (em.reg_index() >= 16)
|
||||
throw "InvalidCombination";
|
||||
emit<"0100111100LMmmmm0101H0nnnnnddddd", "d", "n", "m", "H", "L", "M">(rd, rn, em.reg_index(), em.elem_index() >> 2, (em.elem_index() >> 1) & 1, em.elem_index() & 1);
|
||||
}
|
||||
void FMLS(VReg_4H rd, VReg_4H rn, VReg_4H rm)
|
||||
{
|
||||
emit<"00001110110mmmmm000011nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FMLS(VReg_8H rd, VReg_8H rn, VReg_8H rm)
|
||||
{
|
||||
emit<"01001110110mmmmm000011nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FMLSL(VReg_2S rd, VReg_2H rn, HElem em)
|
||||
{
|
||||
if (em.reg_index() >= 16)
|
||||
throw "InvalidCombination";
|
||||
emit<"0000111110LMmmmm0100H0nnnnnddddd", "d", "n", "m", "H", "L", "M">(rd, rn, em.reg_index(), em.elem_index() >> 2, (em.elem_index() >> 1) & 1, em.elem_index() & 1);
|
||||
}
|
||||
void FMLSL(VReg_4S rd, VReg_4H rn, HElem em)
|
||||
{
|
||||
if (em.reg_index() >= 16)
|
||||
throw "InvalidCombination";
|
||||
emit<"0100111110LMmmmm0100H0nnnnnddddd", "d", "n", "m", "H", "L", "M">(rd, rn, em.reg_index(), em.elem_index() >> 2, (em.elem_index() >> 1) & 1, em.elem_index() & 1);
|
||||
}
|
||||
void FMLSL2(VReg_2S rd, VReg_2H rn, HElem em)
|
||||
{
|
||||
if (em.reg_index() >= 16)
|
||||
throw "InvalidCombination";
|
||||
emit<"0010111110LMmmmm1100H0nnnnnddddd", "d", "n", "m", "H", "L", "M">(rd, rn, em.reg_index(), em.elem_index() >> 2, (em.elem_index() >> 1) & 1, em.elem_index() & 1);
|
||||
}
|
||||
void FMLSL2(VReg_4S rd, VReg_4H rn, HElem em)
|
||||
{
|
||||
if (em.reg_index() >= 16)
|
||||
throw "InvalidCombination";
|
||||
emit<"0110111110LMmmmm1100H0nnnnnddddd", "d", "n", "m", "H", "L", "M">(rd, rn, em.reg_index(), em.elem_index() >> 2, (em.elem_index() >> 1) & 1, em.elem_index() & 1);
|
||||
}
|
||||
void FMLSL(VReg_2S rd, VReg_2H rn, VReg_2H rm)
|
||||
{
|
||||
emit<"00001110101mmmmm111011nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FMLSL(VReg_4S rd, VReg_4H rn, VReg_4H rm)
|
||||
{
|
||||
emit<"01001110101mmmmm111011nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FMLSL2(VReg_2S rd, VReg_2H rn, VReg_2H rm)
|
||||
{
|
||||
emit<"00101110101mmmmm110011nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FMLSL2(VReg_4S rd, VReg_4H rn, VReg_4H rm)
|
||||
{
|
||||
emit<"01101110101mmmmm110011nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FMOV(VReg_4H rd, FImm8 imm)
|
||||
{
|
||||
emit<"0000111100000vvv111111vvvvvddddd", "d", "v">(rd, imm);
|
||||
}
|
||||
void FMOV(VReg_8H rd, FImm8 imm)
|
||||
{
|
||||
emit<"0100111100000vvv111111vvvvvddddd", "d", "v">(rd, imm);
|
||||
}
|
||||
void FMUL(HReg rd, HReg rn, HElem em)
|
||||
{
|
||||
if (em.reg_index() >= 16)
|
||||
throw "InvalidCombination";
|
||||
emit<"0101111100LMmmmm1001H0nnnnnddddd", "d", "n", "m", "H", "L", "M">(rd, rn, em.reg_index(), em.elem_index() >> 2, (em.elem_index() >> 1) & 1, em.elem_index() & 1);
|
||||
}
|
||||
void FMUL(VReg_8B rd, VReg_8B rn, HElem em)
|
||||
{
|
||||
if (em.reg_index() >= 16)
|
||||
throw "InvalidCombination";
|
||||
emit<"0000111100LMmmmm1001H0nnnnnddddd", "d", "n", "m", "H", "L", "M">(rd, rn, em.reg_index(), em.elem_index() >> 2, (em.elem_index() >> 1) & 1, em.elem_index() & 1);
|
||||
}
|
||||
void FMUL(VReg_16B rd, VReg_16B rn, HElem em)
|
||||
{
|
||||
if (em.reg_index() >= 16)
|
||||
throw "InvalidCombination";
|
||||
emit<"0100111100LMmmmm1001H0nnnnnddddd", "d", "n", "m", "H", "L", "M">(rd, rn, em.reg_index(), em.elem_index() >> 2, (em.elem_index() >> 1) & 1, em.elem_index() & 1);
|
||||
}
|
||||
void FMUL(VReg_4H rd, VReg_4H rn, VReg_4H rm)
|
||||
{
|
||||
emit<"00101110010mmmmm000111nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FMUL(VReg_8H rd, VReg_8H rn, VReg_8H rm)
|
||||
{
|
||||
emit<"01101110010mmmmm000111nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FMULX(HReg rd, HReg rn, HReg rm)
|
||||
{
|
||||
emit<"01011110010mmmmm000111nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FMULX(VReg_4H rd, VReg_4H rn, VReg_4H rm)
|
||||
{
|
||||
emit<"00001110010mmmmm000111nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FMULX(VReg_8H rd, VReg_8H rn, VReg_8H rm)
|
||||
{
|
||||
emit<"01001110010mmmmm000111nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FMULX(HReg rd, HReg rn, HElem em)
|
||||
{
|
||||
if (em.reg_index() >= 16)
|
||||
throw "InvalidCombination";
|
||||
emit<"0111111100LMmmmm1001H0nnnnnddddd", "d", "n", "m", "H", "L", "M">(rd, rn, em.reg_index(), em.elem_index() >> 2, (em.elem_index() >> 1) & 1, em.elem_index() & 1);
|
||||
}
|
||||
void FMULX(VReg_8B rd, VReg_8B rn, HElem em)
|
||||
{
|
||||
if (em.reg_index() >= 16)
|
||||
throw "InvalidCombination";
|
||||
emit<"0010111100LMmmmm1001H0nnnnnddddd", "d", "n", "m", "H", "L", "M">(rd, rn, em.reg_index(), em.elem_index() >> 2, (em.elem_index() >> 1) & 1, em.elem_index() & 1);
|
||||
}
|
||||
void FMULX(VReg_16B rd, VReg_16B rn, HElem em)
|
||||
{
|
||||
if (em.reg_index() >= 16)
|
||||
throw "InvalidCombination";
|
||||
emit<"0110111100LMmmmm1001H0nnnnnddddd", "d", "n", "m", "H", "L", "M">(rd, rn, em.reg_index(), em.elem_index() >> 2, (em.elem_index() >> 1) & 1, em.elem_index() & 1);
|
||||
}
|
||||
void FNEG(VReg_4H rd, VReg_4H rn)
|
||||
{
|
||||
emit<"0010111011111000111110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FNEG(VReg_8H rd, VReg_8H rn)
|
||||
{
|
||||
emit<"0110111011111000111110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FRECPE(HReg rd, HReg rn)
|
||||
{
|
||||
emit<"0101111011111001110110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FRECPE(VReg_4H rd, VReg_4H rn)
|
||||
{
|
||||
emit<"0000111011111001110110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FRECPE(VReg_8H rd, VReg_8H rn)
|
||||
{
|
||||
emit<"0100111011111001110110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FRECPS(HReg rd, HReg rn, HReg rm)
|
||||
{
|
||||
emit<"01011110010mmmmm001111nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FRECPS(VReg_4H rd, VReg_4H rn, VReg_4H rm)
|
||||
{
|
||||
emit<"00001110010mmmmm001111nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FRECPS(VReg_8H rd, VReg_8H rn, VReg_8H rm)
|
||||
{
|
||||
emit<"01001110010mmmmm001111nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FRECPX(HReg rd, HReg rn)
|
||||
{
|
||||
emit<"0101111011111001111110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FRINTA(VReg_4H rd, VReg_4H rn)
|
||||
{
|
||||
emit<"0010111001111001100010nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FRINTA(VReg_8H rd, VReg_8H rn)
|
||||
{
|
||||
emit<"0110111001111001100010nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FRINTI(VReg_4H rd, VReg_4H rn)
|
||||
{
|
||||
emit<"0010111011111001100110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FRINTI(VReg_8H rd, VReg_8H rn)
|
||||
{
|
||||
emit<"0110111011111001100110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FRINTM(VReg_4H rd, VReg_4H rn)
|
||||
{
|
||||
emit<"0000111001111001100110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FRINTM(VReg_8H rd, VReg_8H rn)
|
||||
{
|
||||
emit<"0100111001111001100110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FRINTN(VReg_4H rd, VReg_4H rn)
|
||||
{
|
||||
emit<"0000111001111001100010nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FRINTN(VReg_8H rd, VReg_8H rn)
|
||||
{
|
||||
emit<"0100111001111001100010nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FRINTP(VReg_4H rd, VReg_4H rn)
|
||||
{
|
||||
emit<"0000111011111001100010nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FRINTP(VReg_8H rd, VReg_8H rn)
|
||||
{
|
||||
emit<"0100111011111001100010nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FRINTX(VReg_4H rd, VReg_4H rn)
|
||||
{
|
||||
emit<"0010111001111001100110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FRINTX(VReg_8H rd, VReg_8H rn)
|
||||
{
|
||||
emit<"0110111001111001100110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FRINTZ(VReg_4H rd, VReg_4H rn)
|
||||
{
|
||||
emit<"0000111011111001100110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FRINTZ(VReg_8H rd, VReg_8H rn)
|
||||
{
|
||||
emit<"0100111011111001100110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FRSQRTE(HReg rd, HReg rn)
|
||||
{
|
||||
emit<"0111111011111001110110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FRSQRTE(VReg_4H rd, VReg_4H rn)
|
||||
{
|
||||
emit<"0010111011111001110110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FRSQRTE(VReg_8H rd, VReg_8H rn)
|
||||
{
|
||||
emit<"0110111011111001110110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FRSQRTS(HReg rd, HReg rn, HReg rm)
|
||||
{
|
||||
emit<"01011110110mmmmm001111nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FRSQRTS(VReg_4H rd, VReg_4H rn, VReg_4H rm)
|
||||
{
|
||||
emit<"00001110110mmmmm001111nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FRSQRTS(VReg_8H rd, VReg_8H rn, VReg_8H rm)
|
||||
{
|
||||
emit<"01001110110mmmmm001111nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FSQRT(VReg_4H rd, VReg_4H rn)
|
||||
{
|
||||
emit<"0010111011111001111110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FSQRT(VReg_8H rd, VReg_8H rn)
|
||||
{
|
||||
emit<"0110111011111001111110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void FSUB(VReg_4H rd, VReg_4H rn, VReg_4H rm)
|
||||
{
|
||||
emit<"00001110110mmmmm000101nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void FSUB(VReg_8H rd, VReg_8H rn, VReg_8H rm)
|
||||
{
|
||||
emit<"01001110110mmmmm000101nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void RAX1(VReg_2D rd, VReg_2D rn, VReg_2D rm)
|
||||
{
|
||||
emit<"11001110011mmmmm100011nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void SCVTF(HReg rd, HReg rn)
|
||||
{
|
||||
emit<"0101111001111001110110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void SCVTF(VReg_4H rd, VReg_4H rn)
|
||||
{
|
||||
emit<"0000111001111001110110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void SCVTF(VReg_8H rd, VReg_8H rn)
|
||||
{
|
||||
emit<"0100111001111001110110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void SDOT(VReg_2S rd, VReg_8B rn, SElem em)
|
||||
{
|
||||
emit<"0000111110LMmmmm1110H0nnnnnddddd", "d", "n", "Mm", "H", "L">(rd, rn, em.reg_index(), em.elem_index() >> 1, em.elem_index() & 1);
|
||||
}
|
||||
void SDOT(VReg_4S rd, VReg_16B rn, SElem em)
|
||||
{
|
||||
emit<"0100111110LMmmmm1110H0nnnnnddddd", "d", "n", "Mm", "H", "L">(rd, rn, em.reg_index(), em.elem_index() >> 1, em.elem_index() & 1);
|
||||
}
|
||||
void SDOT(VReg_2S rd, VReg_8B rn, VReg_8B rm)
|
||||
{
|
||||
emit<"00001110100mmmmm100101nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void SDOT(VReg_4S rd, VReg_16B rn, VReg_16B rm)
|
||||
{
|
||||
emit<"01001110100mmmmm100101nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void SHA512H(QReg rd, QReg rn, VReg_2D rm)
|
||||
{
|
||||
emit<"11001110011mmmmm100000nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void SHA512H2(QReg rd, QReg rn, VReg_2D rm)
|
||||
{
|
||||
emit<"11001110011mmmmm100001nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void SHA512SU0(VReg_2D rd, VReg_2D rn)
|
||||
{
|
||||
emit<"1100111011000000100000nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void SHA512SU1(VReg_2D rd, VReg_2D rn, VReg_2D rm)
|
||||
{
|
||||
emit<"11001110011mmmmm100010nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void SM3PARTW1(VReg_4S rd, VReg_4S rn, VReg_4S rm)
|
||||
{
|
||||
emit<"11001110011mmmmm110000nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void SM3PARTW2(VReg_4S rd, VReg_4S rn, VReg_4S rm)
|
||||
{
|
||||
emit<"11001110011mmmmm110001nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void SM3SS1(VReg_4S rd, VReg_4S rn, VReg_4S rm, VReg_4S ra)
|
||||
{
|
||||
emit<"11001110010mmmmm0aaaaannnnnddddd", "d", "n", "m", "a">(rd, rn, rm, ra);
|
||||
}
|
||||
void SM3TT1A(VReg_4S rd, VReg_4S rn, SElem em)
|
||||
{
|
||||
emit<"11001110010mmmmm10ii00nnnnnddddd", "d", "n", "m", "i">(rd, rn, em.reg_index(), em.elem_index());
|
||||
}
|
||||
void SM3TT1B(VReg_4S rd, VReg_4S rn, SElem em)
|
||||
{
|
||||
emit<"11001110010mmmmm10ii01nnnnnddddd", "d", "n", "m", "i">(rd, rn, em.reg_index(), em.elem_index());
|
||||
}
|
||||
void SM3TT2A(VReg_4S rd, VReg_4S rn, SElem em)
|
||||
{
|
||||
emit<"11001110010mmmmm10ii10nnnnnddddd", "d", "n", "m", "i">(rd, rn, em.reg_index(), em.elem_index());
|
||||
}
|
||||
void SM3TT2B(VReg_4S rd, VReg_4S rn, SElem em)
|
||||
{
|
||||
emit<"11001110010mmmmm10ii11nnnnnddddd", "d", "n", "m", "i">(rd, rn, em.reg_index(), em.elem_index());
|
||||
}
|
||||
void SM4E(VReg_4S rd, VReg_4S rn)
|
||||
{
|
||||
emit<"1100111011000000100001nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void SM4EKEY(VReg_4S rd, VReg_4S rn, VReg_4S rm)
|
||||
{
|
||||
emit<"11001110011mmmmm110010nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void UCVTF(HReg rd, HReg rn)
|
||||
{
|
||||
emit<"0111111001111001110110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void UCVTF(VReg_4H rd, VReg_4H rn)
|
||||
{
|
||||
emit<"0010111001111001110110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void UCVTF(VReg_8H rd, VReg_8H rn)
|
||||
{
|
||||
emit<"0110111001111001110110nnnnnddddd", "d", "n">(rd, rn);
|
||||
}
|
||||
void UDOT(VReg_2S rd, VReg_8B rn, SElem em)
|
||||
{
|
||||
emit<"0010111110LMmmmm1110H0nnnnnddddd", "d", "n", "Mm", "H", "L">(rd, rn, em.reg_index(), em.elem_index() >> 1, em.elem_index() & 1);
|
||||
}
|
||||
void UDOT(VReg_4S rd, VReg_16B rn, SElem em)
|
||||
{
|
||||
emit<"0110111110LMmmmm1110H0nnnnnddddd", "d", "n", "Mm", "H", "L">(rd, rn, em.reg_index(), em.elem_index() >> 1, em.elem_index() & 1);
|
||||
}
|
||||
void UDOT(VReg_2S rd, VReg_8B rn, VReg_8B rm)
|
||||
{
|
||||
emit<"00101110100mmmmm100101nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void UDOT(VReg_4S rd, VReg_16B rn, VReg_16B rm)
|
||||
{
|
||||
emit<"01101110100mmmmm100101nnnnnddddd", "d", "n", "m">(rd, rn, rm);
|
||||
}
|
||||
void XAR(VReg_2D rd, VReg_2D rn, VReg_2D rm, Imm<6> rotate_amount)
|
||||
{
|
||||
emit<"11001110100mmmmmiiiiiinnnnnddddd", "d", "n", "m", "i">(rd, rn, rm, rotate_amount);
|
||||
}
|
||||
23
include/oaknut/impl/mnemonics_generic_v8.2.inc.hpp
Normal file
23
include/oaknut/impl/mnemonics_generic_v8.2.inc.hpp
Normal file
|
|
@ -0,0 +1,23 @@
|
|||
// SPDX-FileCopyrightText: Copyright (c) 2022 merryhime <https://mary.rs>
|
||||
// SPDX-License-Identifier: MIT
|
||||
|
||||
void BFC(WReg wd, Imm<5> lsb, Imm<5> width)
|
||||
{
|
||||
if (width.value() == 0 || width.value() > (32 - lsb.value()))
|
||||
throw "invalid width";
|
||||
emit<"0011001100rrrrrrssssss11111ddddd", "d", "r", "s">(wd, (-lsb.value()) & 31, width.value() - 1);
|
||||
}
|
||||
void BFC(XReg xd, Imm<6> lsb, Imm<6> width)
|
||||
{
|
||||
if (width.value() == 0 || width.value() > (64 - lsb.value()))
|
||||
throw "invalid width";
|
||||
emit<"1011001101rrrrrrssssss11111ddddd", "d", "r", "s">(xd, (-lsb.value()) & 63, width.value() - 1);
|
||||
}
|
||||
void ESB()
|
||||
{
|
||||
emit<"11010101000000110010001000011111">();
|
||||
}
|
||||
void PSB()
|
||||
{
|
||||
emit<"11010101000000110010001000111111">();
|
||||
}
|
||||
|
|
@ -28,6 +28,7 @@ struct HReg;
|
|||
struct SReg;
|
||||
struct DReg;
|
||||
struct QReg;
|
||||
struct VReg_2H;
|
||||
struct VReg_8B;
|
||||
struct VReg_4H;
|
||||
struct VReg_2S;
|
||||
|
|
@ -185,10 +186,10 @@ struct VReg : public Reg {
|
|||
};
|
||||
|
||||
struct VRegArranged : public Reg {
|
||||
protected:
|
||||
constexpr explicit VRegArranged(unsigned bitsize_, int index_, unsigned esize_)
|
||||
: Reg(true, bitsize_, index_), m_esize(esize_)
|
||||
{
|
||||
assert(bitsize_ == 64 || bitsize_ == 128);
|
||||
assert(esize_ != 0 && (esize_ & (esize_ - 1)) == 0 && "esize must be a power of two");
|
||||
assert(esize_ <= bitsize_);
|
||||
}
|
||||
|
|
@ -200,6 +201,15 @@ private:
|
|||
int m_esize : 8;
|
||||
};
|
||||
|
||||
struct VReg_2H : public VRegArranged {
|
||||
constexpr explicit VReg_2H(int reg_index_)
|
||||
: VRegArranged(32, reg_index_, 32 / 2)
|
||||
{}
|
||||
|
||||
template<typename Policy>
|
||||
friend class BasicCodeGenerator;
|
||||
};
|
||||
|
||||
struct VReg_8B : public VRegArranged {
|
||||
constexpr explicit VReg_8B(int reg_index_)
|
||||
: VRegArranged(64, reg_index_, 64 / 8)
|
||||
|
|
@ -445,6 +455,7 @@ struct VRegSelector {
|
|||
constexpr ElemSelector<SElem> S() const { return ElemSelector<SElem>(index()); }
|
||||
constexpr ElemSelector<DElem> D() const { return ElemSelector<DElem>(index()); }
|
||||
|
||||
constexpr VReg_2H H2() const { return VReg_2H{index()}; }
|
||||
constexpr VReg_8B B8() const { return VReg_8B{index()}; }
|
||||
constexpr VReg_4H H4() const { return VReg_4H{index()}; }
|
||||
constexpr VReg_2S S2() const { return VReg_2S{index()}; }
|
||||
|
|
|
|||
|
|
@ -100,8 +100,10 @@ public:
|
|||
|
||||
#include "oaknut/impl/mnemonics_fpsimd_v8.0.inc.hpp"
|
||||
#include "oaknut/impl/mnemonics_fpsimd_v8.1.inc.hpp"
|
||||
#include "oaknut/impl/mnemonics_fpsimd_v8.2.inc.hpp"
|
||||
#include "oaknut/impl/mnemonics_generic_v8.0.inc.hpp"
|
||||
#include "oaknut/impl/mnemonics_generic_v8.1.inc.hpp"
|
||||
#include "oaknut/impl/mnemonics_generic_v8.2.inc.hpp"
|
||||
|
||||
void RET()
|
||||
{
|
||||
|
|
|
|||
Loading…
Reference in a new issue