#pragma once #ifdef LLVM_AVAILABLE #ifdef _MSC_VER #pragma warning(push, 0) #else #pragma GCC diagnostic push #pragma GCC diagnostic ignored "-Wall" #pragma GCC diagnostic ignored "-Wextra" #pragma GCC diagnostic ignored "-Wold-style-cast" #pragma GCC diagnostic ignored "-Wunused-parameter" #pragma GCC diagnostic ignored "-Wstrict-aliasing" #pragma GCC diagnostic ignored "-Weffc++" #pragma GCC diagnostic ignored "-Wmissing-noreturn" #pragma GCC diagnostic ignored "-Wredundant-decls" #endif #include "llvm/IR/LLVMContext.h" #include "llvm/ExecutionEngine/ExecutionEngine.h" #include "llvm/IR/IRBuilder.h" #include "llvm/IR/Module.h" #include "llvm/Target/TargetMachine.h" #include "llvm/Support/KnownBits.h" #include "llvm/Support/ModRef.h" #include "llvm/Analysis/ConstantFolding.h" #include "llvm/Analysis/ValueTracking.h" #include "llvm/IR/IntrinsicsX86.h" #include "llvm/IR/IntrinsicsAArch64.h" #ifdef _MSC_VER #pragma warning(pop) #else #pragma GCC diagnostic pop #endif #include "util/types.hpp" #include "util/sysinfo.hpp" #include "Utilities/StrFmt.h" #include "Utilities/BitField.h" #include "Utilities/JIT.h" #include "util/v128.hpp" #include #include // Helper function llvm::Value* peek_through_bitcasts(llvm::Value*); enum class i2 : char { }; enum class i4 : char { }; template concept LLVMType = (std::is_pointer_v) && (std::is_base_of_v>); template concept LLVMValue = (std::is_pointer_v) && (std::is_base_of_v>); template concept DSLValue = requires (T& v) { { v.eval(std::declval*>()) } -> LLVMValue; }; template struct get_int_bits { }; template <> struct get_int_bits<1> { using utype = bool; }; template <> struct get_int_bits<2> { using utype = i2; }; template <> struct get_int_bits<4> { using utype = i4; }; template <> struct get_int_bits<8> { using utype = u8; }; template <> struct get_int_bits<16> { using utype = u16; }; template <> struct get_int_bits<32> { using utype = u32; }; template <> struct get_int_bits<64> { using utype = u64; }; template <> struct 
get_int_bits<128> { using utype = u128; }; template using get_int_vt = typename get_int_bits::utype; template struct llvm_value_t { static_assert(std::is_same::value, "llvm_value_t<> error: unknown type"); using type = void; using base = llvm_value_t; static constexpr uint esize = 0; static constexpr bool is_int = false; static constexpr bool is_sint = false; static constexpr bool is_uint = false; static constexpr bool is_float = false; static constexpr uint is_array = false; static constexpr uint is_vector = false; static constexpr uint is_pointer = false; static llvm::Type* get_type(llvm::LLVMContext& context) { return llvm::Type::getVoidTy(context); } llvm::Value* eval(llvm::IRBuilder<>*) const { return value; } std::tuple<> match(llvm::Value*& value, llvm::Module*) const { if (peek_through_bitcasts(value) != peek_through_bitcasts(this->value)) { value = nullptr; } return {}; } llvm::Value* value; // llvm_value_t() = default; // llvm_value_t(llvm::Value* value) // : value(value) // { // } }; template <> struct llvm_value_t : llvm_value_t { using type = bool; using base = llvm_value_t; using base::base; static constexpr uint esize = 1; static constexpr bool is_int = true; static llvm::Type* get_type(llvm::LLVMContext& context) { return llvm::Type::getInt1Ty(context); } }; template <> struct llvm_value_t : llvm_value_t { using type = i2; using base = llvm_value_t; using base::base; static constexpr uint esize = 2; static constexpr bool is_int = true; static llvm::Type* get_type(llvm::LLVMContext& context) { return llvm::Type::getIntNTy(context, 2); } }; template <> struct llvm_value_t : llvm_value_t { using type = i4; using base = llvm_value_t; using base::base; static constexpr uint esize = 4; static constexpr bool is_int = true; static llvm::Type* get_type(llvm::LLVMContext& context) { return llvm::Type::getIntNTy(context, 4); } }; template <> struct llvm_value_t : llvm_value_t { using type = char; using base = llvm_value_t; using base::base; static constexpr 
uint esize = 8; static constexpr bool is_int = true; static llvm::Type* get_type(llvm::LLVMContext& context) { return llvm::Type::getInt8Ty(context); } }; template <> struct llvm_value_t : llvm_value_t { using type = s8; using base = llvm_value_t; using base::base; static constexpr bool is_sint = true; }; template <> struct llvm_value_t : llvm_value_t { using type = u8; using base = llvm_value_t; using base::base; static constexpr bool is_uint = true; }; template <> struct llvm_value_t : llvm_value_t { using type = s16; using base = llvm_value_t; using base::base; static constexpr uint esize = 16; static llvm::Type* get_type(llvm::LLVMContext& context) { return llvm::Type::getInt16Ty(context); } }; template <> struct llvm_value_t : llvm_value_t { using type = u16; using base = llvm_value_t; using base::base; static constexpr bool is_sint = false; static constexpr bool is_uint = true; }; template <> struct llvm_value_t : llvm_value_t { using type = int; using base = llvm_value_t; using base::base; static constexpr uint esize = 32; static llvm::Type* get_type(llvm::LLVMContext& context) { return llvm::Type::getInt32Ty(context); } }; template <> struct llvm_value_t : llvm_value_t { using type = uint; using base = llvm_value_t; using base::base; static constexpr bool is_sint = false; static constexpr bool is_uint = true; }; template <> struct llvm_value_t : llvm_value_t { using type = long; using base = llvm_value_t; using base::base; static constexpr uint esize = 8 * sizeof(long); static llvm::Type* get_type(llvm::LLVMContext& context) { return llvm::Type::getInt64Ty(context); } }; template <> struct llvm_value_t : llvm_value_t { using type = ulong; using base = llvm_value_t; using base::base; static constexpr bool is_sint = false; static constexpr bool is_uint = true; }; template <> struct llvm_value_t : llvm_value_t { using type = llong; using base = llvm_value_t; using base::base; static constexpr uint esize = 64; static llvm::Type* get_type(llvm::LLVMContext& 
context) { return llvm::Type::getInt64Ty(context); } }; template <> struct llvm_value_t : llvm_value_t { using type = ullong; using base = llvm_value_t; using base::base; static constexpr bool is_sint = false; static constexpr bool is_uint = true; }; template <> struct llvm_value_t : llvm_value_t { using type = s128; using base = llvm_value_t; using base::base; static constexpr uint esize = 128; static llvm::Type* get_type(llvm::LLVMContext& context) { return llvm::Type::getIntNTy(context, 128); } }; template <> struct llvm_value_t : llvm_value_t { using type = u128; using base = llvm_value_t; using base::base; static constexpr bool is_sint = false; static constexpr bool is_uint = true; }; template <> struct llvm_value_t : llvm_value_t { using type = f32; using base = llvm_value_t; using base::base; static constexpr uint esize = 32; static constexpr bool is_float = true; static llvm::Type* get_type(llvm::LLVMContext& context) { return llvm::Type::getFloatTy(context); } }; template <> struct llvm_value_t : llvm_value_t { using type = f64; using base = llvm_value_t; using base::base; static constexpr uint esize = 64; static constexpr bool is_float = true; static llvm::Type* get_type(llvm::LLVMContext& context) { return llvm::Type::getDoubleTy(context); } }; template struct llvm_value_t : llvm_value_t { static_assert(!std::is_void::value, "llvm_value_t<> error: invalid pointer to void type"); using type = T*; using base = llvm_value_t; using base::base; static constexpr uint esize = 64; static constexpr bool is_int = false; static constexpr bool is_sint = false; static constexpr bool is_uint = false; static constexpr bool is_float = false; static constexpr uint is_array = false; static constexpr uint is_vector = false; static constexpr uint is_pointer = llvm_value_t::is_pointer + 1; static llvm::Type* get_type(llvm::LLVMContext& context) { return llvm_value_t::get_type(context)->getPointerTo(); } }; // u32[4] : vector of 4 u32 elements // u32[123][4] : array of 123 
u32[4] vectors // u32[123][1] : array of 123 u32 scalars template struct llvm_value_t : llvm_value_t > 1), T, std::remove_extent_t>> { using type = T[N]; using base = llvm_value_t > 1), T, std::remove_extent_t>>; using base::base; static constexpr uint esize = std::is_array_v ? 0 : base::esize; static constexpr bool is_int = !std::is_array_v && base::is_int; static constexpr bool is_sint = !std::is_array_v && base::is_sint; static constexpr bool is_uint = !std::is_array_v && base::is_uint; static constexpr bool is_float = !std::is_array_v && base::is_float; static constexpr uint is_array = std::is_array_v ? N : 0; static constexpr uint is_vector = std::is_array_v ? 0 : N; static constexpr uint is_pointer = 0; static llvm::Type* get_type(llvm::LLVMContext& context) { if constexpr (std::is_array_v) { return llvm::ArrayType::get(base::get_type(context), N); } else if constexpr (N > 1) { return llvm::VectorType::get(base::get_type(context), N, false); } else { return base::get_type(context); } } }; template using llvm_expr_t = std::decay_t; template struct is_llvm_expr { }; template struct is_llvm_expr().eval(std::declval*>()))>> { using type = typename std::decay_t::type; }; template struct is_llvm_expr_of { static constexpr bool ok = false; }; template struct is_llvm_expr_of::type, typename is_llvm_expr::type>> { static constexpr bool ok = std::is_same_v::type, typename is_llvm_expr::type>; }; template using llvm_common_t = std::enable_if_t<(is_llvm_expr_of::ok && ...), typename is_llvm_expr::type>; template using llvm_match_tuple = decltype(std::tuple_cat(std::declval&>().match(std::declval(), nullptr)...)); template >> struct llvm_match_t { using type = T; llvm::Value* value = nullptr; explicit operator bool() const { return value != nullptr; } template bool eq(const Args&... 
args) const { llvm::Value* lhs = nullptr; return value && (lhs = peek_through_bitcasts(value)) && ((lhs == peek_through_bitcasts(args.value)) && ...); } llvm::Value* eval(llvm::IRBuilder<>*) const { return value; } std::tuple<> match(llvm::Value*& value, llvm::Module*) const { if (peek_through_bitcasts(value) != peek_through_bitcasts(this->value)) { value = nullptr; } return {}; } }; template >> struct llvm_placeholder_t { // TODO: placeholder extracting actual constant values (u64, f64, vector, etc) using type = T; llvm::Value* eval(llvm::IRBuilder<>*) const { return nullptr; } std::tuple> match(llvm::Value*& value, llvm::Module*) const { if (value && value->getType() == llvm_value_t::get_type(value->getContext())) { return {{value}}; } value = nullptr; return {}; } }; template struct llvm_const_int { using type = T; u64 val; static constexpr bool is_ok = llvm_value_t::is_int; llvm::Value* eval(llvm::IRBuilder<>* ir) const { static_assert(llvm_value_t::is_int, "llvm_const_int<>: invalid type"); return llvm::ConstantInt::get(llvm_value_t::get_type(ir->getContext()), val, ForceSigned || llvm_value_t::is_sint); } std::tuple<> match(llvm::Value*& value, llvm::Module*) const { if (value && value == llvm::ConstantInt::get(llvm_value_t::get_type(value->getContext()), val, ForceSigned || llvm_value_t::is_sint)) { return {}; } value = nullptr; return {}; } }; template struct llvm_const_float { using type = T; f64 val; static constexpr bool is_ok = llvm_value_t::is_float; llvm::Value* eval(llvm::IRBuilder<>* ir) const { static_assert(llvm_value_t::is_float, "llvm_const_float<>: invalid type"); return llvm::ConstantFP::get(llvm_value_t::get_type(ir->getContext()), val); } std::tuple<> match(llvm::Value*& value, llvm::Module*) const { if (value && value == llvm::ConstantFP::get(llvm_value_t::get_type(value->getContext()), val)) { return {}; } value = nullptr; return {}; } }; template struct llvm_const_vector { using type = T; T data; static constexpr bool is_ok = N && 
llvm_value_t::is_vector == N; llvm::Value* eval(llvm::IRBuilder<>* ir) const { static_assert(N && llvm_value_t::is_vector == N, "llvm_const_vector<>: invalid type"); return llvm::ConstantDataVector::get(ir->getContext(), data); } std::tuple<> match(llvm::Value*& value, llvm::Module*) const { if (value && value == llvm::ConstantDataVector::get(value->getContext(), data)) { return {}; } value = nullptr; return {}; } }; template > struct llvm_add { using type = T; llvm_expr_t a1; llvm_expr_t a2; static_assert(llvm_value_t::is_sint || llvm_value_t::is_uint || llvm_value_t::is_float, "llvm_add<>: invalid type"); static constexpr auto opc = llvm_value_t::is_float ? llvm::Instruction::FAdd : llvm::Instruction::Add; llvm::Value* eval(llvm::IRBuilder<>* ir) const { const auto v1 = a1.eval(ir); const auto v2 = a2.eval(ir); return ir->CreateBinOp(opc, v1, v2); } llvm_match_tuple match(llvm::Value*& value, llvm::Module* _m) const { llvm::Value* v1 = {}; llvm::Value* v2 = {}; if (auto i = llvm::dyn_cast_or_null(value); i && i->getOpcode() == opc) { v1 = i->getOperand(0); v2 = i->getOperand(1); if (auto r1 = a1.match(v1, _m); v1) { if (auto r2 = a2.match(v2, _m); v2) { return std::tuple_cat(r1, r2); } } v1 = i->getOperand(0); v2 = i->getOperand(1); // Argument order does not matter here, try when swapped if (auto r1 = a1.match(v2, _m); v2) { if (auto r2 = a2.match(v1, _m); v1) { return std::tuple_cat(r1, r2); } } } value = nullptr; return {}; } }; template inline llvm_add operator +(T1&& a1, T2&& a2) { return {a1, a2}; } template inline llvm_add::type>> operator +(T1&& a1, u64 c) { return {a1, {c}}; } template > struct llvm_sum { using type = T; llvm_expr_t a1; llvm_expr_t a2; llvm_expr_t a3; static_assert(llvm_value_t::is_sint || llvm_value_t::is_uint, "llvm_sum<>: invalid_type"); llvm::Value* eval(llvm::IRBuilder<>* ir) const { const auto v1 = a1.eval(ir); const auto v2 = a2.eval(ir); const auto v3 = a3.eval(ir); return ir->CreateAdd(ir->CreateAdd(v1, v2), v3); } 
// Pattern-match `value` against the shape ((a1 + a2) + a3): an Add instruction whose
// operand 1 matches a3 and whose operand 0 is itself an Add with operands matching
// a1 and a2 (in that order; no operand reordering is attempted).
// On success returns the concatenated sub-match tuples (r1, r2, r3).
// On failure sets `value` to nullptr and returns a default-constructed tuple.
llvm_match_tuple match(llvm::Value*& value, llvm::Module* _m) const
{
    llvm::Value* v1 = {};
    llvm::Value* v2 = {};
    llvm::Value* v3 = {};

    if (auto i = llvm::dyn_cast_or_null(value); i && i->getOpcode() == llvm::Instruction::Add)
    {
        // Outer add: right-hand operand is the third term
        v3 = i->getOperand(1);

        if (auto r3 = a3.match(v3, _m); v3)
        {
            // Left-hand operand must be the inner add of the first two terms
            i = llvm::dyn_cast(i->getOperand(0));

            if (i && i->getOpcode() == llvm::Instruction::Add)
            {
                v1 = i->getOperand(0);
                v2 = i->getOperand(1);

                // Sub-matchers signal failure by nulling the pointer they were given
                if (auto r1 = a1.match(v1, _m); v1)
                {
                    if (auto r2 = a2.match(v2, _m); v2)
                    {
                        return std::tuple_cat(r1, r2, r3);
                    }
                }
            }
        }
    }

    value = nullptr;
    return {};
}
};

// Deduction guide: build an llvm_sum from three operand expressions.
template llvm_sum(T1&& a1, T2&& a2, T3&& a3) -> llvm_sum;

// Expression node for subtraction (a1 - a2).
// eval() emits the instruction; match() recognizes it in existing IR.
template > struct llvm_sub
{
    using type = T;

    // Left and right operand expressions
    llvm_expr_t a1;
    llvm_expr_t a2;

    static_assert(llvm_value_t::is_sint || llvm_value_t::is_uint || llvm_value_t::is_float, "llvm_sub<>: invalid type");

    // FSub for floating-point element types, Sub otherwise
    static constexpr auto opc = llvm_value_t::is_float ? llvm::Instruction::FSub : llvm::Instruction::Sub;

    // Evaluate both operands (a1 first) and emit a binary operation with opcode `opc`.
    llvm::Value* eval(llvm::IRBuilder<>* ir) const
    {
        const auto v1 = a1.eval(ir);
        const auto v2 = a2.eval(ir);
        return ir->CreateBinOp(opc, v1, v2);
    }

    // Match an instruction with opcode `opc` whose operand 0 matches a1 and operand 1
    // matches a2. Operands are not tried in swapped order.
    // On failure sets `value` to nullptr and returns a default-constructed tuple.
    llvm_match_tuple match(llvm::Value*& value, llvm::Module* _m) const
    {
        llvm::Value* v1 = {};
        llvm::Value* v2 = {};

        if (auto i = llvm::dyn_cast_or_null(value); i && i->getOpcode() == opc)
        {
            v1 = i->getOperand(0);
            v2 = i->getOperand(1);

            if (auto r1 = a1.match(v1, _m); v1)
            {
                if (auto r2 = a2.match(v2, _m); v2)
                {
                    return std::tuple_cat(r1, r2);
                }
            }
        }

        value = nullptr;
        return {};
    }
};

// expr - expr
template inline llvm_sub operator -(T1&& a1, T2&& a2)
{
    return {a1, a2};
}

// expr - constant: the u64 is wrapped into a constant node as the right operand
template inline llvm_sub::type>> operator -(T1&& a1, u64 c)
{
    return {a1, {c}};
}

// constant - expr: the u64 is wrapped into a constant node as the left operand
template inline llvm_sub::type>, T1> operator -(u64 c, T1&& a1)
{
    return {{c}, a1};
}

// Expression node for multiplication (a1 * a2).
template > struct llvm_mul
{
    using type = T;

    // Left and right operand expressions
    llvm_expr_t a1;
    llvm_expr_t a2;

    static_assert(llvm_value_t::is_sint || llvm_value_t::is_uint || llvm_value_t::is_float, "llvm_mul<>: invalid type");

    static constexpr auto opc = llvm_value_t::is_float ?
llvm::Instruction::FMul : llvm::Instruction::Mul; llvm::Value* eval(llvm::IRBuilder<>* ir) const { const auto v1 = a1.eval(ir); const auto v2 = a2.eval(ir); return ir->CreateBinOp(opc, v1, v2); } llvm_match_tuple match(llvm::Value*& value, llvm::Module* _m) const { llvm::Value* v1 = {}; llvm::Value* v2 = {}; if (auto i = llvm::dyn_cast_or_null(value); i && i->getOpcode() == opc) { v1 = i->getOperand(0); v2 = i->getOperand(1); if (auto r1 = a1.match(v1, _m); v1) { if (auto r2 = a2.match(v2, _m); v2) { return std::tuple_cat(r1, r2); } } v1 = i->getOperand(0); v2 = i->getOperand(1); // Argument order does not matter here, try when swapped if (auto r1 = a1.match(v2, _m); v2) { if (auto r2 = a2.match(v1, _m); v1) { return std::tuple_cat(r1, r2); } } } value = nullptr; return {}; } }; template inline llvm_mul operator *(T1&& a1, T2&& a2) { return {a1, a2}; } template > struct llvm_div { using type = T; llvm_expr_t a1; llvm_expr_t a2; static_assert(llvm_value_t::is_sint || llvm_value_t::is_uint || llvm_value_t::is_float, "llvm_div<>: invalid type"); static constexpr auto opc = llvm_value_t::is_float ? llvm::Instruction::FDiv : llvm_value_t::is_uint ? 
llvm::Instruction::UDiv : llvm::Instruction::SDiv; llvm::Value* eval(llvm::IRBuilder<>* ir) const { const auto v1 = a1.eval(ir); const auto v2 = a2.eval(ir); return ir->CreateBinOp(opc, v1, v2); } llvm_match_tuple match(llvm::Value*& value, llvm::Module* _m) const { llvm::Value* v1 = {}; llvm::Value* v2 = {}; if (auto i = llvm::dyn_cast_or_null(value); i && i->getOpcode() == opc) { v1 = i->getOperand(0); v2 = i->getOperand(1); if (auto r1 = a1.match(v1, _m); v1) { if (auto r2 = a2.match(v2, _m); v2) { return std::tuple_cat(r1, r2); } } } value = nullptr; return {}; } }; template inline llvm_div operator /(T1&& a1, T2&& a2) { return {a1, a2}; } inline llvm::Constant* getZeroValueForNegation(llvm::Type* Ty) { if (Ty->isFPOrFPVectorTy()) return llvm::ConstantFP::getNegativeZero(Ty); return llvm::Constant::getNullValue(Ty); } template > struct llvm_neg { using type = T; llvm_expr_t a1; static_assert(llvm_value_t::is_sint || llvm_value_t::is_uint || llvm_value_t::is_float, "llvm_neg<>: invalid type"); static constexpr int opc = llvm_value_t::is_float ? +llvm::Instruction::FNeg : +llvm::Instruction::Sub; llvm::Value* eval(llvm::IRBuilder<>* ir) const { const auto v1 = a1.eval(ir); if constexpr (llvm_value_t::is_int) { return ir->CreateNeg(v1); } if constexpr (llvm_value_t::is_float) { return ir->CreateFNeg(v1); } // TODO: return value ? 
}

// Pattern-match a negation of a1.
// For floating-point element types, an instruction with opcode `opc` is accepted first
// and its operand 0 is matched against a1.
// The second form accepts an instruction with opcode `opc` whose operand 0 equals the
// zero value returned by getZeroValueForNegation() for operand 1's type (the "0 - x"
// shape); operand 1 is then matched against a1.
// On failure sets `value` to nullptr and returns a default-constructed tuple.
llvm_match_tuple match(llvm::Value*& value, llvm::Module* _m) const
{
    llvm::Value* v1 = {};

    if constexpr (llvm_value_t::is_float)
    {
        if (auto i = llvm::dyn_cast_or_null(value); i && i->getOpcode() == opc)
        {
            v1 = i->getOperand(0);

            if (auto r1 = a1.match(v1, _m); v1)
            {
                return r1;
            }
        }
    }

    if (auto i = llvm::dyn_cast_or_null(value); i && i->getOpcode() == opc)
    {
        v1 = i->getOperand(1);

        // Only a subtraction from the type's negation-zero counts as a negation
        if (i->getOperand(0) == getZeroValueForNegation(v1->getType()))
        {
            if (auto r1 = a1.match(v1, _m); v1)
            {
                return r1;
            }
        }
    }

    value = nullptr;
    return {};
}
};

// Unary minus: wraps the operand (taken by value) in an llvm_neg node.
template inline llvm_neg operator -(T1 a1)
{
    return {a1};
}

// Expression node for left shift (a1 << a2). Restricted to signed/unsigned integer types.
template > struct llvm_shl
{
    using type = T;

    // Value being shifted and shift amount
    llvm_expr_t a1;
    llvm_expr_t a2;

    static_assert(llvm_value_t::is_sint || llvm_value_t::is_uint, "llvm_shl<>: invalid type");

    // Evaluate both operands (a1 first) and emit a Shl instruction.
    llvm::Value* eval(llvm::IRBuilder<>* ir) const
    {
        const auto v1 = a1.eval(ir);
        const auto v2 = a2.eval(ir);
        return ir->CreateShl(v1, v2);
    }

    // Match a Shl instruction whose operand 0 matches a1 and operand 1 matches a2.
    // On failure sets `value` to nullptr and returns a default-constructed tuple.
    llvm_match_tuple match(llvm::Value*& value, llvm::Module* _m) const
    {
        llvm::Value* v1 = {};
        llvm::Value* v2 = {};

        if (auto i = llvm::dyn_cast_or_null(value); i && i->getOpcode() == llvm::Instruction::Shl)
        {
            v1 = i->getOperand(0);
            v2 = i->getOperand(1);

            if (auto r1 = a1.match(v1, _m); v1)
            {
                if (auto r2 = a2.match(v2, _m); v2)
                {
                    return std::tuple_cat(r1, r2);
                }
            }
        }

        value = nullptr;
        return {};
    }
};

// expr << expr
template inline llvm_shl operator <<(T1&& a1, T2&& a2)
{
    return {a1, a2};
}

// expr << constant: the u64 is wrapped into a constant node as the shift amount
template inline llvm_shl::type>> operator <<(T1&& a1, u64 c)
{
    return {a1, {c}};
}

// Expression node for right shift (a1 >> a2). Restricted to signed/unsigned integer types.
template > struct llvm_shr
{
    using type = T;

    // Value being shifted and shift amount
    llvm_expr_t a1;
    llvm_expr_t a2;

    static_assert(llvm_value_t::is_sint || llvm_value_t::is_uint, "llvm_shr<>: invalid type");

    static constexpr auto opc = llvm_value_t::is_uint ?
llvm::Instruction::LShr : llvm::Instruction::AShr; llvm::Value* eval(llvm::IRBuilder<>* ir) const { const auto v1 = a1.eval(ir); const auto v2 = a2.eval(ir); return ir->CreateBinOp(opc, v1, v2); } llvm_match_tuple match(llvm::Value*& value, llvm::Module* _m) const { llvm::Value* v1 = {}; llvm::Value* v2 = {}; if (auto i = llvm::dyn_cast_or_null(value); i && i->getOpcode() == opc) { v1 = i->getOperand(0); v2 = i->getOperand(1); if (auto r1 = a1.match(v1, _m); v1) { if (auto r2 = a2.match(v2, _m); v2) { return std::tuple_cat(r1, r2); } } } value = nullptr; return {}; } }; template inline llvm_shr operator >>(T1&& a1, T2&& a2) { return {a1, a2}; } template inline llvm_shr::type>> operator >>(T1&& a1, u64 c) { return {a1, {c}}; } template > struct llvm_fshl { using type = T; llvm_expr_t a1; llvm_expr_t a2; llvm_expr_t a3; static_assert(llvm_value_t::is_sint || llvm_value_t::is_uint, "llvm_fshl<>: invalid type"); static constexpr bool is_ok = llvm_value_t::is_sint || llvm_value_t::is_uint; static llvm::Function* get_fshl(llvm::IRBuilder<>* ir) { const auto _module = ir->GetInsertBlock()->getParent()->getParent(); return llvm::Intrinsic::getDeclaration(_module, llvm::Intrinsic::fshl, {llvm_value_t::get_type(ir->getContext())}); } static llvm::Value* fold(llvm::IRBuilder<>* ir, llvm::Value* v1, llvm::Value* v2, llvm::Value* v3) { // Compute constant result. 
const u64 size = v3->getType()->getScalarSizeInBits(); const auto val = ir->CreateURem(v3, llvm::ConstantInt::get(v3->getType(), size)); const auto shl = ir->CreateShl(v1, val); const auto shr = ir->CreateLShr(v2, ir->CreateSub(llvm::ConstantInt::get(v3->getType(), size - 1), val)); return ir->CreateOr(shl, ir->CreateLShr(shr, 1)); } llvm::Value* eval(llvm::IRBuilder<>* ir) const { const auto v1 = a1.eval(ir); const auto v2 = a2.eval(ir); const auto v3 = a3.eval(ir); if (llvm::isa(v1) && llvm::isa(v2) && llvm::isa(v3)) { return fold(ir, v1, v2, v3); } return ir->CreateCall(get_fshl(ir), {v1, v2, v3}); } llvm_match_tuple match(llvm::Value*& value, llvm::Module* _m) const { llvm::Value* v1 = {}; llvm::Value* v2 = {}; llvm::Value* v3 = {}; if (auto i = llvm::dyn_cast_or_null(value); i && i->getIntrinsicID() == llvm::Intrinsic::fshl) { v1 = i->getOperand(0); v2 = i->getOperand(1); v3 = i->getOperand(2); if (auto r1 = a1.match(v1, _m); v1) { if (auto r2 = a2.match(v2, _m); v2) { if (auto r3 = a3.match(v3, _m); v3) { return std::tuple_cat(r1, r2, r3); } } } } value = nullptr; return {}; } }; template > struct llvm_fshr { using type = T; llvm_expr_t a1; llvm_expr_t a2; llvm_expr_t a3; static_assert(llvm_value_t::is_sint || llvm_value_t::is_uint, "llvm_fshr<>: invalid type"); static constexpr bool is_ok = llvm_value_t::is_sint || llvm_value_t::is_uint; static llvm::Function* get_fshr(llvm::IRBuilder<>* ir) { const auto _module = ir->GetInsertBlock()->getParent()->getParent(); return llvm::Intrinsic::getDeclaration(_module, llvm::Intrinsic::fshr, {llvm_value_t::get_type(ir->getContext())}); } static llvm::Value* fold(llvm::IRBuilder<>* ir, llvm::Value* v1, llvm::Value* v2, llvm::Value* v3) { // Compute constant result. 
// Element width in bits of the shift-amount type
const u64 size = v3->getType()->getScalarSizeInBits();

// Shift amount reduced modulo the element width
const auto val = ir->CreateURem(v3, llvm::ConstantInt::get(v3->getType(), size));

// Low part: v2 shifted right by the reduced amount
const auto shr = ir->CreateLShr(v2, val);

// High part: v1 shifted left by (size - val), performed as (size - 1 - val) followed by
// one more bit -- presumably so that no single shift uses the full width when val == 0
const auto shl = ir->CreateShl(v1, ir->CreateSub(llvm::ConstantInt::get(v3->getType(), size - 1), val));
return ir->CreateOr(shr, ir->CreateShl(shl, 1));
}

// Evaluate the three operands (a1, a2, a3 in order). If all three pass the isa<> check,
// the result is expanded through fold(); otherwise a call to the fshr intrinsic
// declaration obtained from get_fshr() is emitted.
llvm::Value* eval(llvm::IRBuilder<>* ir) const
{
    const auto v1 = a1.eval(ir);
    const auto v2 = a2.eval(ir);
    const auto v3 = a3.eval(ir);

    if (llvm::isa(v1) && llvm::isa(v2) && llvm::isa(v3))
    {
        return fold(ir, v1, v2, v3);
    }

    return ir->CreateCall(get_fshr(ir), {v1, v2, v3});
}

// Match a call whose intrinsic ID is llvm::Intrinsic::fshr and whose operands 0, 1, 2
// match a1, a2, a3 respectively.
// On failure sets `value` to nullptr and returns a default-constructed tuple.
llvm_match_tuple match(llvm::Value*& value, llvm::Module* _m) const
{
    llvm::Value* v1 = {};
    llvm::Value* v2 = {};
    llvm::Value* v3 = {};

    if (auto i = llvm::dyn_cast_or_null(value); i && i->getIntrinsicID() == llvm::Intrinsic::fshr)
    {
        v1 = i->getOperand(0);
        v2 = i->getOperand(1);
        v3 = i->getOperand(2);

        if (auto r1 = a1.match(v1, _m); v1)
        {
            if (auto r2 = a2.match(v2, _m); v2)
            {
                if (auto r3 = a3.match(v3, _m); v3)
                {
                    return std::tuple_cat(r1, r2, r3);
                }
            }
        }
    }

    value = nullptr;
    return {};
}
};

// Expression node for rotate-left of a1 by a2, expressed through the fshl funnel shift
// with a1 supplied as both funnel inputs. Restricted to signed/unsigned integer types.
template > struct llvm_rol
{
    using type = T;

    // Value being rotated and rotation amount
    llvm_expr_t a1;
    llvm_expr_t a2;

    static_assert(llvm_value_t::is_sint || llvm_value_t::is_uint, "llvm_rol<>: invalid type");

    // Same condition as the static_assert above, exposed as a constant
    static constexpr bool is_ok = llvm_value_t::is_sint || llvm_value_t::is_uint;

    // Evaluate both operands. If both pass the isa<> check, expand via llvm_fshl's
    // fold(); otherwise emit a call to the fshl intrinsic with operands (v1, v1, v2).
    llvm::Value* eval(llvm::IRBuilder<>* ir) const
    {
        const auto v1 = a1.eval(ir);
        const auto v2 = a2.eval(ir);

        if (llvm::isa(v1) && llvm::isa(v2))
        {
            return llvm_fshl::fold(ir, v1, v1, v2);
        }

        return ir->CreateCall(llvm_fshl::get_fshl(ir), {v1, v1, v2});
    }

    // Match a call whose intrinsic ID is llvm::Intrinsic::fshl and whose operands 0 and 1
    // are the same value; operand 0 is matched against a1 and operand 2 against a2.
    llvm_match_tuple match(llvm::Value*& value, llvm::Module* _m) const
    {
        llvm::Value* v1 = {};
        llvm::Value* v2 = {};

        if (auto i = llvm::dyn_cast_or_null(value); i && i->getIntrinsicID() == llvm::Intrinsic::fshl)
        {
            v1 = i->getOperand(0);
            v2 = i->getOperand(2);

            // A rotate feeds the same value into both funnel inputs
            if (i->getOperand(1) == v1)
            {
                if (auto r1 = a1.match(v1, _m); v1)
                {
                    if (auto r2 = a2.match(v2, _m); v2)
                    {
                        return std::tuple_cat(r1, r2);
                    }
                }
            }
}

// No match: report failure through the in/out pointer
value = nullptr;
return {};
}
};

// Expression node for bitwise AND (a1 & a2). Restricted to integer element types.
template > struct llvm_and
{
    using type = T;

    // Left and right operand expressions
    llvm_expr_t a1;
    llvm_expr_t a2;

    static_assert(llvm_value_t::is_int, "llvm_and<>: invalid type");

    // Evaluate both operands (a1 first) and emit an And instruction.
    llvm::Value* eval(llvm::IRBuilder<>* ir) const
    {
        const auto v1 = a1.eval(ir);
        const auto v2 = a2.eval(ir);
        return ir->CreateAnd(v1, v2);
    }

    // Match an And instruction whose operand 0 matches a1 and operand 1 matches a2.
    // NOTE(review): unlike the llvm_add / llvm_mul matchers in this file, the swapped
    // operand order is not tried here -- confirm whether that is intentional.
    // On failure sets `value` to nullptr and returns a default-constructed tuple.
    llvm_match_tuple match(llvm::Value*& value, llvm::Module* _m) const
    {
        llvm::Value* v1 = {};
        llvm::Value* v2 = {};

        if (auto i = llvm::dyn_cast_or_null(value); i && i->getOpcode() == llvm::Instruction::And)
        {
            v1 = i->getOperand(0);
            v2 = i->getOperand(1);

            if (auto r1 = a1.match(v1, _m); v1)
            {
                if (auto r2 = a2.match(v2, _m); v2)
                {
                    return std::tuple_cat(r1, r2);
                }
            }
        }

        value = nullptr;
        return {};
    }
};

// expr & expr
template inline llvm_and operator &(T1&& a1, T2&& a2)
{
    return {a1, a2};
}

// expr & constant: the u64 is wrapped into a constant node as the right operand
template inline llvm_and::type>> operator &(T1&& a1, u64 c)
{
    return {a1, {c}};
}

// Expression node for bitwise OR (a1 | a2). Restricted to integer element types.
template > struct llvm_or
{
    using type = T;

    // Left and right operand expressions
    llvm_expr_t a1;
    llvm_expr_t a2;

    static_assert(llvm_value_t::is_int, "llvm_or<>: invalid type");

    // Evaluate both operands (a1 first) and emit an Or instruction.
    llvm::Value* eval(llvm::IRBuilder<>* ir) const
    {
        const auto v1 = a1.eval(ir);
        const auto v2 = a2.eval(ir);
        return ir->CreateOr(v1, v2);
    }

    // Match an Or instruction whose operand 0 matches a1 and operand 1 matches a2
    // (the swapped order is not tried).
    // On failure sets `value` to nullptr and returns a default-constructed tuple.
    llvm_match_tuple match(llvm::Value*& value, llvm::Module* _m) const
    {
        llvm::Value* v1 = {};
        llvm::Value* v2 = {};

        if (auto i = llvm::dyn_cast_or_null(value); i && i->getOpcode() == llvm::Instruction::Or)
        {
            v1 = i->getOperand(0);
            v2 = i->getOperand(1);

            if (auto r1 = a1.match(v1, _m); v1)
            {
                if (auto r2 = a2.match(v2, _m); v2)
                {
                    return std::tuple_cat(r1, r2);
                }
            }
        }

        value = nullptr;
        return {};
    }
};

// expr | expr
template inline llvm_or operator |(T1&& a1, T2&& a2)
{
    return {a1, a2};
}

// expr | constant: the u64 is wrapped into a constant node as the right operand
template inline llvm_or::type>> operator |(T1&& a1, u64 c)
{
    return {a1, {c}};
}

// Expression node for bitwise XOR (a1 ^ a2). Restricted to integer element types.
template > struct llvm_xor
{
    using type = T;

    // Left and right operand expressions
    llvm_expr_t a1;
    llvm_expr_t a2;

    static_assert(llvm_value_t::is_int, "llvm_xor<>: invalid type");

    // Evaluate both operands (a1 first) and emit a Xor instruction.
    llvm::Value* eval(llvm::IRBuilder<>* ir) const
    {
        const auto v1 = a1.eval(ir);
        const auto v2 = a2.eval(ir);
        return ir->CreateXor(v1, v2);
    }
llvm_match_tuple match(llvm::Value*& value, llvm::Module* _m) const { llvm::Value* v1 = {}; llvm::Value* v2 = {}; if (auto i = llvm::dyn_cast_or_null(value); i && i->getOpcode() == llvm::Instruction::Xor) { v1 = i->getOperand(0); v2 = i->getOperand(1); if (auto r1 = a1.match(v1, _m); v1) { if (auto r2 = a2.match(v2, _m); v2) { return std::tuple_cat(r1, r2); } } } value = nullptr; return {}; } }; template inline llvm_xor operator ^(T1&& a1, T2&& a2) { return {a1, a2}; } template inline llvm_xor::type>> operator ^(T1&& a1, u64 c) { return {a1, {c}}; } template inline llvm_xor::type, true>> operator ~(T1&& a1) { return {a1, {u64{umax}}}; } template > struct llvm_cmp { using type = std::conditional_t::is_vector != 0, bool[llvm_value_t::is_vector], bool>; static constexpr bool is_float = llvm_value_t::is_float; llvm_expr_t a1; llvm_expr_t a2; static_assert(llvm_value_t::is_int || is_float, "llvm_cmp<>: invalid type"); // Convert unsigned comparison predicate to signed if necessary static constexpr llvm::CmpInst::Predicate pred = llvm_value_t::is_uint ? UPred : UPred == llvm::ICmpInst::ICMP_UGT ? llvm::ICmpInst::ICMP_SGT : UPred == llvm::ICmpInst::ICMP_UGE ? llvm::ICmpInst::ICMP_SGE : UPred == llvm::ICmpInst::ICMP_ULT ? llvm::ICmpInst::ICMP_SLT : UPred == llvm::ICmpInst::ICMP_ULE ? 
llvm::ICmpInst::ICMP_SLE : UPred; static_assert(llvm_value_t::is_sint || llvm_value_t::is_uint || is_float || UPred == llvm::ICmpInst::ICMP_EQ || UPred == llvm::ICmpInst::ICMP_NE, "llvm_cmp<>: invalid operation on sign-undefined type"); llvm::Value* eval(llvm::IRBuilder<>* ir) const { static_assert(!is_float, "llvm_cmp<>: invalid operation (missing fcmp_ord or fcmp_uno)"); const auto v1 = a1.eval(ir); const auto v2 = a2.eval(ir); return ir->CreateICmp(pred, v1, v2); } llvm_match_tuple match(llvm::Value*& value, llvm::Module* _m) const { llvm::Value* v1 = {}; llvm::Value* v2 = {}; if (auto i = llvm::dyn_cast_or_null(value); i && i->getPredicate() == pred) { v1 = i->getOperand(0); v2 = i->getOperand(1); if (auto r1 = a1.match(v1, _m); v1) { if (auto r2 = a2.match(v2, _m); v2) { return std::tuple_cat(r1, r2); } } } value = nullptr; return {}; } }; template struct is_llvm_cmp : std::bool_constant { }; template struct is_llvm_cmp> : std::bool_constant { }; template > struct llvm_ord { using base = std::decay_t; using type = typename base::type; llvm_expr_t cmp; // Convert comparison predicate to ordered static constexpr llvm::CmpInst::Predicate pred = base::pred == llvm::ICmpInst::ICMP_EQ ? llvm::ICmpInst::FCMP_OEQ : base::pred == llvm::ICmpInst::ICMP_NE ? llvm::ICmpInst::FCMP_ONE : base::pred == llvm::ICmpInst::ICMP_SGT ? llvm::ICmpInst::FCMP_OGT : base::pred == llvm::ICmpInst::ICMP_SGE ? llvm::ICmpInst::FCMP_OGE : base::pred == llvm::ICmpInst::ICMP_SLT ? llvm::ICmpInst::FCMP_OLT : base::pred == llvm::ICmpInst::ICMP_SLE ? 
llvm::ICmpInst::FCMP_OLE : base::pred; static_assert(base::is_float, "llvm_ord<>: invalid type"); llvm::Value* eval(llvm::IRBuilder<>* ir) const { const auto v1 = cmp.a1.eval(ir); const auto v2 = cmp.a2.eval(ir); return ir->CreateFCmp(pred, v1, v2); } llvm_match_tuple match(llvm::Value*& value, llvm::Module* _m) const { llvm::Value* v1 = {}; llvm::Value* v2 = {}; if (auto i = llvm::dyn_cast_or_null(value); i && i->getPredicate() == pred) { v1 = i->getOperand(0); v2 = i->getOperand(1); if (auto r1 = cmp.a1.match(v1, _m); v1) { if (auto r2 = cmp.a2.match(v2, _m); v2) { return std::tuple_cat(r1, r2); } } } value = nullptr; return {}; } }; template llvm_ord(T&&) -> llvm_ord>::value, T&&>>; template > struct llvm_uno { using base = std::decay_t; using type = typename base::type; llvm_expr_t cmp; // Convert comparison predicate to unordered static constexpr llvm::CmpInst::Predicate pred = base::pred == llvm::ICmpInst::ICMP_EQ ? llvm::ICmpInst::FCMP_UEQ : base::pred == llvm::ICmpInst::ICMP_NE ? llvm::ICmpInst::FCMP_UNE : base::pred == llvm::ICmpInst::ICMP_SGT ? llvm::ICmpInst::FCMP_UGT : base::pred == llvm::ICmpInst::ICMP_SGE ? llvm::ICmpInst::FCMP_UGE : base::pred == llvm::ICmpInst::ICMP_SLT ? llvm::ICmpInst::FCMP_ULT : base::pred == llvm::ICmpInst::ICMP_SLE ? 
llvm::ICmpInst::FCMP_ULE : base::pred; static_assert(base::is_float, "llvm_uno<>: invalid type"); llvm::Value* eval(llvm::IRBuilder<>* ir) const { const auto v1 = cmp.a1.eval(ir); const auto v2 = cmp.a2.eval(ir); return ir->CreateFCmp(pred, v1, v2); } llvm_match_tuple match(llvm::Value*& value, llvm::Module* _m) const { llvm::Value* v1 = {}; llvm::Value* v2 = {}; if (auto i = llvm::dyn_cast_or_null(value); i && i->getPredicate() == pred) { v1 = i->getOperand(0); v2 = i->getOperand(1); if (auto r1 = cmp.a1.match(v1, _m); v1) { if (auto r2 = cmp.a2.match(v2, _m); v2) { return std::tuple_cat(r1, r2); } } } value = nullptr; return {}; } }; template llvm_uno(T&&) -> llvm_uno>::value, T&&>>; template inline llvm_cmp operator ==(T1&& a1, T2&& a2) { return {a1, a2}; } template inline llvm_cmp::type>, llvm::ICmpInst::ICMP_EQ> operator ==(T1&& a1, u64 c) { return {a1, {c}}; } template inline llvm_cmp operator !=(T1&& a1, T2&& a2) { return {a1, a2}; } template inline llvm_cmp::type>, llvm::ICmpInst::ICMP_NE> operator !=(T1&& a1, u64 c) { return {a1, {c}}; } template inline llvm_cmp operator >(T1&& a1, T2&& a2) { return {a1, a2}; } template inline llvm_cmp::type>, llvm::ICmpInst::ICMP_UGT> operator >(T1&& a1, u64 c) { return {a1, {c}}; } template inline llvm_cmp operator >=(T1&& a1, T2&& a2) { return {a1, a2}; } template inline llvm_cmp::type>, llvm::ICmpInst::ICMP_UGE> operator >=(T1&& a1, u64 c) { return {a1, {c}}; } template inline llvm_cmp operator <(T1&& a1, T2&& a2) { return {a1, a2}; } template inline llvm_cmp::type>, llvm::ICmpInst::ICMP_ULT> operator <(T1&& a1, u64 c) { return {a1, {c}}; } template inline llvm_cmp operator <=(T1&& a1, T2&& a2) { return {a1, a2}; } template inline llvm_cmp::type>, llvm::ICmpInst::ICMP_ULE> operator <=(T1&& a1, u64 c) { return {a1, {c}}; } template > struct llvm_noncast { using type = U; llvm_expr_t a1; static_assert(llvm_value_t::is_int, "llvm_noncast<>: invalid type"); static_assert(llvm_value_t::is_int, "llvm_noncast<>: invalid 
result type"); static_assert(llvm_value_t::esize == llvm_value_t::esize, "llvm_noncast<>: result is resized"); static_assert(llvm_value_t::is_vector == llvm_value_t::is_vector, "llvm_noncast<>: vector element mismatch"); static constexpr bool is_ok = llvm_value_t::is_int && llvm_value_t::is_int && llvm_value_t::esize == llvm_value_t::esize && llvm_value_t::is_vector == llvm_value_t::is_vector; llvm::Value* eval(llvm::IRBuilder<>* ir) const { // No operation required return a1.eval(ir); } llvm_match_tuple match(llvm::Value*& value, llvm::Module* _m) const { if (value) { if (auto r1 = a1.match(value, _m); value) { return r1; } } value = nullptr; return {}; } }; template > struct llvm_bitcast { using type = U; llvm_expr_t a1; llvm::Module* _module; static constexpr uint bitsize0 = llvm_value_t::is_vector ? llvm_value_t::is_vector * llvm_value_t::esize : llvm_value_t::esize; static constexpr uint bitsize1 = llvm_value_t::is_vector ? llvm_value_t::is_vector * llvm_value_t::esize : llvm_value_t::esize; static_assert(bitsize0 == bitsize1, "llvm_bitcast<>: invalid type (size mismatch)"); static_assert(llvm_value_t::is_int || llvm_value_t::is_float, "llvm_bitcast<>: invalid type"); static_assert(llvm_value_t::is_int || llvm_value_t::is_float, "llvm_bitcast<>: invalid result type"); static constexpr bool is_ok = bitsize0 && bitsize0 == bitsize1 && (llvm_value_t::is_int || llvm_value_t::is_float) && (llvm_value_t::is_int || llvm_value_t::is_float); llvm::Value* eval(llvm::IRBuilder<>* ir) const { const auto v1 = a1.eval(ir); const auto rt = llvm_value_t::get_type(ir->getContext()); if constexpr (llvm_value_t::is_int == llvm_value_t::is_int && llvm_value_t::is_vector == llvm_value_t::is_vector) { return v1; } if (const auto c1 = llvm::dyn_cast(v1)) { const auto result = llvm::ConstantFoldCastOperand(llvm::Instruction::BitCast, c1, rt, ir->GetInsertBlock()->getParent()->getParent()->getDataLayout()); if (result) { return result; } } return ir->CreateBitCast(v1, rt); } 
llvm_match_tuple match(llvm::Value*& value, llvm::Module* _m) const { if constexpr (llvm_value_t::is_int == llvm_value_t::is_int && llvm_value_t::is_vector == llvm_value_t::is_vector) { if (value) { if (auto r1 = a1.match(value, _m); value) { return r1; } } return {}; } llvm::Value* v1 = {}; if (auto i = llvm::dyn_cast_or_null