mirror of
https://git.wownero.com/wownero/RandomWOW.git
synced 2024-08-15 00:23:14 +00:00
Use strongly typed enums (#55)
This commit is contained in:
parent
52aa36249e
commit
447634f51d
7 changed files with 94 additions and 83 deletions
|
@ -67,10 +67,12 @@ namespace randomx {
|
|||
|
||||
void AssemblyGeneratorX86::generateAsm(SuperscalarProgram& prog) {
|
||||
asmCode.str(std::string()); //clear
|
||||
#ifdef RANDOMX_ALIGN
|
||||
asmCode << "ALIGN 16" << std::endl;
|
||||
#endif
|
||||
for (unsigned i = 0; i < prog.getSize(); ++i) {
|
||||
Instruction& instr = prog(i);
|
||||
switch (instr.opcode)
|
||||
switch ((SuperscalarInstructionType)instr.opcode)
|
||||
{
|
||||
case SuperscalarInstructionType::ISUB_R:
|
||||
asmCode << "sub " << regR[instr.dst] << ", " << regR[instr.src] << std::endl;
|
||||
|
@ -95,19 +97,27 @@ namespace randomx {
|
|||
break;
|
||||
case SuperscalarInstructionType::IADD_C8:
|
||||
asmCode << "add " << regR[instr.dst] << ", " << (int32_t)instr.getImm32() << std::endl;
|
||||
#ifdef RANDOMX_ALIGN
|
||||
asmCode << "nop" << std::endl;
|
||||
#endif
|
||||
break;
|
||||
case SuperscalarInstructionType::IXOR_C8:
|
||||
asmCode << "xor " << regR[instr.dst] << ", " << (int32_t)instr.getImm32() << std::endl;
|
||||
#ifdef RANDOMX_ALIGN
|
||||
asmCode << "nop" << std::endl;
|
||||
#endif
|
||||
break;
|
||||
case SuperscalarInstructionType::IADD_C9:
|
||||
asmCode << "add " << regR[instr.dst] << ", " << (int32_t)instr.getImm32() << std::endl;
|
||||
#ifdef RANDOMX_ALIGN
|
||||
asmCode << "xchg ax, ax ;nop" << std::endl;
|
||||
#endif
|
||||
break;
|
||||
case SuperscalarInstructionType::IXOR_C9:
|
||||
asmCode << "xor " << regR[instr.dst] << ", " << (int32_t)instr.getImm32() << std::endl;
|
||||
#ifdef RANDOMX_ALIGN
|
||||
asmCode << "xchg ax, ax ;nop" << std::endl;
|
||||
#endif
|
||||
break;
|
||||
case SuperscalarInstructionType::IMULH_R:
|
||||
asmCode << "mov rax, " << regR[instr.dst] << std::endl;
|
||||
|
@ -179,7 +189,7 @@ namespace randomx {
|
|||
asmCode << "uint64_t r8 = r[0], r9 = r[1], r10 = r[2], r11 = r[3], r12 = r[4], r13 = r[5], r14 = r[6], r15 = r[7];" << std::endl;
|
||||
for (unsigned i = 0; i < prog.getSize(); ++i) {
|
||||
Instruction& instr = prog(i);
|
||||
switch (instr.opcode)
|
||||
switch ((SuperscalarInstructionType)instr.opcode)
|
||||
{
|
||||
case SuperscalarInstructionType::ISUB_R:
|
||||
asmCode << regR[instr.dst] << " -= " << regR[instr.src] << ";" << std::endl;
|
||||
|
|
|
@ -125,7 +125,7 @@ namespace randomx {
|
|||
randomx::generateSuperscalar(cache->programs[i], gen);
|
||||
for (unsigned j = 0; j < cache->programs[i].getSize(); ++j) {
|
||||
auto& instr = cache->programs[i](j);
|
||||
if (instr.opcode == randomx::SuperscalarInstructionType::IMUL_RCP) {
|
||||
if ((SuperscalarInstructionType)instr.opcode == SuperscalarInstructionType::IMUL_RCP) {
|
||||
auto rcp = randomx_reciprocal(instr.getImm32());
|
||||
instr.setImm32(cache->reciprocalCache.size());
|
||||
cache->reciprocalCache.push_back(rcp);
|
||||
|
|
|
@ -39,38 +39,38 @@ namespace randomx {
|
|||
|
||||
typedef void(Instruction::*InstructionFormatter)(std::ostream&) const;
|
||||
|
||||
namespace InstructionType {
|
||||
constexpr int IADD_RS = 0;
|
||||
constexpr int IADD_M = 1;
|
||||
constexpr int ISUB_R = 2;
|
||||
constexpr int ISUB_M = 3;
|
||||
constexpr int IMUL_R = 4;
|
||||
constexpr int IMUL_M = 5;
|
||||
constexpr int IMULH_R = 6;
|
||||
constexpr int IMULH_M = 7;
|
||||
constexpr int ISMULH_R = 8;
|
||||
constexpr int ISMULH_M = 9;
|
||||
constexpr int IMUL_RCP = 10;
|
||||
constexpr int INEG_R = 11;
|
||||
constexpr int IXOR_R = 12;
|
||||
constexpr int IXOR_M = 13;
|
||||
constexpr int IROR_R = 14;
|
||||
constexpr int IROL_R = 15;
|
||||
constexpr int ISWAP_R = 16;
|
||||
constexpr int FSWAP_R = 17;
|
||||
constexpr int FADD_R = 18;
|
||||
constexpr int FADD_M = 19;
|
||||
constexpr int FSUB_R = 20;
|
||||
constexpr int FSUB_M = 21;
|
||||
constexpr int FSCAL_R = 22;
|
||||
constexpr int FMUL_R = 23;
|
||||
constexpr int FDIV_M = 24;
|
||||
constexpr int FSQRT_R = 25;
|
||||
constexpr int CBRANCH = 26;
|
||||
constexpr int CFROUND = 27;
|
||||
constexpr int ISTORE = 28;
|
||||
constexpr int NOP = 29;
|
||||
}
|
||||
enum class InstructionType : uint16_t {
|
||||
IADD_RS = 0,
|
||||
IADD_M = 1,
|
||||
ISUB_R = 2,
|
||||
ISUB_M = 3,
|
||||
IMUL_R = 4,
|
||||
IMUL_M = 5,
|
||||
IMULH_R = 6,
|
||||
IMULH_M = 7,
|
||||
ISMULH_R = 8,
|
||||
ISMULH_M = 9,
|
||||
IMUL_RCP = 10,
|
||||
INEG_R = 11,
|
||||
IXOR_R = 12,
|
||||
IXOR_M = 13,
|
||||
IROR_R = 14,
|
||||
IROL_R = 15,
|
||||
ISWAP_R = 16,
|
||||
FSWAP_R = 17,
|
||||
FADD_R = 18,
|
||||
FADD_M = 19,
|
||||
FSUB_R = 20,
|
||||
FSUB_M = 21,
|
||||
FSCAL_R = 22,
|
||||
FMUL_R = 23,
|
||||
FDIV_M = 24,
|
||||
FSQRT_R = 25,
|
||||
CBRANCH = 26,
|
||||
CFROUND = 27,
|
||||
ISTORE = 28,
|
||||
NOP = 29,
|
||||
};
|
||||
|
||||
class Instruction {
|
||||
public:
|
||||
|
|
|
@ -306,7 +306,7 @@ namespace randomx {
|
|||
}
|
||||
|
||||
void JitCompilerX86::generateSuperscalarCode(Instruction& instr, std::vector<uint64_t> &reciprocalCache) {
|
||||
switch (instr.opcode)
|
||||
switch ((SuperscalarInstructionType)instr.opcode)
|
||||
{
|
||||
case randomx::SuperscalarInstructionType::ISUB_R:
|
||||
emit(REX_SUB_RR);
|
||||
|
|
|
@ -40,7 +40,7 @@ OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|||
|
||||
namespace randomx {
|
||||
|
||||
static bool isMultiplication(int type) {
|
||||
static bool isMultiplication(SuperscalarInstructionType type) {
|
||||
return type == SuperscalarInstructionType::IMUL_R || type == SuperscalarInstructionType::IMULH_R || type == SuperscalarInstructionType::ISMULH_R || type == SuperscalarInstructionType::IMUL_RCP;
|
||||
}
|
||||
|
||||
|
@ -167,7 +167,7 @@ namespace randomx {
|
|||
const MacroOp& getOp(int index) const {
|
||||
return ops_[index];
|
||||
}
|
||||
int getType() const {
|
||||
SuperscalarInstructionType getType() const {
|
||||
return type_;
|
||||
}
|
||||
int getResultOp() const {
|
||||
|
@ -196,7 +196,7 @@ namespace randomx {
|
|||
static const SuperscalarInstructionInfo NOP;
|
||||
private:
|
||||
const char* name_;
|
||||
int type_;
|
||||
SuperscalarInstructionType type_;
|
||||
std::vector<MacroOp> ops_;
|
||||
int latency_;
|
||||
int resultOp_ = 0;
|
||||
|
@ -204,13 +204,13 @@ namespace randomx {
|
|||
int srcOp_;
|
||||
|
||||
SuperscalarInstructionInfo(const char* name)
|
||||
: name_(name), type_(-1), latency_(0) {}
|
||||
SuperscalarInstructionInfo(const char* name, int type, const MacroOp& op, int srcOp)
|
||||
: name_(name), type_(SuperscalarInstructionType::INVALID), latency_(0) {}
|
||||
SuperscalarInstructionInfo(const char* name, SuperscalarInstructionType type, const MacroOp& op, int srcOp)
|
||||
: name_(name), type_(type), latency_(op.getLatency()), srcOp_(srcOp) {
|
||||
ops_.push_back(MacroOp(op));
|
||||
}
|
||||
template <size_t N>
|
||||
SuperscalarInstructionInfo(const char* name, int type, const MacroOp(&arr)[N], int resultOp, int dstOp, int srcOp)
|
||||
SuperscalarInstructionInfo(const char* name, SuperscalarInstructionType type, const MacroOp(&arr)[N], int resultOp, int dstOp, int srcOp)
|
||||
: name_(name), type_(type), latency_(0), resultOp_(resultOp), dstOp_(dstOp), srcOp_(srcOp) {
|
||||
for (unsigned i = 0; i < N; ++i) {
|
||||
ops_.push_back(MacroOp(arr[i]));
|
||||
|
@ -267,7 +267,7 @@ namespace randomx {
|
|||
const char* getName() const {
|
||||
return name_;
|
||||
}
|
||||
const DecoderBuffer* fetchNext(int instrType, int cycle, int mulCount, Blake2Generator& gen) const {
|
||||
const DecoderBuffer* fetchNext(SuperscalarInstructionType instrType, int cycle, int mulCount, Blake2Generator& gen) const {
|
||||
//If the current RandomX instruction is "IMULH", the next fetch configuration must be 3-3-10
|
||||
//because the full 128-bit multiplication instruction is 3 bytes long and decodes to 2 uOPs on Intel CPUs.
|
||||
//Intel CPUs can decode at most 4 uOPs per cycle, so this requires a 2-1-1 configuration for a total of 3 macro ops.
|
||||
|
@ -345,9 +345,9 @@ namespace randomx {
|
|||
|
||||
class RegisterInfo {
|
||||
public:
|
||||
RegisterInfo() : latency(0), lastOpGroup(-1), lastOpPar(-1), value(0) {}
|
||||
RegisterInfo() : latency(0), lastOpGroup(SuperscalarInstructionType::INVALID), lastOpPar(-1), value(0) {}
|
||||
int latency;
|
||||
int lastOpGroup;
|
||||
SuperscalarInstructionType lastOpGroup;
|
||||
int lastOpPar;
|
||||
int value;
|
||||
};
|
||||
|
@ -356,7 +356,7 @@ namespace randomx {
|
|||
class SuperscalarInstruction {
|
||||
public:
|
||||
void toInstr(Instruction& instr) { //translate to a RandomX instruction format
|
||||
instr.opcode = getType();
|
||||
instr.opcode = (int)getType();
|
||||
instr.dst = dst_;
|
||||
instr.src = src_ >= 0 ? src_ : dst_;
|
||||
instr.setMod(mod_);
|
||||
|
@ -534,7 +534,7 @@ namespace randomx {
|
|||
return false;
|
||||
}
|
||||
|
||||
int getType() {
|
||||
SuperscalarInstructionType getType() {
|
||||
return info_->getType();
|
||||
}
|
||||
int getSource() {
|
||||
|
@ -543,7 +543,7 @@ namespace randomx {
|
|||
int getDestination() {
|
||||
return dst_;
|
||||
}
|
||||
int getGroup() {
|
||||
SuperscalarInstructionType getGroup() {
|
||||
return opGroup_;
|
||||
}
|
||||
int getGroupPar() {
|
||||
|
@ -562,7 +562,7 @@ namespace randomx {
|
|||
int dst_ = -1;
|
||||
int mod_;
|
||||
uint32_t imm32_;
|
||||
int opGroup_;
|
||||
SuperscalarInstructionType opGroup_;
|
||||
int opGroupPar_;
|
||||
bool canReuse_ = false;
|
||||
bool groupParIsSource_ = false;
|
||||
|
@ -849,40 +849,40 @@ namespace randomx {
|
|||
void executeSuperscalar(int_reg_t(&r)[8], SuperscalarProgram& prog, std::vector<uint64_t> *reciprocals) {
|
||||
for (unsigned j = 0; j < prog.getSize(); ++j) {
|
||||
Instruction& instr = prog(j);
|
||||
switch (instr.opcode)
|
||||
switch ((SuperscalarInstructionType)instr.opcode)
|
||||
{
|
||||
case randomx::SuperscalarInstructionType::ISUB_R:
|
||||
case SuperscalarInstructionType::ISUB_R:
|
||||
r[instr.dst] -= r[instr.src];
|
||||
break;
|
||||
case randomx::SuperscalarInstructionType::IXOR_R:
|
||||
case SuperscalarInstructionType::IXOR_R:
|
||||
r[instr.dst] ^= r[instr.src];
|
||||
break;
|
||||
case randomx::SuperscalarInstructionType::IADD_RS:
|
||||
case SuperscalarInstructionType::IADD_RS:
|
||||
r[instr.dst] += r[instr.src] << instr.getModShift();
|
||||
break;
|
||||
case randomx::SuperscalarInstructionType::IMUL_R:
|
||||
case SuperscalarInstructionType::IMUL_R:
|
||||
r[instr.dst] *= r[instr.src];
|
||||
break;
|
||||
case randomx::SuperscalarInstructionType::IROR_C:
|
||||
case SuperscalarInstructionType::IROR_C:
|
||||
r[instr.dst] = rotr(r[instr.dst], instr.getImm32());
|
||||
break;
|
||||
case randomx::SuperscalarInstructionType::IADD_C7:
|
||||
case randomx::SuperscalarInstructionType::IADD_C8:
|
||||
case randomx::SuperscalarInstructionType::IADD_C9:
|
||||
case SuperscalarInstructionType::IADD_C7:
|
||||
case SuperscalarInstructionType::IADD_C8:
|
||||
case SuperscalarInstructionType::IADD_C9:
|
||||
r[instr.dst] += signExtend2sCompl(instr.getImm32());
|
||||
break;
|
||||
case randomx::SuperscalarInstructionType::IXOR_C7:
|
||||
case randomx::SuperscalarInstructionType::IXOR_C8:
|
||||
case randomx::SuperscalarInstructionType::IXOR_C9:
|
||||
case SuperscalarInstructionType::IXOR_C7:
|
||||
case SuperscalarInstructionType::IXOR_C8:
|
||||
case SuperscalarInstructionType::IXOR_C9:
|
||||
r[instr.dst] ^= signExtend2sCompl(instr.getImm32());
|
||||
break;
|
||||
case randomx::SuperscalarInstructionType::IMULH_R:
|
||||
case SuperscalarInstructionType::IMULH_R:
|
||||
r[instr.dst] = mulh(r[instr.dst], r[instr.src]);
|
||||
break;
|
||||
case randomx::SuperscalarInstructionType::ISMULH_R:
|
||||
case SuperscalarInstructionType::ISMULH_R:
|
||||
r[instr.dst] = smulh(r[instr.dst], r[instr.src]);
|
||||
break;
|
||||
case randomx::SuperscalarInstructionType::IMUL_RCP:
|
||||
case SuperscalarInstructionType::IMUL_RCP:
|
||||
if (reciprocals != nullptr)
|
||||
r[instr.dst] *= (*reciprocals)[instr.getImm32()];
|
||||
else
|
||||
|
|
|
@ -35,25 +35,24 @@ OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|||
|
||||
namespace randomx {
|
||||
// Intel Ivy Bridge reference
|
||||
namespace SuperscalarInstructionType { //uOPs (decode) execution ports latency code size
|
||||
constexpr int ISUB_R = 0; //1 p015 1 3 (sub)
|
||||
constexpr int IXOR_R = 1; //1 p015 1 3 (xor)
|
||||
constexpr int IADD_RS = 2; //1 p01 1 4 (lea)
|
||||
constexpr int IMUL_R = 3; //1 p1 3 4 (imul)
|
||||
constexpr int IROR_C = 4; //1 p05 1 4 (ror)
|
||||
constexpr int IADD_C7 = 5; //1 p015 1 7 (add)
|
||||
constexpr int IXOR_C7 = 6; //1 p015 1 7 (xor)
|
||||
constexpr int IADD_C8 = 7; //1+0 p015 1 7+1 (add+nop)
|
||||
constexpr int IXOR_C8 = 8; //1+0 p015 1 7+1 (xor+nop)
|
||||
constexpr int IADD_C9 = 9; //1+0 p015 1 7+2 (add+nop)
|
||||
constexpr int IXOR_C9 = 10; //1+0 p015 1 7+2 (xor+nop)
|
||||
constexpr int IMULH_R = 11; //1+2+1 0+(p1,p5)+0 3 3+3+3 (mov+mul+mov)
|
||||
constexpr int ISMULH_R = 12; //1+2+1 0+(p1,p5)+0 3 3+3+3 (mov+imul+mov)
|
||||
constexpr int IMUL_RCP = 13; //1+1 p015+p1 4 10+4 (mov+imul)
|
||||
enum class SuperscalarInstructionType { //uOPs (decode) execution ports latency code size
|
||||
ISUB_R = 0, //1 p015 1 3 (sub)
|
||||
IXOR_R = 1, //1 p015 1 3 (xor)
|
||||
IADD_RS = 2, //1 p01 1 4 (lea)
|
||||
IMUL_R = 3, //1 p1 3 4 (imul)
|
||||
IROR_C = 4, //1 p05 1 4 (ror)
|
||||
IADD_C7 = 5, //1 p015 1 7 (add)
|
||||
IXOR_C7 = 6, //1 p015 1 7 (xor)
|
||||
IADD_C8 = 7, //1+0 p015 1 7+1 (add+nop)
|
||||
IXOR_C8 = 8, //1+0 p015 1 7+1 (xor+nop)
|
||||
IADD_C9 = 9, //1+0 p015 1 7+2 (add+nop)
|
||||
IXOR_C9 = 10, //1+0 p015 1 7+2 (xor+nop)
|
||||
IMULH_R = 11, //1+2+1 0+(p1,p5)+0 3 3+3+3 (mov+mul+mov)
|
||||
ISMULH_R = 12, //1+2+1 0+(p1,p5)+0 3 3+3+3 (mov+imul+mov)
|
||||
IMUL_RCP = 13, //1+1 p015+p1 4 10+4 (mov+imul)
|
||||
|
||||
constexpr int COUNT = 14;
|
||||
constexpr int INVALID = -1;
|
||||
}
|
||||
INVALID = -1
|
||||
};
|
||||
|
||||
void generateSuperscalar(SuperscalarProgram& prog, Blake2Generator& gen);
|
||||
void executeSuperscalar(uint64_t(&r)[8], SuperscalarProgram& prog, std::vector<uint64_t> *reciprocals = nullptr);
|
||||
|
|
|
@ -50,7 +50,7 @@ namespace randomx {
|
|||
uint64_t imm;
|
||||
int64_t simm;
|
||||
};
|
||||
uint16_t type;
|
||||
InstructionType type;
|
||||
union {
|
||||
int16_t target;
|
||||
uint16_t shift;
|
||||
|
@ -58,6 +58,8 @@ namespace randomx {
|
|||
uint32_t memMask;
|
||||
};
|
||||
|
||||
static_assert(sizeof(InstructionByteCode) == 32, "Invalid packing of struct InstructionByteCode");
|
||||
|
||||
template<class Allocator, bool softAes>
|
||||
class InterpretedVm : public VmBase<Allocator, softAes> {
|
||||
public:
|
||||
|
|
Loading…
Reference in a new issue