namespace X86Disassembler.X86; using Operands; /// /// Handles decoding of ModR/M bytes in x86 instructions /// public class ModRMDecoder { // ModR/M byte masks private const byte MOD_MASK = 0xC0; // 11000000b private const byte REG_MASK = 0x38; // 00111000b private const byte RM_MASK = 0x07; // 00000111b // SIB byte masks private const byte SIB_SCALE_MASK = 0xC0; // 11000000b private const byte SIB_INDEX_MASK = 0x38; // 00111000b private const byte SIB_BASE_MASK = 0x07; // 00000111b // Register names for different sizes private static readonly string[] RegisterNames8 = {"al", "cl", "dl", "bl", "ah", "ch", "dh", "bh"}; private static readonly string[] RegisterNames16 = {"ax", "cx", "dx", "bx", "sp", "bp", "si", "di"}; private static readonly string[] RegisterNames32 = {"eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi"}; // The instruction decoder that owns this ModRM decoder private readonly InstructionDecoder _decoder; /// /// Initializes a new instance of the ModRMDecoder class /// /// The instruction decoder that owns this ModRM decoder public ModRMDecoder(InstructionDecoder decoder) { _decoder = decoder; } /// /// Maps the register index from the ModR/M byte to the RegisterIndex enum value /// /// The register index from the ModR/M byte (0-7) /// The corresponding RegisterIndex enum value private RegisterIndex MapModRMToRegisterIndex(int modRMRegIndex) { // The mapping from ModR/M register index to RegisterIndex enum is: // 0 -> A (EAX) // 1 -> C (ECX) // 2 -> D (EDX) // 3 -> B (EBX) // 4 -> Sp (ESP) // 5 -> Bp (EBP) // 6 -> Si (ESI) // 7 -> Di (EDI) return modRMRegIndex switch { 0 => RegisterIndex.A, // EAX 1 => RegisterIndex.C, // ECX 2 => RegisterIndex.D, // EDX 3 => RegisterIndex.B, // EBX 4 => RegisterIndex.Sp, // ESP 5 => RegisterIndex.Bp, // EBP 6 => RegisterIndex.Si, // ESI 7 => RegisterIndex.Di, // EDI _ => RegisterIndex.A // Default to EAX }; } /// /// Maps the register index from the ModR/M byte to the RegisterIndex enum value for 8-bit high registers /// /// The register index from the ModR/M byte (0-7) /// The corresponding RegisterIndex enum value for 8-bit high registers private RegisterIndex MapModRMToHighRegister8Index(int modRMRegIndex) { // For 8-bit high registers (AH, CH, DH, BH), the mapping is different return modRMRegIndex switch { 4 => RegisterIndex.A, // AH 5 => RegisterIndex.C, // CH 6 => RegisterIndex.D, // DH 7 => RegisterIndex.B, // BH _ => MapModRMToRegisterIndex(modRMRegIndex) // Fall back to normal mapping for other indices }; } /// /// Decodes a ModR/M byte to get the operand /// /// The mod field (2 bits) /// The r/m field as RegisterIndex /// True if the operand is 64-bit /// The operand object public Operand DecodeModRM(byte mod, RegisterIndex rmIndex, bool is64Bit) { int operandSize = is64Bit ? 64 : 32; switch (mod) { case 0: // [reg] or disp32 // Special case: [EBP] is encoded as disp32 with no base register if (rmIndex == RegisterIndex.Bp) // disp32 (was EBP/BP) { if (_decoder.CanReadUInt()) { uint disp32 = _decoder.ReadUInt32(); return OperandFactory.CreateDirectMemoryOperand(disp32, operandSize); } // Fallback for incomplete data return OperandFactory.CreateDirectMemoryOperand(0, operandSize); } // Special case: [ESP] is encoded with SIB byte if (rmIndex == RegisterIndex.Sp) // SIB (was ESP/SP) { // Handle SIB byte if (_decoder.CanReadByte()) { byte sib = _decoder.ReadByte(); return DecodeSIB(sib, 0, is64Bit); } // Fallback for incomplete data return OperandFactory.CreateBaseRegisterMemoryOperand(RegisterIndex.Sp, operandSize); } // Regular case: [reg] return OperandFactory.CreateBaseRegisterMemoryOperand(rmIndex, operandSize); case 1: // [reg + disp8] if (rmIndex == RegisterIndex.Sp) // SIB + disp8 (ESP/SP) { // Handle SIB byte if (_decoder.CanReadByte()) { byte sib = _decoder.ReadByte(); sbyte disp8 = (sbyte)(_decoder.CanReadByte() ? _decoder.ReadByte() : 0); return DecodeSIB(sib, (uint)disp8, is64Bit); } // Fallback for incomplete data return OperandFactory.CreateBaseRegisterMemoryOperand(RegisterIndex.Sp, operandSize); } else { if (_decoder.CanReadByte()) { sbyte disp8 = (sbyte)_decoder.ReadByte(); // For EBP (BP), always create a displacement memory operand, even if displacement is 0 // This is because [EBP] with no displacement is encoded as [EBP+0] if (disp8 == 0 && rmIndex != RegisterIndex.Bp) { return OperandFactory.CreateBaseRegisterMemoryOperand(rmIndex, operandSize); } return OperandFactory.CreateDisplacementMemoryOperand(rmIndex, disp8, operandSize); } // Fallback for incomplete data return OperandFactory.CreateBaseRegisterMemoryOperand(rmIndex, operandSize); } case 2: // [reg + disp32] if (rmIndex == RegisterIndex.Sp) // SIB + disp32 (ESP/SP) { // Handle SIB byte if (_decoder.CanReadUInt()) { byte sib = _decoder.ReadByte(); uint disp32 = _decoder.ReadUInt32(); return DecodeSIB(sib, disp32, is64Bit); } // Fallback for incomplete data return OperandFactory.CreateBaseRegisterMemoryOperand(RegisterIndex.Sp, operandSize); } else { if (_decoder.CanReadUInt()) { uint disp32 = _decoder.ReadUInt32(); // For EBP (BP), always create a displacement memory operand, even if displacement is 0 // This is because [EBP] with no displacement is encoded as [EBP+disp] if (rmIndex == RegisterIndex.Bp) { return OperandFactory.CreateDisplacementMemoryOperand(rmIndex, (int)disp32, operandSize); } // Only show displacement if it's not zero if (disp32 == 0) { return OperandFactory.CreateBaseRegisterMemoryOperand(rmIndex, operandSize); } return OperandFactory.CreateDisplacementMemoryOperand(rmIndex, (int)disp32, operandSize); } // Fallback for incomplete data return OperandFactory.CreateBaseRegisterMemoryOperand(rmIndex, operandSize); } case 3: // reg (direct register access) return OperandFactory.CreateRegisterOperand(rmIndex, operandSize); default: // Fallback for invalid mod value return OperandFactory.CreateRegisterOperand(RegisterIndex.A, operandSize); } } /// /// Peaks a ModR/M byte and returns the raw field values, without advancing position /// /// A tuple containing the raw mod, reg, and rm fields from the ModR/M byte public byte PeakModRMReg() { if (!_decoder.CanReadByte()) { return 0; } byte modRM = _decoder.PeakByte(); // Extract fields from ModR/M byte byte regIndex = (byte)((modRM & REG_MASK) >> 3); // Middle 3 bits (bits 3-5) return regIndex; } /// /// Reads a ModR/M byte and returns the raw field values /// /// A tuple containing the raw mod, reg, and rm fields from the ModR/M byte public (byte mod, byte reg, byte rm) ReadModRMRaw() { if (!_decoder.CanReadByte()) { return (0, 0, 0); } byte modRM = _decoder.ReadByte(); // Extract fields from ModR/M byte byte mod = (byte)((modRM & MOD_MASK) >> 6); // Top 2 bits (bits 6-7) byte regIndex = (byte)((modRM & REG_MASK) >> 3); // Middle 3 bits (bits 3-5) byte rmIndex = (byte)(modRM & RM_MASK); // Bottom 3 bits (bits 0-2) return (mod, regIndex, rmIndex); } /// /// Reads and decodes a ModR/M byte for standard 32-bit operands /// /// A tuple containing the mod, reg, rm fields and the decoded operand public (byte mod, RegisterIndex reg, RegisterIndex rm, Operand operand) ReadModRM() { return ReadModRMInternal(false, false); } /// /// Reads and decodes a ModR/M byte for 64-bit operands /// /// A tuple containing the mod, reg, rm fields and the decoded operand public (byte mod, RegisterIndex reg, RegisterIndex rm, Operand operand) ReadModRM64() { return ReadModRMInternal(true, false); } /// /// Reads and decodes a ModR/M byte for 8-bit operands /// /// A tuple containing the mod, reg, rm fields and the decoded operand public (byte mod, RegisterIndex reg, RegisterIndex rm, Operand operand) ReadModRM8() { return ReadModRMInternal(false, true); } /// /// Internal implementation for reading and decoding a ModR/M byte /// /// True if the operand is 64-bit /// True if the operand is 8-bit /// A tuple containing the mod, reg, rm fields and the decoded operand private (byte mod, RegisterIndex reg, RegisterIndex rm, Operand operand) ReadModRMInternal(bool is64Bit, bool is8Bit) { if (!_decoder.CanReadByte()) { return (0, RegisterIndex.A, RegisterIndex.A, OperandFactory.CreateRegisterOperand(RegisterIndex.A, is64Bit ? 64 : (is8Bit ? 8 : 32))); } byte modRM = _decoder.ReadByte(); // Extract fields from ModR/M byte byte mod = (byte)((modRM & MOD_MASK) >> 6); byte regIndex = (byte)((modRM & REG_MASK) >> 3); byte rmIndex = (byte)(modRM & RM_MASK); // For 8-bit registers with mod=3, we need to check if they are high registers bool isRmHighRegister = is8Bit && mod == 3 && rmIndex >= 4; bool isRegHighRegister = is8Bit && regIndex >= 4; // Map the ModR/M register indices to RegisterIndex enum values RegisterIndex reg = isRegHighRegister ? MapModRMToHighRegister8Index(regIndex) : MapModRMToRegisterIndex(regIndex); RegisterIndex rm = isRmHighRegister ? MapModRMToHighRegister8Index(rmIndex) : MapModRMToRegisterIndex(rmIndex); // Create the operand based on the mod and rm fields Operand operand = DecodeModRM(mod, rm, is64Bit); // For 8-bit operands, set the size to 8 if (is8Bit) { operand.Size = 8; } return (mod, reg, rm, operand); } /// /// Decodes a SIB byte /// /// The SIB byte /// The displacement value /// True if the operand is 64-bit /// The decoded SIB operand private Operand DecodeSIB(byte sib, uint displacement, bool is64Bit) { int operandSize = is64Bit ? 64 : 32; // Extract fields from SIB byte byte scale = (byte)((sib & SIB_SCALE_MASK) >> 6); int indexIndex = (sib & SIB_INDEX_MASK) >> 3; int baseIndex = sib & SIB_BASE_MASK; // Map the SIB register indices to RegisterIndex enum values RegisterIndex index = MapModRMToRegisterIndex(indexIndex); RegisterIndex @base = MapModRMToRegisterIndex(baseIndex); // Special case: ESP/SP (4) in index field means no index register if (index == RegisterIndex.Sp) { // Special case: EBP/BP (5) in base field with no displacement means disp32 only if (@base == RegisterIndex.Bp && displacement == 0) { if (_decoder.CanReadUInt()) { uint disp32 = _decoder.ReadUInt32(); int scaleValue = 1 << scale; // 1, 2, 4, or 8 // Create a scaled index memory operand with displacement but no base register return OperandFactory.CreateScaledIndexMemoryOperand( index, scaleValue, null, (int)disp32, operandSize); } // Fallback for incomplete data return OperandFactory.CreateScaledIndexMemoryOperand( index, 1 << scale, null, 0, operandSize); } // Base register only with displacement if (displacement == 0) { return OperandFactory.CreateBaseRegisterMemoryOperand(@base, operandSize); } return OperandFactory.CreateDisplacementMemoryOperand(@base, (int)displacement, operandSize); } // Special case: EBP/BP (5) in base field with no displacement means disp32 only if (@base == RegisterIndex.Bp && displacement == 0) { if (_decoder.CanReadUInt()) { uint disp32 = _decoder.ReadUInt32(); int scaleValue = 1 << scale; // 1, 2, 4, or 8 // Create a scaled index memory operand with displacement but no base register return OperandFactory.CreateScaledIndexMemoryOperand( index, scaleValue, null, (int)disp32, operandSize); } // Fallback for incomplete data return OperandFactory.CreateScaledIndexMemoryOperand( index, 1 << scale, null, 0, operandSize); } // Normal case with base and index registers int scaleFactor = 1 << scale; // 1, 2, 4, or 8 // Create a scaled index memory operand return OperandFactory.CreateScaledIndexMemoryOperand( index, scaleFactor, @base, (int)displacement, operandSize); } /// /// Gets the register name based on the register index and size /// /// The register index as RegisterIndex enum /// The register size (8, 16, or 32 bits) /// The register name public static string GetRegisterName(RegisterIndex regIndex, int size) { // Convert RegisterIndex to raw index for array access int index = (int)regIndex; return size switch { 8 => RegisterNames8[index], 16 => RegisterNames16[index], 32 => RegisterNames32[index], _ => RegisterNames32[index] // Default to 32-bit registers }; } }