package asm import ( "fmt" "math" ) type NewAssembler func(temporaryRegister Register) (AssemblerBase, error) // Register represents architecture-specific registers. type Register byte // NilRegister is the only architecture-independent register, and // can be used to indicate that no register is specified. const NilRegister Register = 0 // Instruction represents architecture-specific instructions. type Instruction uint16 // to accommodate the high cardinality of vector ops // ConditionalRegisterState represents architecture-specific conditional // register's states. type ConditionalRegisterState byte // ConditionalRegisterStateUnset is the only architecture-independent conditional state, and // can be used to indicate that no conditional state is specified. const ConditionalRegisterStateUnset ConditionalRegisterState = 0 // Node represents a node in the linked list of assembled operations. type Node interface { fmt.Stringer // AssignJumpTarget assigns the given target node as the destination of // jump instruction for this Node. AssignJumpTarget(target Node) // AssignDestinationConstant assigns the given constant as the destination // of the instruction for this node. AssignDestinationConstant(value ConstantValue) // AssignSourceConstant assigns the given constant as the source // of the instruction for this node. AssignSourceConstant(value ConstantValue) // OffsetInBinary returns the offset of this node in the assembled binary. OffsetInBinary() NodeOffsetInBinary } // NodeOffsetInBinary represents an offset of this node in the final binary. type NodeOffsetInBinary = uint64 // ConstantValue represents a constant value used in an instruction. type ConstantValue = int64 // StaticConst represents an arbitrary constant bytes which are pooled and emitted by assembler into the binary. // These constants can be referenced by instructions. type StaticConst = []byte // StaticConstKey returns a string whose underlying bytes equal the original const. func StaticConstKey(c StaticConst) string { return string(c) } // AssemblerBase is the common interface for assemblers among multiple architectures. // // Note: some of them can be implemented in an arch-independent way, but not all can be // implemented as such. However, we intentionally put such arch-dependant methods here // in order to provide the common documentation interface. // // Note: this interface is coupled and heavily influenced by golang-asm's API (i.e. Go's official assembler). // Therefore, we will do the refactoring after golang-asm removal. type AssemblerBase interface { // Assemble produces the final binary for the assembled operations. Assemble() ([]byte, error) // SetJumpTargetOnNext instructs the assembler that the next node must be // assigned to the given node's jump destination. SetJumpTargetOnNext(nodes ...Node) // BuildJumpTable calculates the offsets between the first instruction `initialInstructions[0]` // and others (e.g. initialInstructions[3]), and wrote the calculated offsets into pre-allocated // `table` slice in little endian. // // TODO: This can be hidden into assembler implementation after golang-asm removal. BuildJumpTable(table []byte, initialInstructions []Node) // CompileStandAlone adds an instruction to take no arguments. CompileStandAlone(instruction Instruction) Node // CompileConstToRegister adds an instruction where source operand is `value` as constant and destination is `destinationReg` register. CompileConstToRegister(instruction Instruction, value ConstantValue, destinationReg Register) Node // CompileRegisterToRegister adds an instruction where source and destination operands are registers. CompileRegisterToRegister(instruction Instruction, from, to Register) // CompileMemoryToRegister adds an instruction where source operands is the memory address specified by `sourceBaseReg+sourceOffsetConst` // and the destination is `destinationReg` register. CompileMemoryToRegister( instruction Instruction, sourceBaseReg Register, sourceOffsetConst ConstantValue, destinationReg Register, ) // CompileRegisterToMemory adds an instruction where source operand is `sourceRegister` register and the destination is the // memory address specified by `destinationBaseRegister+destinationOffsetConst`. CompileRegisterToMemory( instruction Instruction, sourceRegister Register, destinationBaseRegister Register, destinationOffsetConst ConstantValue, ) // CompileJump adds jump-type instruction and returns the corresponding Node in the assembled linked list. CompileJump(jmpInstruction Instruction) Node // CompileJumpToRegister adds jump-type instruction whose destination is the memory address specified by `reg` register. CompileJumpToRegister(jmpInstruction Instruction, reg Register) // CompileReadInstructionAddress adds an ADR instruction to set the absolute address of "target instruction" // into destinationRegister. "target instruction" is specified by beforeTargetInst argument and // the target is determined by "the instruction right after beforeTargetInst type". // // For example, if `beforeTargetInst == RET` and we have the instruction sequence like // `ADR -> X -> Y -> ... -> RET -> MOV`, then the `ADR` instruction emitted by this function set the absolute // address of `MOV` instruction into the destination register. CompileReadInstructionAddress(destinationRegister Register, beforeAcquisitionTargetInstruction Instruction) } // JumpTableMaximumOffset represents the limit on the size of jump table in bytes. // When users try loading an extremely large WebAssembly binary which contains a br_table // statement with approximately 4294967296 (2^32) targets. Realistically speaking, that kind of binary // could result in more than ten gigabytes of native compiled code where we have to care about // huge stacks whose height might exceed 32-bit range, and such huge stack doesn't work with the // current implementation. const JumpTableMaximumOffset = math.MaxUint32