/**
* vim: set ts=4 :
* ================================================================
* SourceMod BinTools Extension
* Copyright (C) 2004-2007 AlliedModders LLC. All rights reserved.
* ================================================================
*
* This program is free software; you can redistribute it and/or
* modify it under the terms of the GNU General Public License,
* version 3.0, as published by the Free Software Foundation.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program. If not, see <http://www.gnu.org/licenses/>.
*
* As a special exception, AlliedModders LLC gives you permission to
* link the code of this program (as well as its derivative works) to
* "Half-Life 2," the "Source Engine," the "SourcePawn JIT," and any
* Game MODs that run on software by the Valve Corporation. You must
* obey the GNU General Public License in all respects for all other
* code used. Additionally, AlliedModders LLC grants this exception
* to all derivative works. AlliedModders LLC defines further
* exceptions, found in LICENSE.txt (as of this writing, version
* JULY-31-2007), or <http://www.sourcemod.net/license.php>.
*
* Version: $Id$
*/
#include
#include "extension.h"
#include
#include
#include "jit_call.h"
/* File-wide state shared by the code emitters below while one wrapper is compiled. */
/* Running total of bytes the parameter-push helpers have placed on the stack in the current pass. */
jit_uint32_t g_StackUsage = 0;
/* Padding the prologue subtracts from ESP; computed by JIT_Compile from the first pass's g_StackUsage. */
jit_uint32_t g_StackAlign = 0;
/* Rotating counter fed to _DecodeRegister3 to pick the next scratch register. */
jit_uint32_t g_RegDecoder = 0;
/********************
* Assembly Helpers *
********************/
/**
 * Maps a counter onto one of three scratch registers, cycling
 * EAX -> EDX -> ECX as the counter increases.
 *
 * @param val	Arbitrary counter value; only (val % 3) matters.
 * @return		REG_EAX, REG_EDX or REG_ECX.
 */
inline jit_uint8_t _DecodeRegister3(jit_uint32_t val)
{
	const jit_uint32_t slot = val % 3;

	if (slot == 0)
	{
		return REG_EAX;
	}
	if (slot == 1)
	{
		return REG_EDX;
	}
	if (slot == 2)
	{
		return REG_ECX;
	}

	/* Not reachable: a remainder of 3 is always 0, 1 or 2 */
	return 0xFF;
}
/********************
* Assembly Opcodes *
********************/
/**
 * Emits the entry sequence of the generated wrapper.
 *
 * Generated code:
 *   push ebp
 *   mov  ebp, esp
 *   [non-void]    push edi ; mov edi, [ebp+12]   (EDI is later used as the return buffer pointer)
 *   [has_params]  push ebx ; mov ebx, [ebp+8]    (EBX is later used as the parameter data base)
 *   push esi
 *   mov  esi, esp                                (ESI remembers ESP before alignment)
 *   and  esp, 0xFFFFFFF0
 *   sub  esp, <alignment padding>
 *
 * @param jit			Code writer.
 * @param is_void		True if the callee returns nothing (EDI is then left untouched).
 * @param has_params	True if the wrapper reads parameter data (EBX is then set up).
 */
inline void Write_Execution_Prologue(JitWriter *jit, bool is_void, bool has_params)
{
	/* Standard frame setup */
	IA32_Push_Reg(jit, REG_EBP);
	IA32_Mov_Reg_Rm(jit, REG_EBP, REG_ESP, MOD_REG);

	const bool returns_value = !is_void;
	if (returns_value)
	{
		IA32_Push_Reg(jit, REG_EDI);
		IA32_Mov_Reg_Rm_Disp8(jit, REG_EDI, REG_EBP, 12);
	}

	if (has_params)
	{
		IA32_Push_Reg(jit, REG_EBX);
		IA32_Mov_Reg_Rm_Disp8(jit, REG_EBX, REG_EBP, 8);
	}

	/* Save the unaligned stack pointer in ESI, then round ESP down to 16 bytes */
	IA32_Push_Reg(jit, REG_ESI);
	IA32_Mov_Reg_Rm(jit, REG_ESI, REG_ESP, MOD_REG);
	IA32_And_Rm_Imm8(jit, REG_ESP, MOD_REG, -16);

	if (!jit->outbase)
	{
		/* No output buffer yet: the real padding is unknown, so emit the
		 * instruction with a dummy immediate just to account for its size. */
		IA32_Sub_Rm_Imm32(jit, REG_ESP, 1337, MOD_REG);
	}
	else if (g_StackAlign)
	{
		IA32_Sub_Rm_Imm32(jit, REG_ESP, g_StackAlign, MOD_REG);
	}
}
/**
 * Emits the exit sequence of the generated wrapper, undoing what
 * Write_Execution_Prologue set up, in reverse order.
 *
 * Generated code:
 *   mov esp, esi
 *   pop esi
 *   [has_params]  pop ebx
 *   [non-void]    pop edi
 *   mov esp, ebp
 *   pop ebp
 *   ret
 *
 * @param jit			Code writer.
 * @param is_void		Must match the value given to the prologue.
 * @param has_params	Must match the value given to the prologue.
 */
inline void Write_Function_Epilogue(JitWriter *jit, bool is_void, bool has_params)
{
	/* Drop the aligned call area by restoring the ESP saved in ESI */
	IA32_Mov_Reg_Rm(jit, REG_ESP, REG_ESI, MOD_REG);
	IA32_Pop_Reg(jit, REG_ESI);

	/* Restore the callee-saved registers the prologue pushed */
	if (has_params)
	{
		IA32_Pop_Reg(jit, REG_EBX);
	}

	const bool returns_value = !is_void;
	if (returns_value)
	{
		IA32_Pop_Reg(jit, REG_EDI);
	}

	/* Tear down the frame and return */
	IA32_Mov_Reg_Rm(jit, REG_ESP, REG_EBP, MOD_REG);
	IA32_Pop_Reg(jit, REG_EBP);
	IA32_Return(jit);
}
/**
 * Emits code that pushes one plain-data parameter onto the stack.
 *
 * The parameter is read from [ebx + pEnc->offset]. By-value parameters of
 * 1, 2, 4 or 8 bytes are loaded into a scratch register (two for 8 bytes)
 * and pushed; other by-value sizes emit nothing. By-reference parameters
 * push the address ebx + offset instead.
 *
 * g_StackUsage is increased by the number of bytes pushed and g_RegDecoder
 * is advanced for every scratch register taken.
 *
 * @param jit	Code writer.
 * @param pEnc	Parameter description (flags, size and offset are read).
 */
inline void Write_PushPOD(JitWriter *jit, const PassEncode *pEnc)
{
	/* A scratch register is always reserved, even on paths that end up not using it */
	jit_uint8_t reg = _DecodeRegister3(g_RegDecoder++);

	if (pEnc->info.flags & PASSFLAG_BYVAL)
	{
		switch (pEnc->info.size)
		{
		case 1:
			{
				//movzx reg, BYTE PTR [ebx+<offset>]
				//push reg
				/* Test for zero first: 0 also satisfies the Disp8 check, which would
				 * otherwise make the displacement-free form unreachable. */
				if (!pEnc->offset)
				{
					IA32_Movzx_Reg32_Rm8(jit, reg, REG_EBX, MOD_MEM_REG);
				} else if (pEnc->offset < SCHAR_MAX) {
					IA32_Movzx_Reg32_Rm8_Disp8(jit, reg, REG_EBX, (jit_int8_t)pEnc->offset);
				} else {
					IA32_Movzx_Reg32_Rm8_Disp32(jit, reg, REG_EBX, pEnc->offset);
				}
				IA32_Push_Reg(jit, reg);
				g_StackUsage += 4;
				break;
			}
		case 2:
			{
				//movzx reg, WORD PTR [ebx+<offset>]
				//push reg
				/* NOTE(review): an operand-size prefix in front of movzx presumably narrows
				 * the destination to 16 bits, leaving the upper half of reg unchanged.
				 * Kept as in the original; confirm whether the prefix is intended. */
				jit->write_ubyte(IA32_16BIT_PREFIX);
				if (!pEnc->offset)
				{
					IA32_Movzx_Reg32_Rm16(jit, reg, REG_EBX, MOD_MEM_REG);
				} else if (pEnc->offset < SCHAR_MAX) {
					IA32_Movzx_Reg32_Rm16_Disp8(jit, reg, REG_EBX, (jit_int8_t)pEnc->offset);
				} else {
					IA32_Movzx_Reg32_Rm16_Disp32(jit, reg, REG_EBX, pEnc->offset);
				}
				IA32_Push_Reg(jit, reg);
				g_StackUsage += 4;
				break;
			}
		case 4:
			{
				//mov reg, DWORD PTR [ebx+<offset>]
				//push reg
				if (!pEnc->offset)
				{
					IA32_Mov_Reg_Rm(jit, reg, REG_EBX, MOD_MEM_REG);
				} else if (pEnc->offset < SCHAR_MAX) {
					IA32_Mov_Reg_Rm_Disp8(jit, reg, REG_EBX, (jit_int8_t)pEnc->offset);
				} else {
					IA32_Mov_Reg_Rm_Disp32(jit, reg, REG_EBX, pEnc->offset);
				}
				IA32_Push_Reg(jit, reg);
				g_StackUsage += 4;
				break;
			}
		case 8:
			{
				//mov reg, DWORD PTR [ebx+<offset>+4]
				//mov reg2, DWORD PTR [ebx+<offset>]
				//push reg
				//push reg2
				jit_uint8_t reg2 = _DecodeRegister3(g_RegDecoder++);

				/* Upper dword: offset+4 is never zero, so only Disp8/Disp32 apply */
				if (pEnc->offset+4 < SCHAR_MAX)
				{
					IA32_Mov_Reg_Rm_Disp8(jit, reg, REG_EBX, (jit_int8_t)(pEnc->offset+4));
				} else {
					IA32_Mov_Reg_Rm_Disp32(jit, reg, REG_EBX, pEnc->offset+4);
				}

				/* Lower dword goes into reg2 on every path (the zero-offset path
				 * previously targeted reg, which would have clobbered the upper dword). */
				if (!pEnc->offset)
				{
					IA32_Mov_Reg_Rm(jit, reg2, REG_EBX, MOD_MEM_REG);
				} else if (pEnc->offset < SCHAR_MAX) {
					IA32_Mov_Reg_Rm_Disp8(jit, reg2, REG_EBX, (jit_int8_t)pEnc->offset);
				} else {
					IA32_Mov_Reg_Rm_Disp32(jit, reg2, REG_EBX, pEnc->offset);
				}

				/* Upper dword is pushed first so the lower dword ends up at the lower address */
				IA32_Push_Reg(jit, reg);
				IA32_Push_Reg(jit, reg2);
				g_StackUsage += 8;
				break;
			}
		}
	} else if (pEnc->info.flags & PASSFLAG_BYREF) {
		//lea reg, [ebx+<offset>]
		//push reg
		if (!pEnc->offset)
		{
			/* Address is EBX itself; no lea needed */
			IA32_Push_Reg(jit, REG_EBX);
			g_StackUsage += 4;
			return;
		}
		if (pEnc->offset < SCHAR_MAX)
		{
			IA32_Lea_DispRegImm8(jit, reg, REG_EBX, (jit_int8_t)pEnc->offset);
		} else {
			IA32_Lea_DispRegImm32(jit, reg, REG_EBX, pEnc->offset);
		}
		IA32_Push_Reg(jit, reg);
		g_StackUsage += 4;
	}
}
/**
 * Emits code that pushes one floating point parameter onto the stack.
 *
 * By-value 4 and 8 byte values are loaded from [ebx + pEnc->offset] onto
 * the FPU stack and stored into freshly reserved stack space; other
 * by-value sizes emit nothing. By-reference parameters push the address
 * ebx + offset instead.
 *
 * g_StackUsage is increased by the number of bytes pushed.
 *
 * @param jit	Code writer.
 * @param pEnc	Parameter description (flags, size and offset are read).
 */
inline void Write_PushFloat(JitWriter *jit, const PassEncode *pEnc)
{
	if (pEnc->info.flags & PASSFLAG_BYVAL)
	{
		switch (pEnc->info.size)
		{
		case 4:
			{
				//fld DWORD PTR [ebx+<offset>]
				//push reg
				//fstp DWORD PTR [esp]
				/* Test for zero first: 0 also satisfies the Disp8 check, which would
				 * otherwise make the displacement-free form unreachable. */
				if (!pEnc->offset)
				{
					IA32_Fld_Mem32(jit, REG_EBX);
				} else if (pEnc->offset < SCHAR_MAX) {
					IA32_Fld_Mem32_Disp8(jit, REG_EBX, (jit_int8_t)pEnc->offset);
				} else {
					IA32_Fld_Mem32_Disp32(jit, REG_EBX, pEnc->offset);
				}
				/* The pushed register value is irrelevant; the push only reserves 4 bytes */
				IA32_Push_Reg(jit, _DecodeRegister3(g_RegDecoder++));
				IA32_Fstp_Mem32_ESP(jit);
				g_StackUsage += 4;
				break;
			}
		case 8:
			{
				//fld QWORD PTR [ebx+<offset>]
				//sub esp, 8
				//fstp QWORD PTR [esp]
				if (!pEnc->offset)
				{
					IA32_Fld_Mem64(jit, REG_EBX);
				} else if (pEnc->offset < SCHAR_MAX) {
					IA32_Fld_Mem64_Disp8(jit, REG_EBX, (jit_int8_t)pEnc->offset);
				} else {
					IA32_Fld_Mem64_Disp32(jit, REG_EBX, pEnc->offset);
				}
				IA32_Sub_Rm_Imm8(jit, REG_ESP, 8, MOD_REG);
				IA32_Fstp_Mem64_ESP(jit);
				g_StackUsage += 8;
				break;
			}
		}
	} else if (pEnc->info.flags & PASSFLAG_BYREF) {
		//lea reg, [ebx+<offset>]
		//push reg
		if (!pEnc->offset)
		{
			/* Address is EBX itself; no lea needed */
			IA32_Push_Reg(jit, REG_EBX);
			g_StackUsage += 4;
			return;
		}
		jit_uint8_t reg = _DecodeRegister3(g_RegDecoder++);
		if (pEnc->offset < SCHAR_MAX)
		{
			IA32_Lea_DispRegImm8(jit, reg, REG_EBX, (jit_int8_t)pEnc->offset);
		} else {
			IA32_Lea_DispRegImm32(jit, reg, REG_EBX, pEnc->offset);
		}
		IA32_Push_Reg(jit, reg);
		g_StackUsage += 4;
	}
}
/**
 * Emits code that passes one object parameter.
 *
 * By-value objects are copied from [ebx + pEnc->offset] into stack space
 * reserved with "sub esp, <size>", using rep movsd for whole dwords and
 * rep movsb for the remaining 1-3 bytes. On POSIX builds, by-value objects
 * flagged PASSFLAG_ODTOR take the by-reference path instead. By-reference
 * objects push the address ebx + offset.
 *
 * g_StackUsage is increased by the object size (by value) or 4 (by reference).
 *
 * @param jit	Code writer.
 * @param pEnc	Parameter description (flags, size and offset are read).
 */
inline void Write_PushObject(JitWriter *jit, const PassEncode *pEnc)
{
	if (pEnc->info.flags & PASSFLAG_BYVAL)
	{
#ifdef PLATFORM_POSIX
		if (pEnc->info.flags & PASSFLAG_ODTOR)
		{
			goto push_byref;
		}
#endif
		jit_uint32_t dwords = pEnc->info.size >> 2;
		jit_uint32_t bytes = pEnc->info.size & 0x3;

		//sub esp, <size>
		//cld
		//push edi
		//push esi
		//lea edi, [esp+8]
		//lea esi, [ebx+<offset>]
		//if dwords
		// mov ecx, <dwords>
		// rep movsd
		//if bytes
		// mov ecx, <bytes>
		// rep movsb
		//pop esi
		//pop edi
		if (pEnc->info.size < SCHAR_MAX)
		{
			IA32_Sub_Rm_Imm8(jit, REG_ESP, (jit_int8_t)pEnc->info.size, MOD_REG);
		} else {
			IA32_Sub_Rm_Imm32(jit, REG_ESP, pEnc->info.size, MOD_REG);
		}
		IA32_Cld(jit);

		/* EDI/ESI are borrowed for the string copy; +8 skips the two saved registers */
		IA32_Push_Reg(jit, REG_EDI);
		IA32_Push_Reg(jit, REG_ESI);
		IA32_Lea_Reg_DispRegMultImm8(jit, REG_EDI, REG_NOIDX, REG_ESP, NOSCALE, 8);

		/* Test for zero first: 0 also satisfies the Disp8 check, which would
		 * otherwise make the plain register move unreachable. */
		if (!pEnc->offset)
		{
			IA32_Mov_Reg_Rm(jit, REG_ESI, REG_EBX, MOD_REG);
		} else if (pEnc->offset < SCHAR_MAX) {
			IA32_Lea_DispRegImm8(jit, REG_ESI, REG_EBX, (jit_int8_t)pEnc->offset);
		} else {
			IA32_Lea_DispRegImm32(jit, REG_ESI, REG_EBX, pEnc->offset);
		}

		if (dwords)
		{
			IA32_Mov_Reg_Imm32(jit, REG_ECX, dwords);
			IA32_Rep(jit);
			IA32_Movsd(jit);
		}
		if (bytes)
		{
			IA32_Mov_Reg_Imm32(jit, REG_ECX, bytes);
			IA32_Rep(jit);
			IA32_Movsb(jit);
		}

		IA32_Pop_Reg(jit, REG_ESI);
		IA32_Pop_Reg(jit, REG_EDI);
		g_StackUsage += pEnc->info.size;
	} else if (pEnc->info.flags & PASSFLAG_BYREF) {
#ifdef PLATFORM_POSIX
push_byref:
#endif
		if (!pEnc->offset)
		{
			/* Address is EBX itself; no lea needed */
			IA32_Push_Reg(jit, REG_EBX);
			g_StackUsage += 4;
			return;
		}

		//lea reg, [ebx+<offset>]
		//push reg
		jit_uint8_t reg = _DecodeRegister3(g_RegDecoder++);
		if (pEnc->offset < SCHAR_MAX)
		{
			IA32_Lea_DispRegImm8(jit, reg, REG_EBX, (jit_int8_t)pEnc->offset);
		} else {
			IA32_Lea_DispRegImm32(jit, reg, REG_EBX, pEnc->offset);
		}
		IA32_Push_Reg(jit, reg);
		g_StackUsage += 4;
	}
}
/**
 * Emits code that hands the object pointer stored at [ebx] to the callee.
 *
 * POSIX builds push it as a stack argument (and count 4 bytes in
 * g_StackUsage); Windows builds load it into ECX. If neither platform
 * macro is defined, nothing is emitted.
 *
 * @param jit	Code writer.
 */
inline void Write_PushThisPtr(JitWriter *jit)
{
#ifdef PLATFORM_POSIX
	/* mov <scratch>, [ebx] ; push <scratch> */
	jit_uint8_t scratch = _DecodeRegister3(g_RegDecoder++);

	IA32_Mov_Reg_Rm(jit, scratch, REG_EBX, MOD_MEM_REG);
	IA32_Push_Reg(jit, scratch);

	g_StackUsage += 4;
#elif defined PLATFORM_WINDOWS
	/* mov ecx, [ebx] */
	IA32_Mov_Reg_Rm(jit, REG_ECX, REG_EBX, MOD_MEM_REG);
#endif
}
/**
 * Emits "push edi", passing the return buffer pointer held in EDI to the
 * callee as a stack argument. g_StackUsage is not adjusted here.
 *
 * @param jit	Code writer.
 */
inline void Write_PushRetBuffer(JitWriter *jit)
{
	/* push edi */
	IA32_Push_Reg(jit, REG_EDI);
}
/**
 * Emits the actual call instruction.
 *
 * FuncAddr_Direct emits a relative call to pWrapper->m_Addrs[ADDR_CALLEE].
 * FuncAddr_VTable loads the object pointer from [ebx], reads the vtable
 * pointer at (thisOffs + vtblOffs) inside the object, fetches entry
 * vtblIdx (4 bytes per entry) and calls through EDX. Any other method
 * emits nothing.
 *
 * @param jit		Code writer.
 * @param method	How the callee address is obtained.
 * @param pWrapper	Wrapper supplying the callee address or vtable info.
 */
inline void Write_CallFunction(JitWriter *jit, FuncAddrMethod method, CallWrapper *pWrapper)
{
	if (method == FuncAddr_Direct)
	{
		//call <addr>
		/* Emit with a dummy target, then patch in the real displacement */
		jitoffs_t call = IA32_Call_Imm32(jit, 0);
		IA32_Write_Jump32_Abs(jit, call, pWrapper->m_Addrs[ADDR_CALLEE]);
	} else if (method == FuncAddr_VTable) {
		//*(this + thisOffs + vtblOffs)[vtblIdx]
		//mov edx, [ebx]
		//mov eax, [edx+<thisOffs>+<vtblOffs>]
		//mov edx, [eax+<vtblIdx>*4]
		//call edx
		jit_uint32_t total_offs = pWrapper->m_VtInfo.thisOffs + pWrapper->m_VtInfo.vtblOffs;
		jit_uint32_t vfunc_pos = pWrapper->m_VtInfo.vtblIdx * 4;

		IA32_Mov_Reg_Rm(jit, REG_EDX, REG_EBX, MOD_MEM_REG);

		/* Test for zero first: 0 also satisfies the Disp8 check, which would
		 * otherwise make the displacement-free form unreachable. */
		if (!total_offs)
		{
			IA32_Mov_Reg_Rm(jit, REG_EAX, REG_EDX, MOD_MEM_REG);
		} else if (total_offs < SCHAR_MAX) {
			IA32_Mov_Reg_Rm_Disp8(jit, REG_EAX, REG_EDX, (jit_int8_t)total_offs);
		} else {
			IA32_Mov_Reg_Rm_Disp32(jit, REG_EAX, REG_EDX, total_offs);
		}

		if (!vfunc_pos)
		{
			IA32_Mov_Reg_Rm(jit, REG_EDX, REG_EAX, MOD_MEM_REG);
		} else if (vfunc_pos < SCHAR_MAX) {
			IA32_Mov_Reg_Rm_Disp8(jit, REG_EDX, REG_EAX, (jit_int8_t)vfunc_pos);
		} else {
			IA32_Mov_Reg_Rm_Disp32(jit, REG_EDX, REG_EAX, vfunc_pos);
		}

		IA32_Call_Reg(jit, REG_EDX);
	}
}
/**
 * Emits "add esp, <value>" to discard pushed arguments, choosing the
 * 8-bit immediate form for values below SCHAR_MAX and the 32-bit form
 * otherwise.
 *
 * @param jit	Code writer.
 * @param value	Number of bytes to add to ESP.
 */
inline void Write_RectifyStack(JitWriter *jit, jit_uint32_t value)
{
	if (value >= SCHAR_MAX)
	{
		/* Too large for the short encoding */
		IA32_Add_Rm_Imm32(jit, REG_ESP, value, MOD_REG);
		return;
	}

	IA32_Add_Rm_Imm8(jit, REG_ESP, (jit_int8_t)value, MOD_REG);
}
/**
 * Emits code that stores the callee's return value into the buffer
 * addressed by EDI.
 *
 * Float returns of 4 or 8 bytes are popped from the FPU stack with fstp.
 * All other return types are stored from AL / AX / EAX / EDX:EAX for
 * sizes 1 / 2 / 4 / 8. Any other size emits nothing.
 *
 * @param jit	Code writer.
 * @param pRet	Return value description (type and size are read).
 */
inline void Write_MovRet2Buf(JitWriter *jit, const PassInfo *pRet)
{
	if (pRet->type == PassType_Float)
	{
		if (pRet->size == 4)
		{
			/* fstp DWORD PTR [edi] */
			IA32_Fstp_Mem32(jit, REG_EDI);
		}
		else if (pRet->size == 8)
		{
			/* fstp QWORD PTR [edi] */
			IA32_Fstp_Mem64(jit, REG_EDI);
		}
		return;
	}

	if (pRet->size == 1)
	{
		/* mov BYTE PTR [edi], al */
		IA32_Mov_Rm8_Reg8(jit, REG_EDI, REG_EAX, MOD_MEM_REG);
	}
	else if (pRet->size == 2)
	{
		/* mov WORD PTR [edi], ax -- operand-size prefix turns the dword store into a word store */
		jit->write_ubyte(IA32_16BIT_PREFIX);
		IA32_Mov_Rm_Reg(jit, REG_EDI, REG_EAX, MOD_MEM_REG);
	}
	else if (pRet->size == 4 || pRet->size == 8)
	{
		/* mov DWORD PTR [edi], eax */
		IA32_Mov_Rm_Reg(jit, REG_EDI, REG_EAX, MOD_MEM_REG);
		if (pRet->size == 8)
		{
			/* mov DWORD PTR [edi+4], edx */
			IA32_Mov_Rm_Reg_Disp8(jit, REG_EDI, REG_EDX, 4);
		}
	}
}
/******************************
* Assembly Compiler Function *
******************************/
/**
 * Generates the native call thunk for a wrapper.
 *
 * The code is emitted twice. The first pass runs with no output buffer
 * (writer.outbase == NULL) and only measures the code size and the stack
 * bytes pushed. Executable memory is then allocated, its address is stored
 * in pWrapper->m_Addrs[ADDR_CODEBASE], the stack padding is derived from
 * the measured usage, and the second pass writes the real code.
 *
 * If the executable allocation fails, ADDR_CODEBASE is left NULL and the
 * function returns without generating code.
 *
 * @param pWrapper	Wrapper describing the callee (convention, parameters, return type).
 * @param method	How the callee address is obtained (direct or via vtable).
 */
void JIT_Compile(CallWrapper *pWrapper, FuncAddrMethod method)
{
	JitWriter writer;
	JitWriter *jit = &writer;
	jit_uint32_t CodeSize = 0;
	bool Needs_Retbuf = false;
	CallConvention Convention = pWrapper->GetCallConvention();
	jit_uint32_t ParamCount = pWrapper->GetParamCount();
	const PassInfo *pRet = pWrapper->GetReturnInfo();
	bool hasParams = (ParamCount || Convention == CallConv_ThisCall);

	g_StackUsage = 0;
	writer.outbase = NULL;
	writer.outptr = NULL;

	for (;;)
	{
		/* Write function prologue */
		Write_Execution_Prologue(jit, (pRet) ? false : true, hasParams);

		/* Write parameter push code, last parameter first */
		for (jit_int32_t i=ParamCount-1; i>=0; i--)
		{
			const PassEncode *pEnc = pWrapper->GetParamInfo(i);
			switch (pEnc->info.type)
			{
			case PassType_Basic:
				{
					Write_PushPOD(jit, pEnc);
					break;
				}
			case PassType_Float:
				{
					Write_PushFloat(jit, pEnc);
					break;
				}
			case PassType_Object:
				{
					Write_PushObject(jit, pEnc);
					break;
				}
			}
		}

		/* Prepare the this ptr if applicable */
		if (Convention == CallConv_ThisCall)
		{
			Write_PushThisPtr(jit);
		}

		/* Decide whether a hidden return buffer is needed (never for void functions) */
		if (pRet && (pRet->type == PassType_Object) && (pRet->flags & PASSFLAG_BYVAL))
		{
#ifdef PLATFORM_POSIX
			Needs_Retbuf = true;
#elif defined PLATFORM_WINDOWS
			/* The flag mask must be parenthesized: '&' binds tighter than '|', so the
			 * unparenthesized form was always non-zero and forced a return buffer for
			 * every cdecl object return.
			 * NOTE(review): with the mask fixed, small cdecl objects without these flags
			 * are stored via Write_MovRet2Buf, which only handles sizes 1/2/4/8 --
			 * confirm the intended handling of other sizes <= 8. */
			if ((Convention == CallConv_ThisCall) ||
				((Convention == CallConv_Cdecl) &&
				((pRet->size > 8) || (pRet->flags & (PASSFLAG_ODTOR|PASSFLAG_OCTOR|PASSFLAG_OASSIGNOP)))))
			{
				Needs_Retbuf = true;
			}
#endif
		}

		/* Prepare the return buffer in case we are returning objects by value. */
		if (Needs_Retbuf)
		{
			Write_PushRetBuffer(jit);
		}

		/* Write the calling code */
		Write_CallFunction(jit, method, pWrapper);

		/* Clean up the calling stack */
#ifdef PLATFORM_WINDOWS
		if ((ParamCount || Needs_Retbuf) && (Convention == CallConv_Cdecl))
		{
			/* Pop all parameters from the stack + hidden return pointer */
			jit_uint32_t total = (Needs_Retbuf) ? g_StackUsage + sizeof(void *) : g_StackUsage;
			Write_RectifyStack(jit, total);
		}
#elif defined PLATFORM_POSIX
		if (hasParams)
		{
			/* Pop all parameters from the stack */
			Write_RectifyStack(jit, g_StackUsage);
		}
#endif

		/* Copy the return type to the return buffer if the function is not void */
		if (pRet && !Needs_Retbuf)
		{
			Write_MovRet2Buf(jit, pRet);
		}

		/* Write Function Epilogue */
		Write_Function_Epilogue(jit, (pRet) ? false : true, hasParams);

		if (writer.outbase != NULL)
		{
			/* Second pass finished: real code has been written */
			break;
		}

		/* First pass finished: allocate the buffer and set up the second pass */
		CodeSize = writer.get_outputpos();
		writer.outbase = (jitcode_t)g_SPEngine->ExecAlloc(CodeSize);
		writer.outptr = writer.outbase;
		pWrapper->m_Addrs[ADDR_CODEBASE] = writer.outbase;
		if (writer.outbase == NULL)
		{
			/* Allocation failed; retrying would repeat the sizing pass forever */
			return;
		}

		/* Bytes needed to bring the pushed arguments up to the next 16-byte step */
		g_StackAlign = (g_StackUsage) ? ((g_StackUsage & 0xFFFFFFF0) + 16) - g_StackUsage : 0;
		g_StackUsage = 0;
		g_RegDecoder = 0;
		Needs_Retbuf = false;
	}
}