1) JIT compilation/optimization now occurs per-function, and only when functions are first used. We're now officially a whole-method JIT rather than an AOT compiler (albiet, still a simple JIT). This has two implications: Functions are now much better abstracted internally, and loading a plugin is now much less expensive. If a function contains calls to other functions, THOSE functions are only compiled when they're invoked as well. 2) I've removed debug mode. We always show full backtraces now, as there was a very cheap way to implement this which really cleaned up everything. This is great for a number of reasons -- there's less code, the JIT is better designed, we don't need to relocate debug tables, and best of all we no longer have to tell users to enable debug mode at their own expense. --HG-- extra : convert_revision : svn%3A39bc706e-5318-0410-9160-8a85361fbb7c/trunk%402459
		
			
				
	
	
		
			707 lines
		
	
	
		
			22 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
			
		
		
	
	
			707 lines
		
	
	
		
			22 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
| /**
 | |
|  * vim: set ts=4 :
 | |
|  * =============================================================================
 | |
|  * SourceMod
 | |
|  * Copyright (C) 2004-2008 AlliedModders LLC.  All rights reserved.
 | |
|  * =============================================================================
 | |
|  *
 | |
|  * This program is free software; you can redistribute it and/or modify it under
 | |
|  * the terms of the GNU General Public License, version 3.0, as published by the
 | |
|  * Free Software Foundation.
 | |
|  * 
 | |
|  * This program is distributed in the hope that it will be useful, but WITHOUT
 | |
|  * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
 | |
|  * FOR A PARTICULAR PURPOSE.  See the GNU General Public License for more
 | |
|  * details.
 | |
|  *
 | |
|  * You should have received a copy of the GNU General Public License along with
 | |
|  * this program.  If not, see <http://www.gnu.org/licenses/>.
 | |
|  *
 | |
|  * As a special exception, AlliedModders LLC gives you permission to link the
 | |
|  * code of this program (as well as its derivative works) to "Half-Life 2," the
 | |
|  * "Source Engine," the "SourcePawn JIT," and any Game MODs that run on software
 | |
|  * by the Valve Corporation.  You must obey the GNU General Public License in
 | |
|  * all respects for all other code used.  Additionally, AlliedModders LLC grants
 | |
|  * this exception to all derivative works.  AlliedModders LLC defines further
 | |
|  * exceptions, found in LICENSE.txt (as of this writing, version JULY-31-2007),
 | |
|  * or <http://www.sourcemod.net/license.php>.
 | |
|  *
 | |
|  * Version: $Id$
 | |
|  */
 | |
| 
 | |
| #include <limits.h>
 | |
| #include <string.h>
 | |
| #include <malloc.h>
 | |
| #include "jit_x86.h"
 | |
| #include "opcode_helpers.h"
 | |
| #include "x86_macros.h"
 | |
| 
 | |
| jitoffs_t Write_Execute_Function(JitWriter *jit)
 | |
| {
 | |
| 	/** 
 | |
| 	 * The variables we're passed in:
 | |
| 	 *  void *vars[], void *entry_func
 | |
| 	 */
 | |
| 
 | |
| 	/**
 | |
| 	 * !NOTE!
 | |
| 	 * Currently, we do not accept ctx->frm as the new frame pointer.
 | |
| 	 * Instead, we copy the frame from the stack pointer.
 | |
| 	 * This is because we do not support resuming or sleeping!
 | |
| 	 */
 | |
| 
 | |
| 	//push ebp
 | |
| 	//mov ebp, esp
 | |
| 	IA32_Push_Reg(jit, REG_EBP);
 | |
| 	IA32_Mov_Reg_Rm(jit, REG_EBP, REG_ESP, MOD_REG);
 | |
| 
 | |
| 	//push esi
 | |
| 	//push edi
 | |
| 	//push ebx
 | |
| 	IA32_Push_Reg(jit, REG_ESI);
 | |
| 	IA32_Push_Reg(jit, REG_EDI);
 | |
| 	IA32_Push_Reg(jit, REG_EBX);
 | |
| 
 | |
| 	/* Prep us for doing the real work */
 | |
| 	//mov esi, [ebp+param0]			;get vars
 | |
| 	//mov ecx, [ebp+param1]			;get entry addr
 | |
| 	//mov eax, [esi+MEMORY]			;get memory base
 | |
| 	//mov edx, [esi+CONTEXT]		;get context
 | |
| 	IA32_Mov_Reg_Rm_Disp8(jit, REG_ESI, REG_EBP, 8 + 4*0);
 | |
| 	IA32_Mov_Reg_Rm_Disp8(jit, REG_ECX, REG_EBP, 8 + 4*1);
 | |
| 	IA32_Mov_Reg_Rm_Disp8(jit, REG_EAX, REG_ESI, AMX_INFO_MEMORY);
 | |
| 	IA32_Mov_Reg_Rm_Disp8(jit, REG_EDX, REG_ESI, AMX_INFO_CONTEXT);
 | |
| 
 | |
| 	/* Set up run-time registers */
 | |
| 	//mov edi, [edx+SP]				;non-reloc SP
 | |
| 	//add edi, eax					;reloc SP
 | |
| 	//mov ebp, eax					;DAT
 | |
| 	//mov ebx, edi					;reloc FRM
 | |
| 	//mov [esi+NSTACK], esp			;save ESP
 | |
| 	IA32_Mov_Reg_Rm_Disp8(jit, REG_EDI, REG_EDX, offsetof(sp_context_t, sp));
 | |
| 	IA32_Add_Rm_Reg(jit, REG_EDI, REG_EAX, MOD_REG);
 | |
| 	IA32_Mov_Reg_Rm(jit, REG_EBP, REG_EAX, MOD_REG);
 | |
| 	IA32_Mov_Reg_Rm(jit, REG_EBX, REG_EDI, MOD_REG);
 | |
| 	IA32_Mov_Rm_Reg_Disp8(jit, REG_ESI, REG_ESP, AMX_INFO_NSTACK);
 | |
| 
 | |
| 	/* by now, everything is set up, so we can call into the plugin */
 | |
| 	//call ecx
 | |
| 	IA32_Call_Reg(jit, REG_ECX);
 | |
| 
 | |
| 	/* if the code flow gets to here, there was a normal return */
 | |
| 	//mov ecx, [esi+RETVAL]			;get retval pointer
 | |
| 	//mov [ecx], eax				;store retval from PRI
 | |
| 	//mov eax, SP_ERROR_NONE		;set no error
 | |
| 	IA32_Mov_Reg_Rm_Disp8(jit, REG_ECX, AMX_REG_INFO, AMX_INFO_RETVAL);
 | |
| 	IA32_Mov_Rm_Reg(jit, REG_ECX, AMX_REG_PRI, MOD_MEM_REG);
 | |
| 	IA32_Mov_Reg_Imm32(jit, REG_EAX, SP_ERROR_NONE);
 | |
| 
 | |
| 	/* save where error checking/halting functions should go to */
 | |
| 	jitoffs_t offs_return = jit->get_outputpos();
 | |
| 	//mov esp, [esi+NSTACK]			;restore stack pointer
 | |
| 	IA32_Mov_Reg_Rm_Disp8(jit, REG_ESP, REG_ESI, AMX_INFO_NSTACK);
 | |
| 
 | |
| 	/* Restore SP */
 | |
| 	//mov ecx, [esi+CONTEXT]
 | |
| 	//sub edi, ebp
 | |
| 	//mov [ecx+SP], edi
 | |
| 	IA32_Mov_Reg_Rm_Disp8(jit, REG_ECX, REG_ESI, AMX_INFO_CONTEXT);
 | |
| 	IA32_Sub_Reg_Rm(jit, REG_EDI, REG_EBP, MOD_REG);
 | |
| 	IA32_Mov_Rm_Reg_Disp8(jit, REG_ECX, REG_EDI, offsetof(sp_context_t, sp));
 | |
| 
 | |
| 	//pop ebx
 | |
| 	//pop edi
 | |
| 	//pop esi
 | |
| 	//pop ebp
 | |
| 	//ret
 | |
| 	IA32_Pop_Reg(jit, REG_EBX);
 | |
| 	IA32_Pop_Reg(jit, REG_EDI);
 | |
| 	IA32_Pop_Reg(jit, REG_ESI);
 | |
| 	IA32_Pop_Reg(jit, REG_EBP);
 | |
| 	IA32_Return(jit);
 | |
| 
 | |
| 	return offs_return;
 | |
| }
 | |
| 
 | |
| void Write_GetError(JitWriter *jit)
 | |
| {
 | |
| 	//mov eax, [esi+info.context]
 | |
| 	//mov eax, [eax+ctx.error]
 | |
| 	//jmp [jit_return]
 | |
| 	IA32_Mov_Reg_Rm_Disp8(jit, REG_EAX, AMX_REG_INFO, AMX_INFO_CONTEXT);
 | |
| 	IA32_Mov_Reg_Rm_Disp8(jit, REG_EAX, REG_EAX, offsetof(sp_context_t, n_err));
 | |
| 	IA32_Jump_Imm32_Abs(jit, g_Jit.GetReturnPoint());
 | |
| }
 | |
| 
 | |
| void Write_SetError(JitWriter *jit, int error)
 | |
| {
 | |
| 	//mov eax, <error>
 | |
| 	//jmp [jit_return]
 | |
| 	IA32_Mov_Reg_Imm32(jit, REG_EAX, error);
 | |
| 	IA32_Jump_Imm32_Abs(jit, g_Jit.GetReturnPoint());
 | |
| }
 | |
| 
 | |
| void Write_Check_DivZero(JitWriter *jit, jit_uint8_t reg)
 | |
| {
 | |
| 	//test reg, reg
 | |
| 	//jz :error
 | |
| 	IA32_Test_Rm_Reg(jit, reg, reg, MOD_REG);
 | |
| 	IA32_Jump_Cond_Imm32_Rel(jit, CC_Z, ((CompData *)jit->data)->jit_error_divzero);
 | |
| }
 | |
| 
 | |
| void Write_CheckHeap_Min(JitWriter *jit)
 | |
| {
 | |
| 	/* Check if the stack went beyond the heap low.
 | |
| 	 * This usually means there was a compiler error.
 | |
| 	 * NOTE: Special optimization here.
 | |
| 	 * The heap low is always known ahead of time! :)
 | |
| 	 */
 | |
| 	CompData *data = (CompData *)jit->data;
 | |
| 	//cmp [esi+info.heap], <heaplow>
 | |
| 	//jb :error
 | |
| 	IA32_Cmp_Rm_Imm32_Disp8(jit, AMX_REG_INFO, AMX_INFO_HEAP, data->plugin->data_size);
 | |
| 	IA32_Jump_Cond_Imm32_Rel(jit, CC_B, data->jit_error_heapmin);
 | |
| }
 | |
| 
 | |
| void Write_CheckHeap_Low(JitWriter *jit)
 | |
| {
 | |
| 	/* Check if the heap is trying to grow beyond the stack.
 | |
| 	 */
 | |
| 	//mov ecx, [esi+info.heap]
 | |
| 	//lea ecx, [ebp+ecx+STACK_MARGIN]
 | |
| 	//cmp ecx, edi
 | |
| 	//ja :error		; I think this is right
 | |
| 	IA32_Mov_Reg_Rm_Disp8(jit, AMX_REG_TMP, AMX_REG_INFO, AMX_INFO_HEAP);
 | |
| 	IA32_Lea_Reg_DispRegMultImm8(jit, AMX_REG_TMP, AMX_REG_DAT, AMX_REG_TMP, NOSCALE, STACK_MARGIN);
 | |
| 	IA32_Cmp_Reg_Rm(jit, AMX_REG_TMP, AMX_REG_STK, MOD_REG);
 | |
| 	IA32_Jump_Cond_Imm32_Rel(jit, CC_A, ((CompData *)jit->data)->jit_error_heaplow);
 | |
| }
 | |
| 
 | |
| void Write_CheckStack_Min(JitWriter *jit)
 | |
| {
 | |
| 	/* Check if the stack went beyond the stack top
 | |
| 	 * This usually means there was a compiler error.
 | |
| 	 */
 | |
| 	//cmp edi, [esi+info.stacktop]
 | |
| 	//jae :error
 | |
| 	IA32_Cmp_Reg_Rm_Disp8(jit, AMX_REG_STK, AMX_REG_INFO, AMX_INFO_STACKTOP);
 | |
| 	IA32_Jump_Cond_Imm32_Rel(jit, CC_AE, ((CompData *)jit->data)->jit_error_stackmin);
 | |
| }
 | |
| 
 | |
| void Write_CheckStack_Low(JitWriter *jit)
 | |
| {
 | |
| 	/* Check if the stack went beyond the heap boundary.
 | |
| 	 * Unfortunately this one isn't as quick as the other check.
 | |
| 	 * The stack margin check is important for sysreq.n having space.
 | |
| 	 */
 | |
| 	//mov ecx, [esi+info.heap]
 | |
| 	//lea ecx, [ebp+ecx+STACK_MARGIN]
 | |
| 	//cmp edi, ecx
 | |
| 	//jb :error		; I think this is right
 | |
| 	IA32_Mov_Reg_Rm_Disp8(jit, AMX_REG_TMP, AMX_REG_INFO, AMX_INFO_HEAP);
 | |
| 	IA32_Lea_Reg_DispRegMultImm8(jit, AMX_REG_TMP, AMX_REG_DAT, AMX_REG_TMP, NOSCALE, STACK_MARGIN);
 | |
| 	IA32_Cmp_Reg_Rm(jit, AMX_REG_STK, AMX_REG_TMP, MOD_REG);
 | |
| 	IA32_Jump_Cond_Imm32_Rel(jit, CC_B, ((CompData *)jit->data)->jit_error_stacklow);
 | |
| }
 | |
| 
 | |
| void Write_Check_VerifyAddr(JitWriter *jit, jit_uint8_t reg)
 | |
| {
 | |
| 	/* :TODO: Should this be checking for below heaplow?
 | |
| 	 * The old JIT did not.
 | |
| 	 */
 | |
| 
 | |
| 	/** 
 | |
| 	 * :TODO: If we can't find a nicer way of doing this,
 | |
| 	 *  then scrap it on high optimizations.  The second portion is not needed at all!
 | |
| 	 */
 | |
| 
 | |
| 	/* Part 1: Check if we're in the memory bounds */
 | |
| 	//cmp <reg>, <stpu>
 | |
| 	//jae :error
 | |
| 	IA32_Cmp_Rm_Imm32(jit, MOD_REG, reg, ((CompData *)jit->data)->plugin->mem_size);
 | |
| 	IA32_Jump_Cond_Imm32_Rel(jit, CC_AE, ((CompData *)jit->data)->jit_error_memaccess);
 | |
| 
 | |
| 	/* Part 2: Check if we're in the invalid region between HP and SP */
 | |
| 	jitoffs_t jmp;
 | |
| 	//cmp <reg>, [esi+info.heap]
 | |
| 	//jb :continue
 | |
| 	//lea ecx, [ebp+<reg>]
 | |
| 	//cmp edi, ecx
 | |
| 	//jb :error
 | |
| 	//:continue
 | |
| 	IA32_Cmp_Reg_Rm_Disp8(jit, reg, AMX_REG_INFO, AMX_INFO_HEAP);
 | |
| 	jmp = IA32_Jump_Cond_Imm8(jit, CC_B, 0);
 | |
| 	IA32_Lea_Reg_DispRegMultImm8(jit, AMX_REG_TMP, AMX_REG_DAT, reg, NOSCALE, 0);
 | |
| 	IA32_Cmp_Reg_Rm(jit, AMX_REG_TMP, AMX_REG_STK, MOD_REG);
 | |
| 	IA32_Jump_Cond_Imm32_Rel(jit, CC_B, ((CompData *)jit->data)->jit_error_memaccess);
 | |
| 	IA32_Send_Jump8_Here(jit, jmp);
 | |
| }
 | |
| 
 | |
| void Macro_PushN_Addr(JitWriter *jit, int i)
 | |
| {
 | |
| 	//push eax
 | |
| 	//mov eax, [esi+frm]
 | |
| 	//loop i times:
 | |
| 	// lea ecx, [eax+<val>]
 | |
| 	// mov [edi-4*i], ecx
 | |
| 	//sub edi, 4*N
 | |
| 	//pop eax
 | |
| 
 | |
| 	cell_t val;
 | |
| 	int n = 1;
 | |
| 	IA32_Push_Reg(jit, AMX_REG_PRI);
 | |
| 	IA32_Mov_Reg_Rm(jit, AMX_REG_PRI, AMX_REG_INFO, MOD_MEM_REG);
 | |
| 	do
 | |
| 	{
 | |
| 		val = jit->read_cell();
 | |
| 		if (val <= SCHAR_MAX && val >= SCHAR_MIN)
 | |
| 			IA32_Lea_DispRegImm8(jit, AMX_REG_TMP, AMX_REG_PRI, (jit_int8_t)val);
 | |
| 		else
 | |
| 			IA32_Lea_DispRegImm32(jit, AMX_REG_TMP, AMX_REG_PRI, val);
 | |
| 		IA32_Mov_Rm_Reg_Disp8(jit, AMX_REG_STK, AMX_REG_TMP, -4*n);
 | |
| 	} while (n++ < i);
 | |
| 	IA32_Sub_Rm_Imm8(jit, AMX_REG_STK, 4*i, MOD_REG);
 | |
| 	IA32_Pop_Reg(jit, AMX_REG_PRI);
 | |
| }
 | |
| 
 | |
| void Macro_PushN_S(JitWriter *jit, int i)
 | |
| {
 | |
| 	//loop i times:
 | |
| 	// mov ecx, [ebx+<val>]
 | |
| 	// mov [edi-4*i], ecx
 | |
| 	//sub edi, 4*N
 | |
| 
 | |
| 	cell_t val;
 | |
| 	int n = 1;
 | |
| 	do 
 | |
| 	{
 | |
| 		val = jit->read_cell();
 | |
| 		if (val <= SCHAR_MAX && val >= SCHAR_MIN)
 | |
| 			IA32_Mov_Reg_Rm_Disp8(jit, AMX_REG_TMP, AMX_REG_FRM, (jit_int8_t)val);
 | |
| 		else
 | |
| 			IA32_Mov_Reg_Rm_Disp32(jit, AMX_REG_TMP, AMX_REG_FRM, val);
 | |
| 		IA32_Mov_Rm_Reg_Disp8(jit, AMX_REG_STK, AMX_REG_TMP, -4*n);
 | |
| 	} while (n++ < i);
 | |
| 	IA32_Sub_Rm_Imm8(jit, AMX_REG_STK, 4*i, MOD_REG);
 | |
| }
 | |
| 
 | |
| void Macro_PushN_C(JitWriter *jit, int i)
 | |
| {
 | |
| 	//loop i times:
 | |
| 	// mov [edi-4*i], <val>
 | |
| 	//sub edi, 4*N
 | |
| 
 | |
| 	int n = 1;
 | |
| 	do 
 | |
| 	{
 | |
| 		IA32_Mov_Rm_Imm32_Disp8(jit, AMX_REG_STK, jit->read_cell(), -4*n);
 | |
| 	} while (n++ < i);
 | |
| 	IA32_Sub_Rm_Imm8(jit, AMX_REG_STK, 4*i, MOD_REG);
 | |
| }
 | |
| 
 | |
| void Macro_PushN(JitWriter *jit, int i)
 | |
| {
 | |
| 	//loop i times:
 | |
| 	// mov ecx, [ebp+<val>]
 | |
| 	// mov [edi-4*i], ecx
 | |
| 	//sub edi, 4*N
 | |
| 
 | |
| 	cell_t val;
 | |
| 	int n = 1;
 | |
| 	do 
 | |
| 	{
 | |
| 		val = jit->read_cell();
 | |
| 		if (val <= SCHAR_MAX && val >= SCHAR_MIN)
 | |
| 			IA32_Mov_Reg_Rm_Disp8(jit, AMX_REG_TMP, AMX_REG_DAT, (jit_int8_t)val);
 | |
| 		else
 | |
| 			IA32_Mov_Reg_Rm_Disp32(jit, AMX_REG_TMP, AMX_REG_DAT, val);
 | |
| 		IA32_Mov_Rm_Reg_Disp8(jit, AMX_REG_STK, AMX_REG_TMP, -4*n);
 | |
| 	} while (n++ < i);
 | |
| 	IA32_Sub_Rm_Imm8(jit, AMX_REG_STK, 4*i, MOD_REG);
 | |
| }
 | |
| 
 | |
| void WriteOp_Sysreq_C_Function(JitWriter *jit)
 | |
| {
 | |
| 	/* The small daddy of the big daddy of opcodes.
 | |
| 	 * ecx - native index
 | |
| 	 */
 | |
| 	CompData *data = (CompData *)jit->data;
 | |
| 
 | |
| 	/* save registers we will need */
 | |
| 	//push edx
 | |
| 	IA32_Push_Reg(jit, AMX_REG_ALT);
 | |
| 
 | |
| 	/* Align the stack to 16 bytes */
 | |
| 	//push ebx
 | |
| 	//mov ebx, esp
 | |
| 	//and esp, 0xFFFFFF0
 | |
| 	//sub esp, 4
 | |
| 	IA32_Push_Reg(jit, REG_EBX);
 | |
| 	IA32_Mov_Reg_Rm(jit, REG_EBX, REG_ESP, MOD_REG);
 | |
| 	IA32_And_Rm_Imm8(jit, REG_ESP, MOD_REG, -16);
 | |
| 	IA32_Sub_Rm_Imm8(jit, REG_ESP, 4, MOD_REG);
 | |
| 
 | |
| 	/* push some callback stuff */
 | |
| 	//push edi		; stack
 | |
| 	//push ecx		; native index
 | |
| 	IA32_Push_Reg(jit, AMX_REG_STK);
 | |
| 	IA32_Push_Reg(jit, REG_ECX);
 | |
| 
 | |
| 	/* Relocate stack, heap, frm information, then store back */
 | |
| 	//mov eax, [esi+context]
 | |
| 	//mov ecx, [esi+hea]
 | |
| 	//sub edi, ebp
 | |
| 	//mov [eax+hp], ecx
 | |
| 	//mov ecx, [esi]
 | |
| 	//mov [eax+sp], edi
 | |
| 	//mov [eax+frm], ecx
 | |
| 	IA32_Mov_Reg_Rm_Disp8(jit, REG_EAX, AMX_REG_INFO, AMX_INFO_CONTEXT);
 | |
| 	IA32_Mov_Reg_Rm_Disp8(jit, AMX_REG_TMP, AMX_REG_INFO, AMX_INFO_HEAP);
 | |
| 	IA32_Sub_Reg_Rm(jit, AMX_REG_STK, AMX_REG_DAT, MOD_REG);
 | |
| 	IA32_Mov_Rm_Reg_Disp8(jit, REG_EAX, AMX_REG_TMP, offsetof(sp_context_t, hp));
 | |
| 	IA32_Mov_Reg_Rm(jit, AMX_REG_TMP, AMX_INFO_FRM, MOD_MEM_REG);
 | |
| 	IA32_Mov_Rm_Reg_Disp8(jit, REG_EAX, AMX_REG_STK, offsetof(sp_context_t, sp));
 | |
| 	IA32_Mov_Rm_Reg_Disp8(jit, REG_EAX, AMX_REG_TMP, offsetof(sp_context_t, frm));
 | |
| 
 | |
| 	/* finally, push the last parameter and make the call */
 | |
| 	//push eax		; context
 | |
| 	//call NativeCallback
 | |
| 	IA32_Push_Reg(jit, REG_EAX);
 | |
| 	jitoffs_t call = IA32_Call_Imm32(jit, 0);
 | |
| 	IA32_Write_Jump32_Abs(jit, call, (void *)NativeCallback);
 | |
| 
 | |
| 	/* Test for error */
 | |
| 	//mov ecx, [esi+context]
 | |
| 	//cmp [ecx+err], 0
 | |
| 	//jnz :error
 | |
| 	IA32_Mov_Reg_Rm_Disp8(jit, AMX_REG_TMP, AMX_REG_INFO, AMX_INFO_CONTEXT);
 | |
| 	IA32_Cmp_Rm_Disp8_Imm8(jit, AMX_REG_TMP, offsetof(sp_context_t, n_err), 0);
 | |
| 	IA32_Jump_Cond_Imm32_Rel(jit, CC_NZ, data->jit_extern_error);
 | |
| 
 | |
| 	/* restore what we damaged */
 | |
| 	//mov esp, ebx
 | |
| 	//pop ebx
 | |
| 	//add edi, ebp
 | |
| 	//pop edx
 | |
| 	IA32_Mov_Reg_Rm(jit, REG_ESP, REG_EBX, MOD_REG);
 | |
| 	IA32_Pop_Reg(jit, REG_EBX);
 | |
| 	IA32_Add_Reg_Rm(jit, AMX_REG_STK, AMX_REG_DAT, MOD_REG);
 | |
| 	IA32_Pop_Reg(jit, AMX_REG_ALT);
 | |
| 
 | |
| 	//ret
 | |
| 	IA32_Return(jit);
 | |
| }
 | |
| 
 | |
| typedef struct array_creation_s
 | |
| {
 | |
| 	const cell_t *dim_list;				/* Dimension sizes */
 | |
| 	cell_t dim_count;					/* Number of dimensions */
 | |
| 	cell_t *data_offs;					/* Current offset AFTER the indirection vectors (data) */
 | |
| 	cell_t *base;						/* array base */
 | |
| } array_creation_t;
 | |
| 
 | |
| cell_t _GenerateArrayIndirectionVectors(array_creation_t *ar, int dim, cell_t cur_offs)
 | |
| {
 | |
| 	cell_t write_offs = cur_offs;
 | |
| 	cell_t *data_offs = ar->data_offs;
 | |
| 
 | |
| 	cur_offs += ar->dim_list[dim];
 | |
| 
 | |
| 	/**
 | |
| 	 * Dimension n-x where x > 2 will have sub-vectors.  
 | |
| 	 * Otherwise, we just need to reference the data section.
 | |
| 	 */
 | |
| 	if (ar->dim_count > 2 && dim < ar->dim_count - 2)
 | |
| 	{
 | |
| 		/**
 | |
| 		 * For each index at this dimension, write offstes to our sub-vectors.
 | |
| 		 * After we write one sub-vector, we generate its sub-vectors recursively.
 | |
| 		 * At the end, we're given the next offset we can use.
 | |
| 		 */
 | |
| 		for (int i = 0; i < ar->dim_list[dim]; i++)
 | |
| 		{
 | |
| 			ar->base[write_offs] = (cur_offs - write_offs) * sizeof(cell_t);
 | |
| 			write_offs++;
 | |
| 			cur_offs = _GenerateArrayIndirectionVectors(ar, dim + 1, cur_offs);
 | |
| 		}
 | |
| 	} else {
 | |
| 		/**
 | |
| 		 * In this section, there are no sub-vectors, we need to write offsets 
 | |
| 		 * to the data.  This is separate so the data stays in one big chunk.
 | |
| 		 * The data offset will increment by the size of the last dimension, 
 | |
| 		 * because that is where the data is finally computed as. 
 | |
| 		 */
 | |
| 		for (int i = 0; i < ar->dim_list[dim]; i++)
 | |
| 		{
 | |
| 			ar->base[write_offs] = (*data_offs - write_offs) * sizeof(cell_t);
 | |
| 			write_offs++;
 | |
| 			*data_offs = *data_offs + ar->dim_list[dim + 1];
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	return cur_offs;
 | |
| }
 | |
| 
 | |
| static cell_t calc_indirection(const array_creation_t *ar, cell_t dim)
 | |
| {
 | |
| 	cell_t size = ar->dim_list[dim];
 | |
| 
 | |
| 	if (dim < ar->dim_count - 2)
 | |
| 	{
 | |
| 		size += ar->dim_list[dim] * calc_indirection(ar, dim + 1);
 | |
| 	}
 | |
| 
 | |
| 	return size;
 | |
| }
 | |
| 
 | |
| void GenerateArrayIndirectionVectors(cell_t *arraybase, cell_t dims[], cell_t _dimcount, bool autozero)
 | |
| {
 | |
| 	array_creation_t ar;
 | |
| 	cell_t data_offs;
 | |
| 
 | |
| 	/* Reverse the dimensions */
 | |
| 	cell_t dim_list[sDIMEN_MAX];
 | |
| 	int cur_dim = 0;
 | |
| 	for (int i = _dimcount - 1; i >= 0; i--)
 | |
| 	{
 | |
| 		dim_list[cur_dim++] = dims[i];
 | |
| 	}
 | |
| 	
 | |
| 	ar.base = arraybase;
 | |
| 	ar.dim_list = dim_list;
 | |
| 	ar.dim_count = _dimcount;
 | |
| 	ar.data_offs = &data_offs;
 | |
| 
 | |
| 	data_offs = calc_indirection(&ar, 0);
 | |
| 
 | |
| 	_GenerateArrayIndirectionVectors(&ar, 0, 0);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * A few notes about this function.
 | |
|  * I was more concerned about efficient use of registers here, rather than 
 | |
|  *  fine-tuned optimization.  The reason is that the code is already complicated,
 | |
|  *  and it is very easy to mess up.
 | |
|  */
 | |
| void WriteIntrinsic_GenArray(JitWriter *jit)
 | |
| {
 | |
| 	jitoffs_t err1, err2;
 | |
| 
 | |
| 	/**
 | |
| 	 * save important values
 | |
| 	 */
 | |
| 	//push ebx
 | |
| 	//push eax
 | |
| 	//push edx
 | |
| 	//push ecx				;value is referenced on stack
 | |
| 	IA32_Push_Reg(jit, REG_EBX);
 | |
| 	IA32_Push_Reg(jit, REG_EAX);
 | |
| 	IA32_Push_Reg(jit, REG_EDX);
 | |
| 	IA32_Push_Reg(jit, REG_ECX);
 | |
| 
 | |
| 	/**
 | |
| 	 * Calculate how many cells will be needed.
 | |
| 	 */
 | |
| 	//mov edx, [edi]		;get last dimension's count
 | |
| 	//mov eax, 1			;position at second to last dimension
 | |
| 	//:loop
 | |
| 	//cmp eax, [esp]		;compare to # of params
 | |
| 	//jae :done				;end loop if done
 | |
| 	//mov ecx, [edi+eax*4]	;get dimension size
 | |
| 	//imul edx, ecx			;multiply by size
 | |
| 	//add eax, 1			;increment
 | |
| 	//add edx, ecx			;add size (indirection vector)
 | |
| 	//jmp :loop				;jump back
 | |
| 	//:done
 | |
| 	IA32_Mov_Reg_Rm(jit, REG_EDX, AMX_REG_STK, MOD_MEM_REG);
 | |
| 	IA32_Mov_Reg_Imm32(jit, REG_EAX, 1);
 | |
| 	jitoffs_t loop1 = jit->get_outputpos();
 | |
| 	IA32_Cmp_Reg_Rm_ESP(jit, REG_EAX);
 | |
| 	jitoffs_t done1 = IA32_Jump_Cond_Imm8(jit, CC_AE, 0);
 | |
| 	IA32_Mov_Reg_Rm_Disp_Reg(jit, REG_ECX, AMX_REG_STK, REG_EAX, SCALE4);
 | |
| 	IA32_IMul_Reg_Rm(jit, REG_EDX, REG_ECX, MOD_REG);
 | |
| 	IA32_Add_Rm_Imm8(jit, REG_EAX, 1, MOD_REG);
 | |
| 	IA32_Add_Reg_Rm(jit, REG_EDX, REG_ECX, MOD_REG);
 | |
| 	IA32_Write_Jump8(jit, IA32_Jump_Imm8(jit, loop1), loop1);
 | |
| 	IA32_Send_Jump8_Here(jit, done1);
 | |
| 
 | |
| 	/* Test if we have heap space for this */
 | |
| 	//mov eax, [esi+info.heap]	;get heap pointer
 | |
| 	//lea eax, [eax+edx*4]		;new heap pointer
 | |
| 	//cmp eax, [esi+info.datasz] ;compare to heap low
 | |
| 	//jbe :error				;die if we hit this (it should always be >)
 | |
| 	//add eax, ebp				;relocate to stack
 | |
| 	//cmp eax, edi				;die if above the stack pointer
 | |
| 	//jae :error
 | |
| 	IA32_Mov_Reg_Rm_Disp8(jit, REG_EAX, AMX_REG_INFO, AMX_INFO_HEAP);
 | |
| 	IA32_Lea_Reg_DispRegMult(jit, REG_EAX, REG_EAX, REG_EDX, SCALE4);
 | |
| 	IA32_Cmp_Reg_Rm_Disp8(jit, REG_EAX, AMX_REG_INFO, AMX_INFO_DATASIZE);
 | |
| 	err1 = IA32_Jump_Cond_Imm32(jit, CC_BE, 0);
 | |
| 	IA32_Add_Reg_Rm(jit, REG_EAX, AMX_REG_DAT, MOD_REG);
 | |
| 	IA32_Cmp_Reg_Rm(jit, REG_EAX, AMX_REG_STK, MOD_REG);
 | |
| 	err2 = IA32_Jump_Cond_Imm32(jit, CC_AE, 0);
 | |
| 	
 | |
| 	/* Prepare for indirection iteration */
 | |
| 	//mov eax, [esi+info.heap]	;get heap pointer
 | |
| 	//lea ebx, [eax+edx*4]		;new heap pointer
 | |
| 	//mov [esi+info.heap], ebx	;store back
 | |
| 	//push eax					;save heap pointer - we need it
 | |
| 	IA32_Mov_Reg_Rm_Disp8(jit, REG_EAX, AMX_REG_INFO, AMX_INFO_HEAP);
 | |
| 	IA32_Lea_Reg_DispRegMult(jit, REG_EBX, REG_EAX, REG_EDX, SCALE4);
 | |
| 	IA32_Mov_Rm_Reg_Disp8(jit, AMX_REG_INFO, REG_EBX, AMX_INFO_HEAP);
 | |
| 	IA32_Push_Reg(jit, REG_EAX);
 | |
| 
 | |
| 	WriteOp_Tracker_Push_Reg(jit, REG_EDX);
 | |
| 	
 | |
| 	/* This part is too messy to do in straight assembly.
 | |
| 	 * I'm letting the compiler handle it and thus it's in C.
 | |
| 	 */
 | |
| 	//lea ebx, [ebp+eax]		;get base pointer
 | |
| 	//push dword [esp-8]		;push autozero
 | |
| 	//push dword [esp-8]		;push dimension count
 | |
| 	//push edi					;push dim array
 | |
| 	//push ebx
 | |
| 	//call GenerateArrayIndirectionVectors
 | |
| 	//add esp, 4*4
 | |
| 	IA32_Lea_Reg_DispRegMult(jit, REG_EBX, REG_EAX, REG_EBP, NOSCALE);
 | |
| 	IA32_Push_Rm_Disp8_ESP(jit, 8);
 | |
| 	IA32_Push_Rm_Disp8_ESP(jit, 8);
 | |
| 	IA32_Push_Reg(jit, REG_EDI);
 | |
| 	IA32_Push_Reg(jit, REG_EBX);
 | |
| 	IA32_Write_Jump32_Abs(jit, IA32_Call_Imm32(jit, 0), (void *)&GenerateArrayIndirectionVectors);
 | |
| 	IA32_Add_Rm_Imm8(jit, REG_ESP, 4*4, MOD_REG);
 | |
| 
 | |
| 	/* Store the heap pointer back into the stack */
 | |
| 	//pop eax					;restore heap pointer
 | |
| 	//pop ecx					;restore param count
 | |
| 	//lea edi, [edi+ecx*4-4]	;pop params-4 off the stack
 | |
| 	//mov [edi], eax			;store back the heap pointer
 | |
| 	IA32_Pop_Reg(jit, REG_EAX);
 | |
| 	IA32_Pop_Reg(jit, REG_ECX);
 | |
| 	IA32_Lea_Reg_DispRegMultImm8(jit, AMX_REG_STK, AMX_REG_STK, REG_ECX, SCALE4, -4);
 | |
| 	IA32_Mov_Rm_Reg(jit, AMX_REG_STK, REG_EAX, MOD_MEM_REG);
 | |
| 
 | |
| 	/* Return to caller */
 | |
| 	//pop edx
 | |
| 	//pop eax
 | |
| 	//pop ebx
 | |
| 	//ret
 | |
| 	IA32_Pop_Reg(jit, REG_ECX);
 | |
| 	IA32_Pop_Reg(jit, REG_EAX);
 | |
| 	IA32_Pop_Reg(jit, REG_EBX);
 | |
| 	IA32_Return(jit);
 | |
| 
 | |
| 	//:error
 | |
| 	IA32_Send_Jump32_Here(jit, err1);
 | |
| 	IA32_Send_Jump32_Here(jit, err2);
 | |
| 	Write_SetError(jit, SP_ERROR_ARRAY_TOO_BIG);
 | |
| }
 | |
| 
 | |
| void WriteOp_Tracker_Push_Reg(JitWriter *jit, uint8_t reg)
 | |
| {
 | |
| 	/* Save registers that may be damaged by the call */
 | |
| 	//push eax
 | |
| 	//push ecx
 | |
| 	//push edi
 | |
| 	//lea edi, [<reg>*4]		; we want the count in bytes not in cells
 | |
| 	IA32_Push_Reg(jit, AMX_REG_PRI);
 | |
| 	if (reg == REG_ECX)
 | |
| 	{
 | |
| 		IA32_Push_Reg(jit, AMX_REG_TMP);
 | |
| 	}
 | |
| 	IA32_Push_Reg(jit, AMX_REG_STK);
 | |
| 	IA32_Lea_Reg_RegMultImm32(jit, REG_EDI, reg, SCALE4, 0);
 | |
| 
 | |
| 	/* Get the context ptr, push it and call the check */
 | |
| 	//mov eax, [esi+context]
 | |
| 	//push eax
 | |
| 	//call JIT_VerifyOrAllocateTracker
 | |
| 	IA32_Mov_Reg_Rm_Disp8(jit, REG_EAX, AMX_REG_INFO, AMX_INFO_CONTEXT);
 | |
| 	IA32_Push_Reg(jit, REG_EAX);
 | |
| 	jitoffs_t call = IA32_Call_Imm32(jit, 0);
 | |
| 	IA32_Write_Jump32_Abs(jit, call, (void *)JIT_VerifyOrAllocateTracker);
 | |
| 
 | |
| 	/* Check for errors */
 | |
| 	//cmp eax, 0
 | |
| 	//jnz :error
 | |
| 	IA32_Cmp_Rm_Imm8(jit, MOD_REG, REG_EAX, 0);
 | |
| 	IA32_Jump_Cond_Imm32_Abs(jit, CC_NZ, g_Jit.GetReturnPoint());
 | |
| 
 | |
| 	/* Restore */
 | |
| 	//pop eax
 | |
| 	IA32_Pop_Reg(jit, REG_EAX);
 | |
| 	
 | |
| 	/* Push the register into the stack and increment pCur */
 | |
| 	//mov edx, [eax+vm[]]
 | |
| 	//mov eax, [edx+pcur]
 | |
| 	//add [edx+pcur], 4
 | |
| 	//mov [eax], edi
 | |
| 	IA32_Mov_Reg_Rm_Disp8(jit, REG_EDX, REG_EAX, offsetof(sp_context_t, vm[JITVARS_TRACKER]));
 | |
| 	IA32_Mov_Reg_Rm_Disp8(jit, REG_EAX, REG_EDX, offsetof(tracker_t, pCur));
 | |
| 	IA32_Add_Rm_Imm8_Disp8(jit, REG_EDX, 4, offsetof(tracker_t, pCur));
 | |
| 	IA32_Mov_Rm_Reg(jit, REG_EAX, REG_EDI, MOD_MEM_REG);
 | |
| 
 | |
| 	/* Restore PRI, ALT and STK */
 | |
| 	//pop edi
 | |
| 	//pop ecx
 | |
| 	//pop eax
 | |
| 	IA32_Pop_Reg(jit, AMX_REG_STK);
 | |
| 	if (reg == REG_ECX)
 | |
| 	{
 | |
| 		IA32_Pop_Reg(jit, AMX_REG_TMP);
 | |
| 	}
 | |
| 	IA32_Pop_Reg(jit, AMX_REG_PRI);
 | |
| }
 | |
| 
 | |
| int JIT_VerifyOrAllocateTracker(sp_context_t *ctx)
 | |
| {
 | |
| 	tracker_t *trk = (tracker_t *)(ctx->vm[JITVARS_TRACKER]);
 | |
| 
 | |
| 	if ((size_t)(trk->pCur - trk->pBase) >= trk->size)
 | |
| 	{
 | |
| 		return SP_ERROR_TRACKER_BOUNDS;
 | |
| 	}
 | |
| 
 | |
| 	if (trk->pCur+1 - (trk->pBase + trk->size) == 0)
 | |
| 	{
 | |
| 		size_t disp = trk->size - 1;
 | |
| 		trk->size *= 2;
 | |
| 		trk->pBase = (ucell_t *)realloc(trk->pBase, trk->size * sizeof(cell_t));
 | |
| 
 | |
| 		if (!trk->pBase)
 | |
| 		{
 | |
| 			return SP_ERROR_TRACKER_BOUNDS;
 | |
| 		}
 | |
| 
 | |
| 		trk->pCur = trk->pBase + disp;
 | |
| 	}
 | |
| 
 | |
| 	return SP_ERROR_NONE;
 | |
| }
 | |
| 
 | |
| int JIT_VerifyLowBoundTracker(sp_context_t *ctx)
 | |
| {
 | |
| 	tracker_t *trk = (tracker_t *)(ctx->vm[JITVARS_TRACKER]);
 | |
| 
 | |
| 	if (trk->pCur <= trk->pBase)
 | |
| 	{
 | |
| 		return SP_ERROR_TRACKER_BOUNDS;
 | |
| 	}
 | |
| 
 | |
| 	return SP_ERROR_NONE;
 | |
| }
 | |
| 
 | |
| void AlignMe(JitWriter *jit)
 | |
| {
 | |
| 	jitoffs_t cur_offs = jit->get_outputpos();
 | |
| 	jitoffs_t offset = ((cur_offs & 0xFFFFFFF0) + 16) - cur_offs;
 | |
| 
 | |
| 	if (offset)
 | |
| 	{
 | |
| 		for (jit_uint32_t i=0; i<offset; i++)
 | |
| 		{
 | |
| 			jit->write_ubyte(IA32_INT3);
 | |
| 		}
 | |
| 	}
 | |
| }
 |