/* Pawn compiler - Staging buffer and optimizer * * The staging buffer * ------------------ * The staging buffer allows buffered output of generated code, deletion * of redundant code, optimization by a tinkering process and reversing * the output of evaluated expressions (which is used for the reversed * evaluation of arguments in functions). * Initially, stgwrite() writes to the file directly, but after a call to * stgset(TRUE), output is redirected to the buffer. After a call to * stgset(FALSE), stgwrite()'s output is directed to the file again. Thus * only one routine is used for writing to the output, which can be * buffered output or direct output. * * staging buffer variables: stgbuf - the buffer * stgidx - current index in the staging buffer * staging - if true, write to the staging buffer; * if false, write to file directly. * * The peephole optimizer uses a dual "pipeline". The staging buffer (described * above) gets optimized for each expression or sub-expression in a function * call. The peephole optimizer is recursive, but it does not span multiple * sub-expressions. However, the data gets written to a second buffer that * behaves much like the staging buffer. This second buffer gathers all * optimized strings from the staging buffer for a complete expression. The * peephole optimizer then runs over this second buffer to find optimizations * across function parameter boundaries. * * * Copyright (c) ITB CompuPhase, 1997-2006 * * This software is provided "as-is", without any express or implied warranty. * In no event will the authors be held liable for any damages arising from * the use of this software. * * Permission is granted to anyone to use this software for any purpose, * including commercial applications, and to alter it and redistribute it * freely, subject to the following restrictions: * * 1. The origin of this software must not be misrepresented; you must not * claim that you wrote the original software. 
If you use this software in * a product, an acknowledgment in the product documentation would be * appreciated but is not required. * 2. Altered source versions must be plainly marked as such, and must not be * misrepresented as being the original software. * 3. This notice may not be removed or altered from any source distribution. * * Version: $Id$ */ #include #include #include /* for atoi() */ #include #include #if defined FORTIFY #include #endif #include "sc.h" #if defined _MSC_VER #pragma warning(push) #pragma warning(disable:4125) /* decimal digit terminates octal escape sequence */ #endif #include "sc7.scp" #if defined _MSC_VER #pragma warning(pop) #endif static int stgstring(char *start,char *end); static void stgopt(char *start,char *end,int (*outputfunc)(char *str)); #define sSTG_GROW 512 #define sSTG_MAX 20480 static char *stgbuf=NULL; static int stgmax=0; /* current size of the staging buffer */ static char *stgpipe=NULL; static int pipemax=0; /* current size of the stage pipe, a second staging buffer */ static int pipeidx=0; #define CHECK_STGBUFFER(index) if ((int)(index)>=stgmax) grow_stgbuffer(&stgbuf, stgmax, (index)+1) #define CHECK_STGPIPE(index) if ((int)(index)>=pipemax) grow_stgbuffer(&stgpipe, pipemax, (index)+1) static void grow_stgbuffer(char **buffer, int curmax, int requiredsize) { char *p; int clear= (*buffer==NULL); /* if previously none, empty buffer explicitly */ assert(curmaxsSTG_MAX) error(102,"staging buffer"); /* staging buffer overflow (fatal error) */ curmax=requiredsize+sSTG_GROW; if (*buffer!=NULL) p=(char *)realloc(*buffer,curmax*sizeof(char)); else p=(char *)malloc(curmax*sizeof(char)); if (p==NULL) error(102,"staging buffer"); /* staging buffer overflow (fatal error) */ *buffer=p; if (clear) **buffer='\0'; } SC_FUNC void stgbuffer_cleanup(void) { if (stgbuf!=NULL) { free(stgbuf); stgbuf=NULL; stgmax=0; } /* if */ if (stgpipe!=NULL) { free(stgpipe); stgpipe=NULL; pipemax=0; pipeidx=0; } /* if */ } /* the variables "stgidx" 
and "staging" are declared in "scvars.c" */ /* stgmark * * Copies a mark into the staging buffer. At this moment there are three * possible marks: * sSTARTREORDER identifies the beginning of a series of expression * strings that must be written to the output file in * reordered order * sENDREORDER identifies the end of 'reverse evaluation' * sEXPRSTART + idx only valid within a block that is evaluated in * reordered order, it identifies the start of an * expression; the "idx" value is the argument position * * Global references: stgidx (altered) * stgbuf (altered) * staging (referred to only) */ SC_FUNC void stgmark(char mark) { if (staging) { CHECK_STGBUFFER(stgidx); stgbuf[stgidx++]=mark; } /* if */ } static int rebuffer(char *str) { if (sc_status==statWRITE) { if (pipeidx>=2 && stgpipe[pipeidx-1]=='\0' && stgpipe[pipeidx-2]!='\n') pipeidx-=1; /* overwrite last '\0' */ while (*str!='\0') { /* copy to staging buffer */ CHECK_STGPIPE(pipeidx); stgpipe[pipeidx++]=*str++; } /* while */ CHECK_STGPIPE(pipeidx); stgpipe[pipeidx++]='\0'; } /* if */ return TRUE; } static int filewrite(char *str) { if (sc_status==statWRITE) return pc_writeasm(outf,str); return TRUE; } /* stgwrite * * Writes the string "st" to the staging buffer or to the output file. In the * case of writing to the staging buffer, the terminating byte of zero is * copied too, but... the optimizer can only work on complete lines (not on * fractions of it. Therefore if the string is staged, if the last character * written to the buffer is a '\0' and the previous-to-last is not a '\n', * the string is concatenated to the last string in the buffer (the '\0' is * overwritten). This also means an '\n' used in the middle of a string isn't * recognized and could give wrong results with the optimizer. * Even when writing to the output file directly, all strings are buffered * until a whole line is complete. 
* * Global references: stgidx (altered) * stgbuf (altered) * staging (referred to only) */ SC_FUNC void stgwrite(const char *st) { int len; if (staging) { assert(stgidx==0 || stgbuf!=NULL); /* staging buffer must be valid if there is (apparently) something in it */ if (stgidx>=2 && stgbuf[stgidx-1]=='\0' && stgbuf[stgidx-2]!='\n') stgidx-=1; /* overwrite last '\0' */ while (*st!='\0') { /* copy to staging buffer */ CHECK_STGBUFFER(stgidx); stgbuf[stgidx++]=*st++; } /* while */ CHECK_STGBUFFER(stgidx); stgbuf[stgidx++]='\0'; } else { /* not staging: append "st" to the text already pending in stgbuf */ len=(stgbuf!=NULL) ? strlen(stgbuf) : 0; CHECK_STGBUFFER(len+strlen(st)+1); strcat(stgbuf,st); len=strlen(stgbuf); if (len>0 && stgbuf[len-1]=='\n') { /* the pending text ends in a newline: pass it to filewrite() and empty the buffer */ filewrite(stgbuf); stgbuf[0]='\0'; } /* if */ } /* if */ } /* stgout * * Writes the staging buffer to the output file via stgstring() (for * reversing expressions in the buffer) and stgopt() (for optimizing). It * resets "stgidx". * * "index" is the position in the staging buffer where the data to write * starts; the data runs up to "stgidx", and "stgidx" is set back to * "index" afterwards. Nothing happens when staging is off. * * Global references: stgidx (altered) * stgbuf (referred to only) * staging (referred to only) */ SC_FUNC void stgout(int index) { int reordered=0; int idx; if (!staging) return; assert(pipeidx==0); /* first pass: sub-expressions */ if (sc_status==statWRITE) reordered=stgstring(&stgbuf[index],&stgbuf[stgidx]); stgidx=index; /* second pass: optimize the buffer created in the first pass */ if (sc_status==statWRITE) { if (reordered) { stgopt(stgpipe,stgpipe+pipeidx,filewrite); } else { /* there is no sense in re-optimizing if the order of the sub-expressions * did not change; so output directly */ for (idx=0; idx=0) stack[arg].end=start-1; /* finish previous argument */ arg=(unsigned char)*start - sEXPRSTART; stack[arg].start=start+1; if (arg>=argc) argc=arg+1; } /* if */ start++; } else { start+=strlen(start)+1; } /* if */ } /* switch */ } while (nest); /* enddo */ if (arg>=0) stack[arg].end=start-1; /* finish previous argument */ while (argc>0) { argc--; stgstring(stack[argc].start,stack[argc].end); } /* while */ free(stack); } else { ptr=start; while (ptr0) 
filewrite(stgbuf); } /* if */ stgbuf[0]='\0'; } /* phopt_init * Initialize all sequence strings of the peephole optimizer. The strings * are embedded in the .EXE file in compressed format, here we expand * them (and allocate memory for the sequences). * Returns FALSE when the table of sequences cannot be allocated. */ static SEQUENCE *sequences; SC_FUNC int phopt_init(void) { int number, i, len; char str[160]; /* count number of sequences */ for (number=0; sequences_cmp[number].find!=NULL; number++) /* nothing */; number++; /* include an item for the NULL terminator */ if ((sequences=(SEQUENCE*)malloc(number * sizeof(SEQUENCE)))==NULL) return FALSE; /* pre-initialize all to NULL (in case of failure) */ for (i=0; i (PAWN_CELL_SIZE/4) * MAX_OPT_CAT #define MAX_ALIAS sNAMEMAX #else #define MAX_ALIAS (PAWN_CELL_SIZE/4) * MAX_OPT_CAT #endif static int matchsequence(char *start,char *end,char *pattern, char symbols[MAX_OPT_VARS][MAX_ALIAS+1], int *match_length) { int var,i; char str[MAX_ALIAS+1]; char *start_org=start; cell value; char *ptr; *match_length=0; for (var=0; var=end) return FALSE; switch (*pattern) { case '%': /* new "symbol" */ pattern++; assert(isdigit(*pattern)); var=atoi(pattern) - 1; assert(var>=0 && var=0 && var=0 && var0) { /* delete a section */ memmove(dest,dest+offset,dest_length-offset); memset(dest+dest_length-offset,0xcc,offset); /* not needed, but for cleanliness */ } else if (offset<0) { /* insert a section */ memmove(dest-offset, dest, dest_length); } /* if */ memcpy(dest, replace, repl_length); } /* stgopt * * Optimizes the staging buffer by checking for series of instructions that * can be coded more compact. The routine expects the lines in the staging * buffer to be separated with '\n' and '\0' characters. * * The longest sequences should probably be checked first. 
*/ static void stgopt(char *start,char *end,int (*outputfunc)(char *str)) { char symbols[MAX_OPT_VARS][MAX_ALIAS+1]; int seq,match_length,repl_length; int matches; char *debut=start; /* save original start of the buffer */ assert(sequences!=NULL); /* do not match anything if debug-level is maximum */ if (pc_optimize>sOPTIMIZE_NONE && sc_status==statWRITE) { do { matches=0; start=debut; while (start=0); if (*sequences[seq].find=='\0') { if (pc_optimize==sOPTIMIZE_NOMACRO) { break; /* don't look further */ } else { seq++; /* continue with next string */ continue; } /* if */ } /* if */ if (matchsequence(start,end,sequences[seq].find,symbols,&match_length)) { char *replace=replacesequence(sequences[seq].replace,symbols,&repl_length); /* If the replacement is bigger than the original section, we may need * to "grow" the staging buffer. This is quite complex, due to the * re-ordering of expressions that can also happen in the staging * buffer. In addition, it should not happen: the peephole optimizer * must replace sequences with *shorter* sequences, not longer ones. * So, I simply forbid sequences that are longer than the ones they * are meant to replace. */ assert(match_length>=repl_length); if (match_length>=repl_length) { strreplace(start,replace,match_length,repl_length,(int)(end-start)); end-=match_length-repl_length; free(replace); code_idx-=sequences[seq].savesize; seq=0; /* restart search for matches */ matches++; } else { /* actually, we should never get here (match_length0); } /* if (pc_optimize>sOPTIMIZE_NONE && sc_status==statWRITE) */ for (start=debut; start