* Regex Little Changes * Prevented to triple and double call `strlen`. * More informative message on `if (offset >= len)`. * Add missing parametr in navite `MatchRegex`. * Regex Little Changes v2 * Using `strdup` instead `strcpy`. * Replaced NULL to nullptr. * Removed note about MatchOffset. Co-Authored-By: Headline <headline@users.noreply.github.com> * Removed padding. Co-Authored-By: Headline <headline@users.noreply.github.com> * Removed more padding. Co-Authored-By: Headline <headline@users.noreply.github.com> Co-authored-by: Headline <michaelwflaherty@me.com>
		
			
				
	
	
		
			292 lines
		
	
	
		
			12 KiB
		
	
	
	
		
			SourcePawn
		
	
	
	
	
	
			
		
		
	
	
			292 lines
		
	
	
		
			12 KiB
		
	
	
	
		
			SourcePawn
		
	
	
	
	
	
/**
 | 
						|
 * vim: set ts=4 sw=4 tw=99 noet :
 | 
						|
 * =============================================================================
 | 
						|
 * SourceMod (C)2004-2008 AlliedModders LLC.  All rights reserved.
 | 
						|
 * =============================================================================
 | 
						|
 *
 | 
						|
 * This file is part of the SourceMod/SourcePawn SDK.
 | 
						|
 *
 | 
						|
 * This program is free software; you can redistribute it and/or modify it under
 | 
						|
 * the terms of the GNU General Public License, version 3.0, as published by the
 | 
						|
 * Free Software Foundation.
 | 
						|
 *
 | 
						|
 * This program is distributed in the hope that it will be useful, but WITHOUT
 | 
						|
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
 | 
						|
 * FOR A PARTICULAR PURPOSE.  See the GNU General Public License for more
 | 
						|
 * details.
 | 
						|
 *
 | 
						|
 * You should have received a copy of the GNU General Public License along with
 | 
						|
 * this program.  If not, see <http://www.gnu.org/licenses/>.
 | 
						|
 *
 | 
						|
 * As a special exception, AlliedModders LLC gives you permission to link the
 | 
						|
 * code of this program (as well as its derivative works) to "Half-Life 2," the
 | 
						|
 * "Source Engine," the "SourcePawn JIT," and any Game MODs that run on software
 | 
						|
 * by the Valve Corporation.  You must obey the GNU General Public License in
 | 
						|
 * all respects for all other code used.  Additionally, AlliedModders LLC grants
 | 
						|
 * this exception to all derivative works.  AlliedModders LLC defines further
 | 
						|
 * exceptions, found in LICENSE.txt (as of this writing, version JULY-31-2007),
 | 
						|
 * or <http://www.sourcemod.net/license.php>.
 | 
						|
 *
 | 
						|
 * Version: $Id$
 | 
						|
 */
 | 
						|
 | 
						|
#if defined _regex_included
 | 
						|
 #endinput
 | 
						|
#endif
 | 
						|
#define _regex_included
 | 
						|
 | 
						|
/**
 | 
						|
 * @section     Flags for compiling regex expressions.  These come directly from the
 | 
						|
 * pcre library and can be used in MatchRegex and CompileRegex.
 | 
						|
 */
 | 
						|
#define PCRE_CASELESS           0x00000001 /* Ignore Case */
 | 
						|
#define PCRE_MULTILINE          0x00000002 /* Multilines (affects ^ and $ so that they match the start/end of a line rather than matching the start/end of the string). */
 | 
						|
#define PCRE_DOTALL             0x00000004 /* Single line (affects . so that it matches any character, even new line characters). */
 | 
						|
#define PCRE_EXTENDED           0x00000008 /* Pattern extension (ignore whitespace and # comments). */
 | 
						|
#define PCRE_ANCHORED           0x00000010 /* Force pattern anchoring. */
 | 
						|
#define PCRE_DOLLAR_ENDONLY     0x00000020 /* $ not to match newline at end. */
 | 
						|
#define PCRE_UNGREEDY           0x00000200 /* Invert greediness of quantifiers */
 | 
						|
#define PCRE_NOTEMPTY           0x00000400 /* An empty string is not a valid match. */
 | 
						|
#define PCRE_UTF8               0x00000800 /* Use UTF-8 Chars */
 | 
						|
#define PCRE_NO_UTF8_CHECK      0x00002000 /* Do not check the pattern for UTF-8 validity (only relevant if PCRE_UTF8 is set) */
 | 
						|
#define PCRE_UCP                0x20000000 /* Use Unicode properties for \ed, \ew, etc. */
 | 
						|
 | 
						|
 | 
						|
/**
 | 
						|
 * Regex expression error codes.
 | 
						|
 */
 | 
						|
enum RegexError
 | 
						|
{
 | 
						|
	REGEX_ERROR_NONE = 0,               /* No error */
 | 
						|
 | 
						|
	REGEX_ERROR_ASSERT = 1,             /* internal error ? */
 | 
						|
	REGEX_ERROR_BADBR,                  /* invalid repeat counts in {} */
 | 
						|
	REGEX_ERROR_BADPAT,                 /* pattern error */
 | 
						|
	REGEX_ERROR_BADRPT,                 /* ? * + invalid */
 | 
						|
	REGEX_ERROR_EBRACE,                 /* unbalanced {} */
 | 
						|
	REGEX_ERROR_EBRACK,                 /* unbalanced [] */
 | 
						|
	REGEX_ERROR_ECOLLATE,               /* collation error - not relevant */
 | 
						|
	REGEX_ERROR_ECTYPE,                 /* bad class */
 | 
						|
	REGEX_ERROR_EESCAPE,                /* bad escape sequence */
 | 
						|
	REGEX_ERROR_EMPTY,                  /* empty expression */
 | 
						|
	REGEX_ERROR_EPAREN,                 /* unbalanced () */
 | 
						|
	REGEX_ERROR_ERANGE,                 /* bad range inside [] */
 | 
						|
	REGEX_ERROR_ESIZE,                  /* expression too big */
 | 
						|
	REGEX_ERROR_ESPACE,                 /* failed to get memory */
 | 
						|
	REGEX_ERROR_ESUBREG,                /* bad back reference */
 | 
						|
	REGEX_ERROR_INVARG,                 /* bad argument */
 | 
						|
 | 
						|
	REGEX_ERROR_NOMATCH = -1,           /* No match was found */
 | 
						|
	REGEX_ERROR_NULL = -2,
 | 
						|
	REGEX_ERROR_BADOPTION = -3,
 | 
						|
	REGEX_ERROR_BADMAGIC = -4,
 | 
						|
	REGEX_ERROR_UNKNOWN_OPCODE = -5,
 | 
						|
	REGEX_ERROR_NOMEMORY = -6,
 | 
						|
	REGEX_ERROR_NOSUBSTRING = -7,
 | 
						|
	REGEX_ERROR_MATCHLIMIT = -8,
 | 
						|
	REGEX_ERROR_CALLOUT = -9,           /* Never used by PCRE itself */
 | 
						|
	REGEX_ERROR_BADUTF8 = -10,
 | 
						|
	REGEX_ERROR_BADUTF8_OFFSET = -11,
 | 
						|
	REGEX_ERROR_PARTIAL = -12,
 | 
						|
	REGEX_ERROR_BADPARTIAL = -13,
 | 
						|
	REGEX_ERROR_INTERNAL = -14,
 | 
						|
	REGEX_ERROR_BADCOUNT = -15,
 | 
						|
	REGEX_ERROR_DFA_UITEM = -16,
 | 
						|
	REGEX_ERROR_DFA_UCOND = -17,
 | 
						|
	REGEX_ERROR_DFA_UMLIMIT = -18,
 | 
						|
	REGEX_ERROR_DFA_WSSIZE = -19,
 | 
						|
	REGEX_ERROR_DFA_RECURSE = -20,
 | 
						|
	REGEX_ERROR_RECURSIONLIMIT = -21,
 | 
						|
	REGEX_ERROR_NULLWSLIMIT = -22,      /* No longer actually used */
 | 
						|
	REGEX_ERROR_BADNEWLINE = -23,
 | 
						|
	REGEX_ERROR_BADOFFSET = -24,
 | 
						|
	REGEX_ERROR_SHORTUTF8 = -25,
 | 
						|
	REGEX_ERROR_RECURSELOOP = -26,
 | 
						|
	REGEX_ERROR_JIT_STACKLIMIT = -27,
 | 
						|
	REGEX_ERROR_BADMODE = -28,
 | 
						|
	REGEX_ERROR_BADENDIANNESS = -29,
 | 
						|
	REGEX_ERROR_DFA_BADRESTART = -30,
 | 
						|
	REGEX_ERROR_JIT_BADOPTION = -31,
 | 
						|
	REGEX_ERROR_BADLENGTH = -32
 | 
						|
};
 | 
						|
 | 
						|
// Regular expression objects are used to match or decompose strings based on
 | 
						|
// patterns.
 | 
						|
methodmap Regex < Handle
 | 
						|
{
 | 
						|
	// Compile a regular expression.
 | 
						|
	//
 | 
						|
	// @param pattern       The regular expression pattern.
 | 
						|
	// @param flags         General flags for the regular expression.
 | 
						|
	// @param error         Error message encountered, if applicable.
 | 
						|
	// @param maxLen        Maximum string length of the error buffer.
 | 
						|
	// @param errcode       Regex type error code encountered, if applicable.
 | 
						|
	public native Regex(const char[] pattern, int flags = 0, char[] error="", int maxLen = 0, RegexError &errcode = REGEX_ERROR_NONE);
 | 
						|
 | 
						|
	// Matches a string against a pre-compiled regular expression pattern.
 | 
						|
	//
 | 
						|
	// @param str           The string to check.
 | 
						|
	// @param ret           Error code, if applicable.
 | 
						|
	// @param offset        Offset in the string to start searching from. MatchOffset returns the offset of the match.
 | 
						|
	// @return              Number of captures found or -1 on failure.
 | 
						|
	//
 | 
						|
	// @note Use the regex handle passed to this function to extract
 | 
						|
	//       matches with GetSubString().
 | 
						|
	public native int Match(const char[] str, RegexError &ret = REGEX_ERROR_NONE, int offset = 0);
 | 
						|
 | 
						|
	// Gets all matches from a string against a pre-compiled regular expression pattern.
 | 
						|
	//
 | 
						|
	// @param str           The string to check.
 | 
						|
	// @param ret           Error code, if applicable.
 | 
						|
	// @return              Number of matches found or -1 on failure.
 | 
						|
	//
 | 
						|
	// @note Use GetSubString() and loop from 0 -> totalmatches - 1.
 | 
						|
	public native int MatchAll(const char[] str, RegexError &ret = REGEX_ERROR_NONE);
 | 
						|
 | 
						|
	// Returns a matched substring from a regex handle.
 | 
						|
	//
 | 
						|
	// Substring ids start at 0 and end at captures-1, where captures is the
 | 
						|
	// number returned by Regex.Match or Regex.CaptureCount.
 | 
						|
	//
 | 
						|
	// @param str_id        The index of the expression to get - starts at 0, and ends at captures - 1.
 | 
						|
	// @param buffer        The buffer to set to the matching substring.
 | 
						|
	// @param maxlen        The maximum string length of the buffer.
 | 
						|
	// @param match         Match to get the captures for - starts at 0, and ends at MatchCount() -1
 | 
						|
	// @return              True if a substring was found, False on fail/error
 | 
						|
	//
 | 
						|
	// @note str_id = 0 is the full captured string, anything else is the capture group index.
 | 
						|
	//       if Regex.Match is used match can only be 0
 | 
						|
	public native bool GetSubString(int str_id, char[] buffer, int maxlen, int match = 0);
 | 
						|
 | 
						|
	// Returns number of matches
 | 
						|
	//
 | 
						|
	// When using Match this is always 1 or 0 (unless an error occured)
 | 
						|
	// @return              Total number of matches found.
 | 
						|
	public native int MatchCount();
 | 
						|
 | 
						|
	// Returns number of captures for a match
 | 
						|
	//
 | 
						|
	// @param match         Match to get the number of captures for. Match starts at 0, and ends at MatchCount() -1
 | 
						|
	// @return              Number of captures in the match.
 | 
						|
	//
 | 
						|
	// @note Use GetSubString() and loop from 1 -> captures -1 for str_id to get all captures
 | 
						|
	public native int CaptureCount(int match = 0);
 | 
						|
 | 
						|
	// Returns the string offset of a match.
 | 
						|
	//
 | 
						|
	// @param match         Match to get the offset of. Match starts at 0, and ends at MatchCount() -1
 | 
						|
	// @return              Offset of the match in the string.
 | 
						|
	public native int MatchOffset(int match = 0);
 | 
						|
};
 | 
						|
 | 
						|
/**
 | 
						|
 * Precompile a regular expression.  Use this if you intend on using the
 | 
						|
 * same expression multiple times.  Pass the regex handle returned here to
 | 
						|
 * MatchRegex to check for matches.
 | 
						|
 *
 | 
						|
 * @param pattern       The regular expression pattern.
 | 
						|
 * @param flags         General flags for the regular expression.
 | 
						|
 * @param error         Error message encountered, if applicable.
 | 
						|
 * @param maxLen        Maximum string length of the error buffer.
 | 
						|
 * @param errcode       Regex type error code encountered, if applicable.
 | 
						|
 * @return              Valid regex handle on success, INVALID_HANDLE on failure.
 | 
						|
 */
 | 
						|
native Regex CompileRegex(const char[] pattern, int flags = 0, char[] error="", int maxLen = 0, RegexError &errcode = REGEX_ERROR_NONE);
 | 
						|
 | 
						|
/**
 | 
						|
 * Matches a string against a pre-compiled regular expression pattern.
 | 
						|
 *
 | 
						|
 * @param regex         Regex Handle from CompileRegex()
 | 
						|
 * @param str           The string to check.
 | 
						|
 * @param ret           Error code, if applicable.
 | 
						|
 * @param offset        Offset in the string to start searching from.
 | 
						|
 * @return              Number of captures found or -1 on failure.
 | 
						|
 *
 | 
						|
 * @note Use the regex handle passed to this function to extract
 | 
						|
 *       matches with GetRegexSubString().
 | 
						|
 */
 | 
						|
native int MatchRegex(Handle regex, const char[] str, RegexError &ret = REGEX_ERROR_NONE, int offset = 0);
 | 
						|
 | 
						|
/**
 | 
						|
 * Returns a matched substring from a regex handle.
 | 
						|
 * Substring ids start at 0 and end at captures-1, where captures is the number returned
 | 
						|
 * by MatchRegex.
 | 
						|
 *
 | 
						|
 * @param regex         The regex handle to extract data from.
 | 
						|
 * @param str_id        The index of the expression to get - starts at 0, and ends at captures - 1.
 | 
						|
 * @param buffer        The buffer to set to the matching substring.
 | 
						|
 * @param maxlen        The maximum string length of the buffer.
 | 
						|
 * @return              True if a substring was found, False on fail/error
 | 
						|
 *
 | 
						|
 * @note str_id = 0 is the full captured string, anything else is the capture group index.
 | 
						|
 *
 | 
						|
 */
 | 
						|
native bool GetRegexSubString(Handle regex, int str_id, char[] buffer, int maxlen);
 | 
						|
 | 
						|
/**
 | 
						|
 * Matches a string against a regular expression pattern.
 | 
						|
 *
 | 
						|
 * @note If you intend on using the same regular expression pattern
 | 
						|
 *       multiple times, consider using CompileRegex and MatchRegex
 | 
						|
 *       instead of making this function reparse the expression each time.
 | 
						|
 *
 | 
						|
 * @param str           The string to check.
 | 
						|
 * @param pattern       The regular expression pattern.
 | 
						|
 * @param flags         General flags for the regular expression.
 | 
						|
 * @param error         Error message, if applicable.
 | 
						|
 * @param maxLen        Maximum length of the error buffer.
 | 
						|
 * @return              Number of substrings found or -1 on failure.
 | 
						|
 */
 | 
						|
stock int SimpleRegexMatch(const char[] str, const char[] pattern, int flags = 0, char[] error="", int maxLen = 0)
 | 
						|
{
 | 
						|
	Regex regex = new Regex(pattern, flags, error, maxLen);
 | 
						|
	if (!regex)
 | 
						|
	{
 | 
						|
		return -1;
 | 
						|
	}
 | 
						|
 | 
						|
	int substrings = regex.Match(str);
 | 
						|
	delete regex;
 | 
						|
 | 
						|
	return substrings;
 | 
						|
}
 | 
						|
 | 
						|
/**
 | 
						|
 * @endsection
 | 
						|
 */
 | 
						|
 | 
						|
/**
 | 
						|
 * Do not edit below this line!
 | 
						|
 */
 | 
						|
public Extension __ext_regex =
 | 
						|
{
 | 
						|
	name = "Regex Extension",
 | 
						|
	file = "regex.ext",
 | 
						|
#if defined AUTOLOAD_EXTENSIONS
 | 
						|
	autoload = 1,
 | 
						|
#else
 | 
						|
	autoload = 0,
 | 
						|
#endif
 | 
						|
#if defined REQUIRE_EXTENSIONS
 | 
						|
	required = 1,
 | 
						|
#else
 | 
						|
	required = 0,
 | 
						|
#endif
 | 
						|
};
 | 
						|
 | 
						|
#if !defined REQUIRE_EXTENSIONS
 | 
						|
public void __ext_regex_SetNTVOptional()
 | 
						|
{
 | 
						|
	MarkNativeAsOptional("CompileRegex");
 | 
						|
	MarkNativeAsOptional("MatchRegex");
 | 
						|
	MarkNativeAsOptional("GetRegexSubString");
 | 
						|
	MarkNativeAsOptional("Regex.Regex");
 | 
						|
	MarkNativeAsOptional("Regex.Match");
 | 
						|
	MarkNativeAsOptional("Regex.MatchAll");
 | 
						|
	MarkNativeAsOptional("Regex.GetSubString");
 | 
						|
	MarkNativeAsOptional("Regex.MatchCount");
 | 
						|
	MarkNativeAsOptional("Regex.CaptureCount");
 | 
						|
	MarkNativeAsOptional("Regex.MatchOffset");
 | 
						|
}
 | 
						|
#endif
 |