Permalink
Cannot retrieve contributors at this time
4621 lines (4097 sloc)
116 KB
/********************************************************************** | |
regexec.c - Onigmo (Oniguruma-mod) (regular expression library) | |
**********************************************************************/ | |
/*- | |
* Copyright (c) 2002-2008 K.Kosako <sndgk393 AT ybb DOT ne DOT jp> | |
* Copyright (c) 2011-2016 K.Takata <kentkt AT csc DOT jp> | |
* All rights reserved. | |
* | |
* Redistribution and use in source and binary forms, with or without | |
* modification, are permitted provided that the following conditions | |
* are met: | |
* 1. Redistributions of source code must retain the above copyright | |
* notice, this list of conditions and the following disclaimer. | |
* 2. Redistributions in binary form must reproduce the above copyright | |
* notice, this list of conditions and the following disclaimer in the | |
* documentation and/or other materials provided with the distribution. | |
* | |
* THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND | |
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE | |
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE | |
* ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE | |
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL | |
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS | |
* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) | |
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT | |
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY | |
* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF | |
* SUCH DAMAGE. | |
*/ | |
#include "regint.h" | |
/* Outside of Ruby builds USE_MATCH_RANGE_MUST_BE_INSIDE_OF_SPECIFIED_RANGE is
 * defined, which makes the DATA_ENSURE* macros further down test against
 * right_range instead of end. */
#ifdef RUBY | |
# undef USE_MATCH_RANGE_MUST_BE_INSIDE_OF_SPECIFIED_RANGE | |
#else | |
# define USE_MATCH_RANGE_MUST_BE_INSIDE_OF_SPECIFIED_RANGE | |
#endif | |
/* Unless the build already chose a value, USE_TOKEN_THREADED_VM defaults to 1
 * when __GNUC__ is defined and to 0 otherwise.
 * NOTE(review): presumably selects the opcode dispatch style of the match
 * loop, which is outside this excerpt -- confirm there. */
#ifndef USE_TOKEN_THREADED_VM | |
# ifdef __GNUC__ | |
# define USE_TOKEN_THREADED_VM 1 | |
# else | |
# define USE_TOKEN_THREADED_VM 0 | |
# endif | |
#endif | |
#ifdef RUBY | |
# define ENC_DUMMY_FLAG (1<<24) | |
static inline int | |
rb_enc_asciicompat(OnigEncoding enc) | |
{ | |
return ONIGENC_MBC_MINLEN(enc)==1 && !((enc)->ruby_encoding_index & ENC_DUMMY_FLAG); | |
} | |
/* Ruby override of the ASCII word-character test.  For encodings accepted by
 * rb_enc_asciicompat() the first byte at `s` is tested directly (alphanumeric
 * or '_'); for all others the character is decoded and checked with
 * onigenc_ascii_is_code_ctype().  `s` is parenthesized before dereferencing so
 * that expression arguments such as `p + 1` are handled correctly. */
# undef ONIGENC_IS_MBC_ASCII_WORD
# define ONIGENC_IS_MBC_ASCII_WORD(enc,s,end) \
    (rb_enc_asciicompat(enc) ? (ISALNUM(*(s)) || *(s)=='_') : \
   onigenc_ascii_is_code_ctype( \
        ONIGENC_MBC_TO_CODE(enc,s,end),ONIGENC_CTYPE_WORD,enc))
#endif /* RUBY */ | |
#ifdef USE_CRNL_AS_LINE_TERMINATOR | |
/* True when the character at `p` is CR (13) and the character following it
 * is LF (10).  `p` is parenthesized inside the pointer arithmetic so that an
 * expression argument cannot change the meaning of the addition. */
# define ONIGENC_IS_MBC_CRNL(enc,p,end) \
  (ONIGENC_MBC_TO_CODE(enc,p,end) == 13 && \
   ONIGENC_MBC_TO_CODE(enc,((p)+enclen(enc,p,end)),end) == 10)

/* Option-aware newline test; forwards every argument to is_mbc_newline_ex(). */
# define ONIGENC_IS_MBC_NEWLINE_EX(enc,p,start,end,option,check_prev) \
  is_mbc_newline_ex((enc),(p),(start),(end),(option),(check_prev))
static int | |
is_mbc_newline_ex(OnigEncoding enc, const UChar *p, const UChar *start, | |
const UChar *end, OnigOptionType option, int check_prev) | |
{ | |
if (IS_NEWLINE_CRLF(option)) { | |
if (ONIGENC_MBC_TO_CODE(enc, p, end) == 0x0a) { | |
if (check_prev) { | |
const UChar *prev = onigenc_get_prev_char_head(enc, start, p, end); | |
if ((prev != NULL) && ONIGENC_MBC_TO_CODE(enc, prev, end) == 0x0d) | |
return 0; | |
else | |
return 1; | |
} | |
else | |
return 1; | |
} | |
else { | |
const UChar *pnext = p + enclen(enc, p, end); | |
if (pnext < end && | |
ONIGENC_MBC_TO_CODE(enc, p, end) == 0x0d && | |
ONIGENC_MBC_TO_CODE(enc, pnext, end) == 0x0a) | |
return 1; | |
if (ONIGENC_IS_MBC_NEWLINE(enc, p, end)) | |
return 1; | |
return 0; | |
} | |
} | |
else { | |
return ONIGENC_IS_MBC_NEWLINE(enc, p, end); | |
} | |
} | |
#else /* USE_CRNL_AS_LINE_TERMINATOR */ | |
/* Without USE_CRNL_AS_LINE_TERMINATOR this is a plain newline test; the
 * start, option and check_prev arguments are not used. */
# define ONIGENC_IS_MBC_NEWLINE_EX(enc,p,start,end,option,check_prev) \ | |
ONIGENC_IS_MBC_NEWLINE((enc), (p), (end)) | |
#endif /* USE_CRNL_AS_LINE_TERMINATOR */ | |
#ifdef USE_CAPTURE_HISTORY | |
static void history_tree_free(OnigCaptureTreeNode* node);

/*
 * Releases every child subtree of `node` together with the child pointer
 * array and puts the node back into the empty state that history_node_new()
 * produces.  The node itself is not freed.  A NULL `node` is ignored.
 */
static void
history_tree_clear(OnigCaptureTreeNode* node)
{
  int i;

  if (IS_NULL(node)) return;

  for (i = 0; i < node->num_childs; i++) {
    if (IS_NOT_NULL(node->childs[i])) {
      history_tree_free(node->childs[i]);
    }
  }

  xfree(node->childs);
  node->childs = (OnigCaptureTreeNode** )0;
  /* The array is gone, so the recorded capacity has to drop to zero too;
   * otherwise a later history_tree_add_child() would see spare capacity,
   * skip the allocation and store through the NULL pointer. */
  node->allocated  = 0;
  node->num_childs = 0;

  node->beg   = ONIG_REGION_NOTPOS;
  node->end   = ONIG_REGION_NOTPOS;
  node->group = -1;
}
static void | |
history_tree_free(OnigCaptureTreeNode* node) | |
{ | |
history_tree_clear(node); | |
xfree(node); | |
} | |
static void | |
history_root_free(OnigRegion* r) | |
{ | |
if (IS_NOT_NULL(r->history_root)) { | |
history_tree_free(r->history_root); | |
r->history_root = (OnigCaptureTreeNode* )0; | |
} | |
} | |
static OnigCaptureTreeNode* | |
history_node_new(void) | |
{ | |
OnigCaptureTreeNode* node; | |
node = (OnigCaptureTreeNode* )xmalloc(sizeof(OnigCaptureTreeNode)); | |
CHECK_NULL_RETURN(node); | |
node->childs = (OnigCaptureTreeNode** )0; | |
node->allocated = 0; | |
node->num_childs = 0; | |
node->group = -1; | |
node->beg = ONIG_REGION_NOTPOS; | |
node->end = ONIG_REGION_NOTPOS; | |
return node; | |
} | |
static int | |
history_tree_add_child(OnigCaptureTreeNode* parent, OnigCaptureTreeNode* child) | |
{ | |
# define HISTORY_TREE_INIT_ALLOC_SIZE 8 | |
if (parent->num_childs >= parent->allocated) { | |
int n, i; | |
if (IS_NULL(parent->childs)) { | |
n = HISTORY_TREE_INIT_ALLOC_SIZE; | |
parent->childs = | |
(OnigCaptureTreeNode** )xmalloc(sizeof(OnigCaptureTreeNode*) * n); | |
CHECK_NULL_RETURN_MEMERR(parent->childs); | |
} | |
else { | |
OnigCaptureTreeNode** tmp; | |
n = parent->allocated * 2; | |
tmp = | |
(OnigCaptureTreeNode** )xrealloc(parent->childs, | |
sizeof(OnigCaptureTreeNode*) * n); | |
if (tmp == 0) { | |
history_tree_clear(parent); | |
return ONIGERR_MEMORY; | |
} | |
parent->childs = tmp; | |
} | |
for (i = parent->allocated; i < n; i++) { | |
parent->childs[i] = (OnigCaptureTreeNode* )0; | |
} | |
parent->allocated = n; | |
} | |
parent->childs[parent->num_childs] = child; | |
parent->num_childs++; | |
return 0; | |
} | |
/*
 * Deep-copies the capture-history subtree rooted at `node` (which must not
 * be NULL).
 *
 * Returns the root of the copy, or NULL when an allocation fails; in that
 * case everything built so far is released before returning.
 */
static OnigCaptureTreeNode*
history_tree_clone(OnigCaptureTreeNode* node)
{
  int i, r;
  OnigCaptureTreeNode *clone, *child;

  clone = history_node_new();
  CHECK_NULL_RETURN(clone);

  /* history_node_new() initializes group to -1, so the group number must be
   * copied explicitly; otherwise every node of the clone would lose the
   * capture group it belongs to. */
  clone->group = node->group;
  clone->beg   = node->beg;
  clone->end   = node->end;

  for (i = 0; i < node->num_childs; i++) {
    child = history_tree_clone(node->childs[i]);
    if (IS_NULL(child)) {
      history_tree_free(clone);
      return (OnigCaptureTreeNode* )0;
    }
    r = history_tree_add_child(clone, child);
    if (r != 0) {
      /* add_child does not take ownership on failure. */
      history_tree_free(child);
      history_tree_free(clone);
      return (OnigCaptureTreeNode* )0;
    }
  }

  return clone;
}
extern OnigCaptureTreeNode* | |
onig_get_capture_tree(OnigRegion* region) | |
{ | |
return region->history_root; | |
} | |
#endif /* USE_CAPTURE_HISTORY */ | |
extern void | |
onig_region_clear(OnigRegion* region) | |
{ | |
int i; | |
for (i = 0; i < region->num_regs; i++) { | |
region->beg[i] = region->end[i] = ONIG_REGION_NOTPOS; | |
} | |
#ifdef USE_CAPTURE_HISTORY | |
history_root_free(region); | |
#endif | |
} | |
extern int | |
onig_region_resize(OnigRegion* region, int n) | |
{ | |
region->num_regs = n; | |
if (n < ONIG_NREGION) | |
n = ONIG_NREGION; | |
if (region->allocated == 0) { | |
region->beg = (OnigPosition* )xmalloc(n * sizeof(OnigPosition)); | |
if (region->beg == 0) | |
return ONIGERR_MEMORY; | |
region->end = (OnigPosition* )xmalloc(n * sizeof(OnigPosition)); | |
if (region->end == 0) { | |
xfree(region->beg); | |
return ONIGERR_MEMORY; | |
} | |
region->allocated = n; | |
} | |
else if (region->allocated < n) { | |
OnigPosition *tmp; | |
region->allocated = 0; | |
tmp = (OnigPosition* )xrealloc(region->beg, n * sizeof(OnigPosition)); | |
if (tmp == 0) { | |
xfree(region->beg); | |
xfree(region->end); | |
return ONIGERR_MEMORY; | |
} | |
region->beg = tmp; | |
tmp = (OnigPosition* )xrealloc(region->end, n * sizeof(OnigPosition)); | |
if (tmp == 0) { | |
xfree(region->beg); | |
xfree(region->end); | |
return ONIGERR_MEMORY; | |
} | |
region->end = tmp; | |
region->allocated = n; | |
} | |
return 0; | |
} | |
static int | |
onig_region_resize_clear(OnigRegion* region, int n) | |
{ | |
int r; | |
r = onig_region_resize(region, n); | |
if (r != 0) return r; | |
onig_region_clear(region); | |
return 0; | |
} | |
extern int | |
onig_region_set(OnigRegion* region, int at, int beg, int end) | |
{ | |
if (at < 0) return ONIGERR_INVALID_ARGUMENT; | |
if (at >= region->allocated) { | |
int r = onig_region_resize(region, at + 1); | |
if (r < 0) return r; | |
} | |
region->beg[at] = beg; | |
region->end[at] = end; | |
return 0; | |
} | |
extern void | |
onig_region_init(OnigRegion* region) | |
{ | |
region->num_regs = 0; | |
region->allocated = 0; | |
region->beg = (OnigPosition* )0; | |
region->end = (OnigPosition* )0; | |
#ifdef USE_CAPTURE_HISTORY | |
region->history_root = (OnigCaptureTreeNode* )0; | |
#endif | |
} | |
extern OnigRegion* | |
onig_region_new(void) | |
{ | |
OnigRegion* r; | |
r = (OnigRegion* )xmalloc(sizeof(OnigRegion)); | |
if (r) | |
onig_region_init(r); | |
return r; | |
} | |
extern void | |
onig_region_free(OnigRegion* r, int free_self) | |
{ | |
if (r) { | |
if (r->allocated > 0) { | |
if (r->beg) xfree(r->beg); | |
if (r->end) xfree(r->end); | |
r->allocated = 0; | |
} | |
#ifdef USE_CAPTURE_HISTORY | |
history_root_free(r); | |
#endif | |
if (free_self) xfree(r); | |
} | |
} | |
extern void | |
onig_region_copy(OnigRegion* to, const OnigRegion* from) | |
{ | |
#define RREGC_SIZE (sizeof(int) * from->num_regs) | |
int i, r; | |
if (to == from) return; | |
r = onig_region_resize(to, from->num_regs); | |
if (r) return; | |
for (i = 0; i < from->num_regs; i++) { | |
to->beg[i] = from->beg[i]; | |
to->end[i] = from->end[i]; | |
} | |
to->num_regs = from->num_regs; | |
#ifdef USE_CAPTURE_HISTORY | |
history_root_free(to); | |
if (IS_NOT_NULL(from->history_root)) { | |
to->history_root = history_tree_clone(from->history_root); | |
} | |
#endif | |
} | |
/** stack **/ | |
/* Value stored in mem_end_stk[] by STACK_PUSH_MEM_START to say that no stack
 * index has been recorded. */
#define INVALID_STACK_INDEX -1 | |
/* stack type */ | |
/* Values of the `type` field of a stack entry.  Only the three kinds in the
 * first group have a non-zero low byte; that byte is what STACK_POP tests
 * (STK_MASK_POP_USED) to decide where to stop. */
/* used by normal-POP */ | |
#define STK_ALT 0x0001 | |
#define STK_LOOK_BEHIND_NOT 0x0002 | |
#define STK_POS_NOT 0x0003 | |
/* handled by normal-POP */ | |
#define STK_MEM_START 0x0100 | |
#define STK_MEM_END 0x8200 | |
#define STK_REPEAT_INC 0x0300 | |
#define STK_STATE_CHECK_MARK 0x1000 | |
/* avoided by normal-POP */ | |
#define STK_NULL_CHECK_START 0x3000 | |
#define STK_NULL_CHECK_END 0x5000 /* for recursive call */ | |
#define STK_MEM_END_MARK 0x8400 | |
#define STK_POS 0x0500 /* used when POP-POS */ | |
#define STK_STOP_BT 0x0600 /* mark for "(?>...)" */ | |
#define STK_REPEAT 0x0700 | |
#define STK_CALL_FRAME 0x0800 | |
#define STK_RETURN 0x0900 | |
#define STK_VOID 0x0a00 /* for fill a blank */ | |
#define STK_ABSENT_POS 0x0b00 /* for absent */ | |
#define STK_ABSENT 0x0c00 /* absent inner loop marker */ | |
/* stack type check mask */ | |
/* Low byte: non-zero only for STK_ALT, STK_LOOK_BEHIND_NOT and STK_POS_NOT. */
#define STK_MASK_POP_USED 0x00ff | |
/* Used by IS_TO_VOID_TARGET.  In addition to the low byte it covers bit
 * 0x1000, which is set in STK_STATE_CHECK_MARK, STK_NULL_CHECK_START and
 * STK_NULL_CHECK_END. */
#define STK_MASK_TO_VOID_TARGET 0x10ff | |
/* Bit 0x8000 is set only in STK_MEM_END and STK_MEM_END_MARK. */
#define STK_MASK_MEM_END_OR_MARK 0x8000 /* MEM_END or MEM_END_MARK */ | |
/* MATCH_ARG_INIT fills a match-argument record `msa`: stack_p is reset to
 * NULL and the options, region, start and gpos fields are taken from the
 * arguments.  The USE_FIND_LONGEST_SEARCH_ALL_OF_RANGE variant additionally
 * resets best_len to ONIG_MISMATCH. */
#ifdef USE_FIND_LONGEST_SEARCH_ALL_OF_RANGE | |
# define MATCH_ARG_INIT(msa, arg_option, arg_region, arg_start, arg_gpos) do {\ | |
(msa).stack_p = (void* )0;\ | |
(msa).options = (arg_option);\ | |
(msa).region = (arg_region);\ | |
(msa).start = (arg_start);\ | |
(msa).gpos = (arg_gpos);\ | |
(msa).best_len = ONIG_MISMATCH;\ | |
} while(0) | |
#else | |
# define MATCH_ARG_INIT(msa, arg_option, arg_region, arg_start, arg_gpos) do {\ | |
(msa).stack_p = (void* )0;\ | |
(msa).options = (arg_option);\ | |
(msa).region = (arg_region);\ | |
(msa).start = (arg_start);\ | |
(msa).gpos = (arg_gpos);\ | |
} while(0) | |
#endif | |
#ifdef USE_COMBINATION_EXPLOSION_CHECK | |
/* Buffers of at least this many bytes come from xmalloc; smaller ones come
 * from xalloca.  MATCH_ARG_FREE relies on the same threshold to decide whether
 * the buffer has to be freed. */
# define STATE_CHECK_BUFF_MALLOC_THRESHOLD_SIZE 16 | |
/* Sets up (msa).state_check_buff, a bit array of
 * (((str_len) + 1) * (state_num) + 7) >> 3 bytes.  A buffer is only created
 * when state_num > 0, str_len reaches STATE_CHECK_STRING_THRESHOLD_LEN and the
 * size stays below STATE_CHECK_BUFF_MAX_SIZE; otherwise the buffer pointer is
 * NULL and its size 0.  Note that `offset` is overwritten with the byte
 * offset (offset * state_num) >> 3, and only the bytes from that offset to
 * the end are zeroed.  An xmalloc failure leaves the enclosing function
 * through CHECK_NULL_RETURN_MEMERR. */
# define STATE_CHECK_BUFF_INIT(msa, str_len, offset, state_num) do { \ | |
if ((state_num) > 0 && str_len >= STATE_CHECK_STRING_THRESHOLD_LEN) {\ | |
unsigned int size = (unsigned int )(((str_len) + 1) * (state_num) + 7) >> 3;\ | |
offset = ((offset) * (state_num)) >> 3;\ | |
if (size > 0 && offset < size && size < STATE_CHECK_BUFF_MAX_SIZE) {\ | |
if (size >= STATE_CHECK_BUFF_MALLOC_THRESHOLD_SIZE) {\ | |
(msa).state_check_buff = (void* )xmalloc(size);\ | |
CHECK_NULL_RETURN_MEMERR((msa).state_check_buff);\ | |
}\ | |
else \ | |
(msa).state_check_buff = (void* )xalloca(size);\ | |
xmemset(((char* )((msa).state_check_buff)+(offset)), 0, \ | |
(size_t )(size - (offset))); \ | |
(msa).state_check_buff_size = size;\ | |
}\ | |
else {\ | |
(msa).state_check_buff = (void* )0;\ | |
(msa).state_check_buff_size = 0;\ | |
}\ | |
}\ | |
else {\ | |
(msa).state_check_buff = (void* )0;\ | |
(msa).state_check_buff_size = 0;\ | |
}\ | |
} while(0) | |
/* Frees the heap stack of `msa`, if any, and the state-check buffer when its
 * size says it was obtained from xmalloc rather than xalloca. */
# define MATCH_ARG_FREE(msa) do {\ | |
if ((msa).stack_p) xfree((msa).stack_p);\ | |
if ((msa).state_check_buff_size >= STATE_CHECK_BUFF_MALLOC_THRESHOLD_SIZE) { \ | |
if ((msa).state_check_buff) xfree((msa).state_check_buff);\ | |
}\ | |
} while(0) | |
#else /* USE_COMBINATION_EXPLOSION_CHECK */ | |
/* Frees the heap stack of `msa`, if one was saved.  Wrapped in do/while(0),
 * like the USE_COMBINATION_EXPLOSION_CHECK variant, so that the macro behaves
 * as a single statement and cannot capture a following `else`. */
# define MATCH_ARG_FREE(msa) do {\
  if ((msa).stack_p) xfree((msa).stack_p);\
} while(0)
#endif /* USE_COMBINATION_EXPLOSION_CHECK */ | |
/* Largest index-array length (in OnigStackIndex elements) that STACK_INIT
 * still places on the C stack with xalloca. */
#define MAX_PTR_NUM 100

/*
 * Sets up the index array and the backtrack stack of the enclosing function.
 * Uses the locals stk_alloc, stk_base, stk, stk_end and msa.
 *
 *   alloc_addr  receives the index array of `ptr_num` OnigStackIndex values
 *   heap_addr   receives the same address when the array came from xmalloc
 *               (ptr_num > MAX_PTR_NUM), NULL otherwise, so the caller knows
 *               whether it has to be freed
 *   stack_num   number of stack entries to allocate with xalloca when
 *               msa->stack_p holds no saved stack
 *
 * A stack saved in msa->stack_p (with msa->stack_n entries) is reused as is.
 * If the xmalloc for the index array fails, the enclosing function returns
 * ONIGERR_MEMORY via CHECK_NULL_RETURN_MEMERR before anything else has been
 * set up, in the same way STACK_ENSURE returns its error code.
 */
#define STACK_INIT(alloc_addr, heap_addr, ptr_num, stack_num) do {\
  if ((ptr_num) > MAX_PTR_NUM) {\
    alloc_addr = (char* )xmalloc(sizeof(OnigStackIndex) * (ptr_num));\
    CHECK_NULL_RETURN_MEMERR(alloc_addr);\
    heap_addr = alloc_addr;\
    if (msa->stack_p) {\
      stk_alloc = (OnigStackType* )(msa->stack_p);\
      stk_base = stk_alloc;\
      stk = stk_base;\
      stk_end = stk_base + msa->stack_n;\
    } else {\
      stk_alloc = (OnigStackType* )xalloca(sizeof(OnigStackType) * (stack_num));\
      stk_base = stk_alloc;\
      stk = stk_base;\
      stk_end = stk_base + (stack_num);\
    }\
  } else if (msa->stack_p) {\
    alloc_addr = (char* )xalloca(sizeof(OnigStackIndex) * (ptr_num));\
    heap_addr = NULL;\
    stk_alloc = (OnigStackType* )(msa->stack_p);\
    stk_base = stk_alloc;\
    stk = stk_base;\
    stk_end = stk_base + msa->stack_n;\
  }\
  else {\
    alloc_addr = (char* )xalloca(sizeof(OnigStackIndex) * (ptr_num)\
                       + sizeof(OnigStackType) * (stack_num));\
    heap_addr = NULL;\
    stk_alloc = (OnigStackType* )(alloc_addr + sizeof(OnigStackIndex) * (ptr_num));\
    stk_base = stk_alloc;\
    stk = stk_base;\
    stk_end = stk_base + (stack_num);\
  }\
} while(0)
/* Records the current stack in msa (stack_p / stack_n) so that it can be
 * reused or freed later -- but only when stk_base differs from stk_alloc,
 * i.e. when the stack is no longer the block STACK_INIT started with. */
#define STACK_SAVE do{\ | |
if (stk_base != stk_alloc) {\ | |
msa->stack_p = stk_base;\ | |
msa->stack_n = stk_end - stk_base; /* TODO: check overflow */\ | |
};\ | |
} while(0) | |
/* Upper bound, in stack entries, applied by stack_double() when it grows a
 * heap stack; 0 disables the limit. */
static unsigned int MatchStackLimitSize = DEFAULT_MATCH_STACK_LIMIT_SIZE;

/* Returns the current match stack limit. */
extern unsigned int
onig_get_match_stack_limit_size(void)
{
  unsigned int current = MatchStackLimitSize;

  return current;
}
extern int | |
onig_set_match_stack_limit_size(unsigned int size) | |
{ | |
MatchStackLimitSize = size; | |
return 0; | |
} | |
static int | |
stack_double(OnigStackType** arg_stk_base, OnigStackType** arg_stk_end, | |
OnigStackType** arg_stk, OnigStackType* stk_alloc, OnigMatchArg* msa) | |
{ | |
size_t n; | |
OnigStackType *x, *stk_base, *stk_end, *stk; | |
stk_base = *arg_stk_base; | |
stk_end = *arg_stk_end; | |
stk = *arg_stk; | |
n = stk_end - stk_base; | |
if (stk_base == stk_alloc && IS_NULL(msa->stack_p)) { | |
x = (OnigStackType* )xmalloc(sizeof(OnigStackType) * n * 2); | |
if (IS_NULL(x)) { | |
STACK_SAVE; | |
return ONIGERR_MEMORY; | |
} | |
xmemcpy(x, stk_base, n * sizeof(OnigStackType)); | |
n *= 2; | |
} | |
else { | |
unsigned int limit_size = MatchStackLimitSize; | |
n *= 2; | |
if (limit_size != 0 && n > limit_size) { | |
if ((unsigned int )(stk_end - stk_base) == limit_size) | |
return ONIGERR_MATCH_STACK_LIMIT_OVER; | |
else | |
n = limit_size; | |
} | |
x = (OnigStackType* )xrealloc(stk_base, sizeof(OnigStackType) * n); | |
if (IS_NULL(x)) { | |
STACK_SAVE; | |
return ONIGERR_MEMORY; | |
} | |
} | |
*arg_stk = x + (stk - stk_base); | |
*arg_stk_base = x; | |
*arg_stk_end = x + n; | |
return 0; | |
} | |
/* Makes sure at least `n` free entries remain above stk.  When fewer remain,
 * the stack is grown with stack_double(); if that fails, the current stack is
 * recorded with STACK_SAVE, xmalloc_base is freed when set, and the enclosing
 * function returns the error code. */
#define STACK_ENSURE(n) do {\ | |
if (stk_end - stk < (n)) {\ | |
int r = stack_double(&stk_base, &stk_end, &stk, stk_alloc, msa);\ | |
if (r != 0) {\ | |
STACK_SAVE;\ | |
if (xmalloc_base) xfree(xmalloc_base);\ | |
return r;\ | |
}\ | |
}\ | |
} while(0) | |
/* Conversions between a stack index and an entry pointer, both relative to
 * the current stk_base. */
#define STACK_AT(index) (stk_base + (index)) | |
#define GET_STACK_INDEX(stk) ((stk) - stk_base) | |
/* Pushes an entry that carries nothing but its type.  STACK_INC is defined
 * outside this excerpt (presumably it advances stk -- confirm). */
#define STACK_PUSH_TYPE(stack_type) do {\ | |
STACK_ENSURE(1);\ | |
stk->type = (stack_type);\ | |
STACK_INC;\ | |
} while(0) | |
/* True for entries whose type has any bit of STK_MASK_TO_VOID_TARGET set;
 * STACK_POS_END and STACK_STOP_BT_END turn such entries into STK_VOID. */
#define IS_TO_VOID_TARGET(stk) (((stk)->type & STK_MASK_TO_VOID_TARGET) != 0) | |
#ifdef USE_COMBINATION_EXPLOSION_CHECK | |
/* Bit index in state_check_buff for string position `s` and check number
 * `snum` (check numbers start at 1). */
# define STATE_CHECK_POS(s,snum) \ | |
(((s) - str) * num_comb_exp_check + ((snum) - 1)) | |
/* Reads that bit into `v`; yields 0 when there is no buffer.  Note that the
 * position used is the enclosing scope's `s`; the macro has no `s` parameter. */
# define STATE_CHECK_VAL(v,snum) do {\ | |
if (state_check_buff != NULL) {\ | |
ptrdiff_t x = STATE_CHECK_POS(s,snum);\ | |
(v) = state_check_buff[x/8] & (1<<(x%8));\ | |
}\ | |
else (v) = 0;\ | |
} while(0) | |
/* Extra `else if` arm for the pop loops: when the popped entry is a
 * STK_STATE_CHECK_MARK, its bit is set in state_check_buff. */
# define ELSE_IF_STATE_CHECK_MARK(stk) \ | |
else if ((stk)->type == STK_STATE_CHECK_MARK) { \ | |
ptrdiff_t x = STATE_CHECK_POS(stk->u.state.pstr, stk->u.state.state_check);\ | |
state_check_buff[x/8] |= (1<<(x%8)); \ | |
} | |
/* Pushes a state entry (pattern position, string position, previous string
 * position, keep position) with state_check cleared. */
# define STACK_PUSH(stack_type,pat,s,sprev,keep) do {\ | |
STACK_ENSURE(1);\ | |
stk->type = (stack_type);\ | |
stk->u.state.pcode = (pat);\ | |
stk->u.state.pstr = (s);\ | |
stk->u.state.pstr_prev = (sprev);\ | |
stk->u.state.state_check = 0;\ | |
stk->u.state.pkeep = (keep);\ | |
STACK_INC;\ | |
} while(0) | |
/* Like STACK_PUSH but without STACK_ENSURE and without the string fields:
 * the caller must already have reserved the entry. */
# define STACK_PUSH_ENSURED(stack_type,pat) do {\ | |
stk->type = (stack_type);\ | |
stk->u.state.pcode = (pat);\ | |
stk->u.state.state_check = 0;\ | |
STACK_INC;\ | |
} while(0) | |
/* Pushes a STK_ALT entry whose state_check is `snum` when a state-check
 * buffer exists and 0 otherwise. */
# define STACK_PUSH_ALT_WITH_STATE_CHECK(pat,s,sprev,snum,keep) do {\ | |
STACK_ENSURE(1);\ | |
stk->type = STK_ALT;\ | |
stk->u.state.pcode = (pat);\ | |
stk->u.state.pstr = (s);\ | |
stk->u.state.pstr_prev = (sprev);\ | |
stk->u.state.state_check = ((state_check_buff != NULL) ? (snum) : 0);\ | |
stk->u.state.pkeep = (keep);\ | |
STACK_INC;\ | |
} while(0) | |
/* Pushes a STK_STATE_CHECK_MARK for (s, snum); does nothing without a
 * state-check buffer. */
# define STACK_PUSH_STATE_CHECK(s,snum) do {\ | |
if (state_check_buff != NULL) {\ | |
STACK_ENSURE(1);\ | |
stk->type = STK_STATE_CHECK_MARK;\ | |
stk->u.state.pstr = (s);\ | |
stk->u.state.state_check = (snum);\ | |
STACK_INC;\ | |
}\ | |
} while(0) | |
#else /* USE_COMBINATION_EXPLOSION_CHECK */ | |
/* Without the combination-explosion check the extra pop arm expands to
 * nothing and the push macros carry no state_check field. */
# define ELSE_IF_STATE_CHECK_MARK(stk) | |
# define STACK_PUSH(stack_type,pat,s,sprev,keep) do {\ | |
STACK_ENSURE(1);\ | |
stk->type = (stack_type);\ | |
stk->u.state.pcode = (pat);\ | |
stk->u.state.pstr = (s);\ | |
stk->u.state.pstr_prev = (sprev);\ | |
stk->u.state.pkeep = (keep);\ | |
STACK_INC;\ | |
} while(0) | |
# define STACK_PUSH_ENSURED(stack_type,pat) do {\ | |
stk->type = (stack_type);\ | |
stk->u.state.pcode = (pat);\ | |
STACK_INC;\ | |
} while(0) | |
#endif /* USE_COMBINATION_EXPLOSION_CHECK */ | |
/* Shorthands that push one specific entry type through STACK_PUSH or
 * STACK_PUSH_TYPE.  STACK_PUSH_POS stores NULL_UCHARP as pattern position. */
#define STACK_PUSH_ALT(pat,s,sprev,keep) STACK_PUSH(STK_ALT,pat,s,sprev,keep) | |
#define STACK_PUSH_POS(s,sprev,keep) STACK_PUSH(STK_POS,NULL_UCHARP,s,sprev,keep) | |
#define STACK_PUSH_POS_NOT(pat,s,sprev,keep) STACK_PUSH(STK_POS_NOT,pat,s,sprev,keep) | |
#define STACK_PUSH_ABSENT STACK_PUSH_TYPE(STK_ABSENT) | |
#define STACK_PUSH_STOP_BT STACK_PUSH_TYPE(STK_STOP_BT) | |
#define STACK_PUSH_LOOK_BEHIND_NOT(pat,s,sprev,keep) \ | |
STACK_PUSH(STK_LOOK_BEHIND_NOT,pat,s,sprev,keep) | |
/* Pushes a STK_REPEAT entry for repeat `id` with pattern position `pat` and
 * a count of 0. */
#define STACK_PUSH_REPEAT(id, pat) do {\ | |
STACK_ENSURE(1);\ | |
stk->type = STK_REPEAT;\ | |
stk->u.repeat.num = (id);\ | |
stk->u.repeat.pcode = (pat);\ | |
stk->u.repeat.count = 0;\ | |
STACK_INC;\ | |
} while(0) | |
/* Pushes a STK_REPEAT_INC entry holding the stack index `sindex` of a
 * STK_REPEAT entry; the pop macros decrement that entry's count when they
 * unwind past this marker. */
#define STACK_PUSH_REPEAT_INC(sindex) do {\ | |
STACK_ENSURE(1);\ | |
stk->type = STK_REPEAT_INC;\ | |
stk->u.repeat_inc.si = (sindex);\ | |
STACK_INC;\ | |
} while(0) | |
/* Pushes a STK_MEM_START entry for group `mnum` at string position `s`.  The
 * previous mem_start_stk/mem_end_stk values are saved in the entry so that a
 * pop can restore them; afterwards mem_start_stk[mnum] is this entry's index
 * and mem_end_stk[mnum] is INVALID_STACK_INDEX. */
#define STACK_PUSH_MEM_START(mnum, s) do {\ | |
STACK_ENSURE(1);\ | |
stk->type = STK_MEM_START;\ | |
stk->u.mem.num = (mnum);\ | |
stk->u.mem.pstr = (s);\ | |
stk->u.mem.start = mem_start_stk[mnum];\ | |
stk->u.mem.end = mem_end_stk[mnum];\ | |
mem_start_stk[mnum] = GET_STACK_INDEX(stk);\ | |
mem_end_stk[mnum] = INVALID_STACK_INDEX;\ | |
STACK_INC;\ | |
} while(0) | |
/* Pushes a STK_MEM_END entry for group `mnum`, saving the previous
 * mem_start_stk/mem_end_stk values, and records its index in
 * mem_end_stk[mnum]. */
#define STACK_PUSH_MEM_END(mnum, s) do {\ | |
STACK_ENSURE(1);\ | |
stk->type = STK_MEM_END;\ | |
stk->u.mem.num = (mnum);\ | |
stk->u.mem.pstr = (s);\ | |
stk->u.mem.start = mem_start_stk[mnum];\ | |
stk->u.mem.end = mem_end_stk[mnum];\ | |
mem_end_stk[mnum] = GET_STACK_INDEX(stk);\ | |
STACK_INC;\ | |
} while(0) | |
/* Pushes a STK_MEM_END_MARK that carries only the group number. */
#define STACK_PUSH_MEM_END_MARK(mnum) do {\ | |
STACK_ENSURE(1);\ | |
stk->type = STK_MEM_END_MARK;\ | |
stk->u.mem.num = (mnum);\ | |
STACK_INC;\ | |
} while(0) | |
/* Walks down from the stack top looking for the STK_MEM_START entry of group
 * `mnum` that is not paired with a MEM_END / MEM_END_MARK entry seen on the
 * way (tracked by `level`).  `k` is left on that entry, or on stk_base when
 * the walk runs out of entries. */
#define STACK_GET_MEM_START(mnum, k) do {\ | |
int level = 0;\ | |
k = stk;\ | |
while (k > stk_base) {\ | |
k--;\ | |
if ((k->type & STK_MASK_MEM_END_OR_MARK) != 0 \ | |
&& k->u.mem.num == (mnum)) {\ | |
level++;\ | |
}\ | |
else if (k->type == STK_MEM_START && k->u.mem.num == (mnum)) {\ | |
if (level == 0) break;\ | |
level--;\ | |
}\ | |
}\ | |
} while(0) | |
/* Walks up from `k` towards the stack top.  `start` receives the string
 * position of the first outermost STK_MEM_START of group `mnum`, `end` that
 * of the STK_MEM_END which brings the nesting level back to zero.  If no
 * such end is found before stk, `end` is left unchanged. */
#define STACK_GET_MEM_RANGE(k, mnum, start, end) do {\ | |
int level = 0;\ | |
while (k < stk) {\ | |
if (k->type == STK_MEM_START && k->u.mem.num == (mnum)) {\ | |
if (level == 0) (start) = k->u.mem.pstr;\ | |
level++;\ | |
}\ | |
else if (k->type == STK_MEM_END && k->u.mem.num == (mnum)) {\ | |
level--;\ | |
if (level == 0) {\ | |
(end) = k->u.mem.pstr;\ | |
break;\ | |
}\ | |
}\ | |
k++;\ | |
}\ | |
} while(0) | |
/* Pushes a STK_NULL_CHECK_START entry for check `cnum`, remembering the
 * string position `s` at which the checked body started. */
#define STACK_PUSH_NULL_CHECK_START(cnum, s) do {\ | |
STACK_ENSURE(1);\ | |
stk->type = STK_NULL_CHECK_START;\ | |
stk->u.null_check.num = (cnum);\ | |
stk->u.null_check.pstr = (s);\ | |
STACK_INC;\ | |
} while(0) | |
/* Pushes a STK_NULL_CHECK_END entry for check `cnum` (no position stored). */
#define STACK_PUSH_NULL_CHECK_END(cnum) do {\ | |
STACK_ENSURE(1);\ | |
stk->type = STK_NULL_CHECK_END;\ | |
stk->u.null_check.num = (cnum);\ | |
STACK_INC;\ | |
} while(0) | |
/* Pushes a STK_CALL_FRAME entry holding the return address `pat`. */
#define STACK_PUSH_CALL_FRAME(pat) do {\ | |
STACK_ENSURE(1);\ | |
stk->type = STK_CALL_FRAME;\ | |
stk->u.call_frame.ret_addr = (pat);\ | |
STACK_INC;\ | |
} while(0) | |
/* Pushes a STK_RETURN marker; STACK_RETURN and STACK_GET_REPEAT count these
 * against STK_CALL_FRAME entries. */
#define STACK_PUSH_RETURN do {\ | |
STACK_ENSURE(1);\ | |
stk->type = STK_RETURN;\ | |
STACK_INC;\ | |
} while(0) | |
/* Pushes a STK_ABSENT_POS entry holding the two string positions `start` and
 * `end`; STACK_POP_ABSENT_POS reads them back. */
#define STACK_PUSH_ABSENT_POS(start, end) do {\ | |
STACK_ENSURE(1);\ | |
stk->type = STK_ABSENT_POS;\ | |
stk->u.absent_pos.abs_pstr = (start);\ | |
stk->u.absent_pos.end_pstr = (end);\ | |
STACK_INC;\ | |
} while(0) | |
/* Debug-only underflow guard for the stack walks below: when `p` has dropped
 * below stk_base, the location string `at` is printed to stderr and control
 * jumps to the stack_error label of the enclosing function.  Expands to
 * nothing unless ONIG_DEBUG is defined. */
#ifdef ONIG_DEBUG | |
# define STACK_BASE_CHECK(p, at) \ | |
if ((p) < stk_base) {\ | |
fprintf(stderr, "at %s\n", at);\ | |
goto stack_error;\ | |
} | |
#else | |
# define STACK_BASE_CHECK(p, at) | |
#endif | |
/* Drops exactly one entry without looking at it. */
#define STACK_POP_ONE do {\ | |
stk--;\ | |
STACK_BASE_CHECK(stk, "STACK_POP_ONE"); \ | |
} while(0) | |
/* Unwinds the stack until an entry with a non-zero low type byte
 * (STK_MASK_POP_USED) is on top, leaving stk pointing at it.  How much state
 * is restored from the skipped entries depends on pop_level:
 *   STACK_POP_LEVEL_FREE       nothing is restored
 *   STACK_POP_LEVEL_MEM_START  mem_start_stk/mem_end_stk from STK_MEM_START
 *   otherwise                  additionally from STK_MEM_END, and the count
 *                              of the referenced repeat entry is decremented
 *                              for each STK_REPEAT_INC
 * In every case ELSE_IF_STATE_CHECK_MARK handles state-check marks. */
#define STACK_POP do {\ | |
switch (pop_level) {\ | |
case STACK_POP_LEVEL_FREE:\ | |
while (1) {\ | |
stk--;\ | |
STACK_BASE_CHECK(stk, "STACK_POP"); \ | |
if ((stk->type & STK_MASK_POP_USED) != 0) break;\ | |
ELSE_IF_STATE_CHECK_MARK(stk);\ | |
}\ | |
break;\ | |
case STACK_POP_LEVEL_MEM_START:\ | |
while (1) {\ | |
stk--;\ | |
STACK_BASE_CHECK(stk, "STACK_POP 2"); \ | |
if ((stk->type & STK_MASK_POP_USED) != 0) break;\ | |
else if (stk->type == STK_MEM_START) {\ | |
mem_start_stk[stk->u.mem.num] = stk->u.mem.start;\ | |
mem_end_stk[stk->u.mem.num] = stk->u.mem.end;\ | |
}\ | |
ELSE_IF_STATE_CHECK_MARK(stk);\ | |
}\ | |
break;\ | |
default:\ | |
while (1) {\ | |
stk--;\ | |
STACK_BASE_CHECK(stk, "STACK_POP 3"); \ | |
if ((stk->type & STK_MASK_POP_USED) != 0) break;\ | |
else if (stk->type == STK_MEM_START) {\ | |
mem_start_stk[stk->u.mem.num] = stk->u.mem.start;\ | |
mem_end_stk[stk->u.mem.num] = stk->u.mem.end;\ | |
}\ | |
else if (stk->type == STK_REPEAT_INC) {\ | |
STACK_AT(stk->u.repeat_inc.si)->u.repeat.count--;\ | |
}\ | |
else if (stk->type == STK_MEM_END) {\ | |
mem_start_stk[stk->u.mem.num] = stk->u.mem.start;\ | |
mem_end_stk[stk->u.mem.num] = stk->u.mem.end;\ | |
}\ | |
ELSE_IF_STATE_CHECK_MARK(stk);\ | |
}\ | |
break;\ | |
}\ | |
} while(0) | |
/* The three STACK_POP_TIL_* macros unwind the stack until an entry of one
 * specific type is on top (STK_POS_NOT, STK_LOOK_BEHIND_NOT or STK_ABSENT).
 * For every skipped entry they restore mem_start_stk/mem_end_stk from
 * STK_MEM_START and STK_MEM_END entries, decrement the referenced repeat
 * count for STK_REPEAT_INC, and apply ELSE_IF_STATE_CHECK_MARK. */
#define STACK_POP_TIL_POS_NOT do {\ | |
while (1) {\ | |
stk--;\ | |
STACK_BASE_CHECK(stk, "STACK_POP_TIL_POS_NOT"); \ | |
if (stk->type == STK_POS_NOT) break;\ | |
else if (stk->type == STK_MEM_START) {\ | |
mem_start_stk[stk->u.mem.num] = stk->u.mem.start;\ | |
mem_end_stk[stk->u.mem.num] = stk->u.mem.end;\ | |
}\ | |
else if (stk->type == STK_REPEAT_INC) {\ | |
STACK_AT(stk->u.repeat_inc.si)->u.repeat.count--;\ | |
}\ | |
else if (stk->type == STK_MEM_END) {\ | |
mem_start_stk[stk->u.mem.num] = stk->u.mem.start;\ | |
mem_end_stk[stk->u.mem.num] = stk->u.mem.end;\ | |
}\ | |
ELSE_IF_STATE_CHECK_MARK(stk);\ | |
}\ | |
} while(0) | |
#define STACK_POP_TIL_LOOK_BEHIND_NOT do {\ | |
while (1) {\ | |
stk--;\ | |
STACK_BASE_CHECK(stk, "STACK_POP_TIL_LOOK_BEHIND_NOT"); \ | |
if (stk->type == STK_LOOK_BEHIND_NOT) break;\ | |
else if (stk->type == STK_MEM_START) {\ | |
mem_start_stk[stk->u.mem.num] = stk->u.mem.start;\ | |
mem_end_stk[stk->u.mem.num] = stk->u.mem.end;\ | |
}\ | |
else if (stk->type == STK_REPEAT_INC) {\ | |
STACK_AT(stk->u.repeat_inc.si)->u.repeat.count--;\ | |
}\ | |
else if (stk->type == STK_MEM_END) {\ | |
mem_start_stk[stk->u.mem.num] = stk->u.mem.start;\ | |
mem_end_stk[stk->u.mem.num] = stk->u.mem.end;\ | |
}\ | |
ELSE_IF_STATE_CHECK_MARK(stk);\ | |
}\ | |
} while(0) | |
#define STACK_POP_TIL_ABSENT do {\ | |
while (1) {\ | |
stk--;\ | |
STACK_BASE_CHECK(stk, "STACK_POP_TIL_ABSENT"); \ | |
if (stk->type == STK_ABSENT) break;\ | |
else if (stk->type == STK_MEM_START) {\ | |
mem_start_stk[stk->u.mem.num] = stk->u.mem.start;\ | |
mem_end_stk[stk->u.mem.num] = stk->u.mem.end;\ | |
}\ | |
else if (stk->type == STK_REPEAT_INC) {\ | |
STACK_AT(stk->u.repeat_inc.si)->u.repeat.count--;\ | |
}\ | |
else if (stk->type == STK_MEM_END) {\ | |
mem_start_stk[stk->u.mem.num] = stk->u.mem.start;\ | |
mem_end_stk[stk->u.mem.num] = stk->u.mem.end;\ | |
}\ | |
ELSE_IF_STATE_CHECK_MARK(stk);\ | |
}\ | |
} while(0) | |
/* Pops one entry and reads its absent_pos fields into `start` and `end`.
 * The entry type is not checked, so the top entry is presumably expected to
 * be a STK_ABSENT_POS -- confirm at the call sites. */
#define STACK_POP_ABSENT_POS(start, end) do {\ | |
stk--;\ | |
STACK_BASE_CHECK(stk, "STACK_POP_ABSENT_POS"); \ | |
(start) = stk->u.absent_pos.abs_pstr;\ | |
(end) = stk->u.absent_pos.end_pstr;\ | |
} while(0) | |
/* Walks down from the stack top without moving stk.  Every entry matching
 * IS_TO_VOID_TARGET is overwritten with STK_VOID, and the walk ends at the
 * first STK_POS entry, which is voided as well.  `k` is left on that entry. */
#define STACK_POS_END(k) do {\ | |
k = stk;\ | |
while (1) {\ | |
k--;\ | |
STACK_BASE_CHECK(k, "STACK_POS_END"); \ | |
if (IS_TO_VOID_TARGET(k)) {\ | |
k->type = STK_VOID;\ | |
}\ | |
else if (k->type == STK_POS) {\ | |
k->type = STK_VOID;\ | |
break;\ | |
}\ | |
}\ | |
} while(0) | |
/* Same walk as STACK_POS_END, but it ends at the first STK_STOP_BT entry and
 * uses a local cursor instead of a caller-supplied one. */
#define STACK_STOP_BT_END do {\ | |
OnigStackType *k = stk;\ | |
while (1) {\ | |
k--;\ | |
STACK_BASE_CHECK(k, "STACK_STOP_BT_END"); \ | |
if (IS_TO_VOID_TARGET(k)) {\ | |
k->type = STK_VOID;\ | |
}\ | |
else if (k->type == STK_STOP_BT) {\ | |
k->type = STK_VOID;\ | |
break;\ | |
}\ | |
}\ | |
} while(0) | |
/* Finds the nearest STK_NULL_CHECK_START entry for check `id` below the stack
 * top and sets `isnull` to whether the string position recorded there equals
 * `s`. */
#define STACK_NULL_CHECK(isnull,id,s) do {\ | |
OnigStackType* k = stk;\ | |
while (1) {\ | |
k--;\ | |
STACK_BASE_CHECK(k, "STACK_NULL_CHECK"); \ | |
if (k->type == STK_NULL_CHECK_START) {\ | |
if (k->u.null_check.num == (id)) {\ | |
(isnull) = (k->u.null_check.pstr == (s));\ | |
break;\ | |
}\ | |
}\ | |
}\ | |
} while(0) | |
/* Variant for recursive calls: STK_NULL_CHECK_END entries met on the way
 * down raise `level`, and START entries for `id` are skipped (lowering
 * `level`) until the level is back at zero.
 * NOTE(review): `level` is raised for a NULL_CHECK_END of any id here, while
 * STACK_NULL_CHECK_MEMST_REC only counts ends whose num equals `id` --
 * confirm whether the difference is intended. */
#define STACK_NULL_CHECK_REC(isnull,id,s) do {\ | |
int level = 0;\ | |
OnigStackType* k = stk;\ | |
while (1) {\ | |
k--;\ | |
STACK_BASE_CHECK(k, "STACK_NULL_CHECK_REC"); \ | |
if (k->type == STK_NULL_CHECK_START) {\ | |
if (k->u.null_check.num == (id)) {\ | |
if (level == 0) {\ | |
(isnull) = (k->u.null_check.pstr == (s));\ | |
break;\ | |
}\ | |
else level--;\ | |
}\ | |
}\ | |
else if (k->type == STK_NULL_CHECK_END) {\ | |
level++;\ | |
}\ | |
}\ | |
} while(0) | |
/* Null check that also looks at capture state.  After locating the
 * STK_NULL_CHECK_START entry for `id`:
 *   - if its recorded position differs from `s`, isnull = 0;
 *   - otherwise isnull starts at 1 and every STK_MEM_START entry between
 *     that point and the stack top is examined: an unset end
 *     (INVALID_STACK_INDEX) or a start position different from the end
 *     position gives isnull = 0; an empty capture whose end differs from `s`
 *     gives isnull = -1.
 * The end position is read through the stack when the group's bit is set in
 * reg->bt_mem_end; otherwise u.mem.end itself is used as the pointer. */
#define STACK_NULL_CHECK_MEMST(isnull,id,s,reg) do {\ | |
OnigStackType* k = stk;\ | |
while (1) {\ | |
k--;\ | |
STACK_BASE_CHECK(k, "STACK_NULL_CHECK_MEMST"); \ | |
if (k->type == STK_NULL_CHECK_START) {\ | |
if (k->u.null_check.num == (id)) {\ | |
if (k->u.null_check.pstr != (s)) {\ | |
(isnull) = 0;\ | |
break;\ | |
}\ | |
else {\ | |
UChar* endp;\ | |
(isnull) = 1;\ | |
while (k < stk) {\ | |
if (k->type == STK_MEM_START) {\ | |
if (k->u.mem.end == INVALID_STACK_INDEX) {\ | |
(isnull) = 0; break;\ | |
}\ | |
if (BIT_STATUS_AT(reg->bt_mem_end, k->u.mem.num))\ | |
endp = STACK_AT(k->u.mem.end)->u.mem.pstr;\ | |
else\ | |
endp = (UChar* )k->u.mem.end;\ | |
if (STACK_AT(k->u.mem.start)->u.mem.pstr != endp) {\ | |
(isnull) = 0; break;\ | |
}\ | |
else if (endp != s) {\ | |
(isnull) = -1; /* empty, but position changed */ \ | |
}\ | |
}\ | |
k++;\ | |
}\ | |
break;\ | |
}\ | |
}\ | |
}\ | |
}\ | |
} while(0) | |
/* Recursive-call variant of STACK_NULL_CHECK_MEMST: STK_NULL_CHECK_END
 * entries for `id` raise `level`, and START entries for `id` are skipped
 * (lowering `level`) until the level is zero; the capture examination is the
 * same as above. */
#define STACK_NULL_CHECK_MEMST_REC(isnull,id,s,reg) do {\ | |
int level = 0;\ | |
OnigStackType* k = stk;\ | |
while (1) {\ | |
k--;\ | |
STACK_BASE_CHECK(k, "STACK_NULL_CHECK_MEMST_REC"); \ | |
if (k->type == STK_NULL_CHECK_START) {\ | |
if (k->u.null_check.num == (id)) {\ | |
if (level == 0) {\ | |
if (k->u.null_check.pstr != (s)) {\ | |
(isnull) = 0;\ | |
break;\ | |
}\ | |
else {\ | |
UChar* endp;\ | |
(isnull) = 1;\ | |
while (k < stk) {\ | |
if (k->type == STK_MEM_START) {\ | |
if (k->u.mem.end == INVALID_STACK_INDEX) {\ | |
(isnull) = 0; break;\ | |
}\ | |
if (BIT_STATUS_AT(reg->bt_mem_end, k->u.mem.num))\ | |
endp = STACK_AT(k->u.mem.end)->u.mem.pstr;\ | |
else\ | |
endp = (UChar* )k->u.mem.end;\ | |
if (STACK_AT(k->u.mem.start)->u.mem.pstr != endp) {\ | |
(isnull) = 0; break;\ | |
}\ | |
else if (endp != s) {\ | |
(isnull) = -1; /* empty, but position changed */ \ | |
}\ | |
}\ | |
k++;\ | |
}\ | |
break;\ | |
}\ | |
}\ | |
else {\ | |
level--;\ | |
}\ | |
}\ | |
}\ | |
else if (k->type == STK_NULL_CHECK_END) {\ | |
if (k->u.null_check.num == (id)) level++;\ | |
}\ | |
}\ | |
} while(0) | |
/* Walks down from the stack top and leaves `k` on the STK_REPEAT entry for
 * repeat `id` that is found while `level` is zero.  STK_RETURN entries raise
 * the level and STK_CALL_FRAME entries lower it, so repeat entries seen at a
 * non-zero level are ignored. */
#define STACK_GET_REPEAT(id, k) do {\ | |
int level = 0;\ | |
k = stk;\ | |
while (1) {\ | |
k--;\ | |
STACK_BASE_CHECK(k, "STACK_GET_REPEAT"); \ | |
if (k->type == STK_REPEAT) {\ | |
if (level == 0) {\ | |
if (k->u.repeat.num == (id)) {\ | |
break;\ | |
}\ | |
}\ | |
}\ | |
else if (k->type == STK_CALL_FRAME) level--;\ | |
else if (k->type == STK_RETURN) level++;\ | |
}\ | |
} while(0) | |
/* Finds the STK_CALL_FRAME entry that matches the current call depth
 * (STK_RETURN entries met on the way down each cancel one call frame) and
 * stores its return address in `addr`.  The stack itself is not changed. */
#define STACK_RETURN(addr) do {\ | |
int level = 0;\ | |
OnigStackType* k = stk;\ | |
while (1) {\ | |
k--;\ | |
STACK_BASE_CHECK(k, "STACK_RETURN"); \ | |
if (k->type == STK_CALL_FRAME) {\ | |
if (level == 0) {\ | |
(addr) = k->u.call_frame.ret_addr;\ | |
break;\ | |
}\ | |
else level--;\ | |
}\ | |
else if (k->type == STK_RETURN)\ | |
level++;\ | |
}\ | |
} while(0) | |
/* Compares `len` bytes at s1 and s2 and jumps to the `fail` label on the
 * first difference.  All three arguments are modified: both pointers are
 * advanced and `len` is counted down. */
#define STRING_CMP(s1,s2,len) do {\ | |
while (len-- > 0) {\ | |
if (*s1++ != *s2++) goto fail;\ | |
}\ | |
} while(0) | |
/* Case-insensitive counterpart: jumps to `fail` when string_cmp_ic() returns
 * 0.  Uses the enclosing scope's `encode`; `ps2` is a pointer to the second
 * string pointer. */
#define STRING_CMP_IC(case_fold_flag,s1,ps2,len,text_end) do {\ | |
if (string_cmp_ic(encode, case_fold_flag, s1, ps2, len, text_end) == 0) \ | |
goto fail; \ | |
} while(0) | |
/*
 * Case-insensitive comparison of the `mblen` bytes starting at `s1` with the
 * text at *ps2.  Both sides are case-folded one character at a time with
 * ONIGENC_MBC_CASE_FOLD (bounded by `text_end`) and the folded byte
 * sequences are compared.
 *
 * Returns 1 when everything matched, in which case *ps2 is advanced past the
 * compared text; returns 0 on the first mismatch, leaving *ps2 unchanged.
 */
static int string_cmp_ic(OnigEncoding enc, int case_fold_flag,
                         UChar* s1, UChar** ps2, OnigDistance mblen, const UChar* text_end)
{
  UChar folded1[ONIGENC_MBC_CASE_FOLD_MAXLEN];
  UChar folded2[ONIGENC_MBC_CASE_FOLD_MAXLEN];
  UChar *s2 = *ps2;
  UChar *stop = s1 + mblen;
  int n1, n2, i;

  while (s1 < stop) {
    n1 = ONIGENC_MBC_CASE_FOLD(enc, case_fold_flag, &s1, text_end, folded1);
    n2 = ONIGENC_MBC_CASE_FOLD(enc, case_fold_flag, &s2, text_end, folded2);
    if (n1 != n2) return 0;

    for (i = 0; i < n1; i++) {
      if (folded1[i] != folded2[i]) return 0;
    }
  }

  *ps2 = s2;
  return 1;
}
/* Like STRING_CMP, but instead of jumping it reports the outcome in
 * `is_fail` (1 on the first differing byte, 0 otherwise).  The pointers and
 * `len` are modified. */
#define STRING_CMP_VALUE(s1,s2,len,is_fail) do {\ | |
is_fail = 0;\ | |
while (len-- > 0) {\ | |
if (*s1++ != *s2++) {\ | |
is_fail = 1; break;\ | |
}\ | |
}\ | |
} while(0) | |
/* Like STRING_CMP_IC, but reports the outcome in `is_fail` instead of
 * jumping. */
#define STRING_CMP_VALUE_IC(case_fold_flag,s1,ps2,len,text_end,is_fail) do {\ | |
if (string_cmp_ic(encode, case_fold_flag, s1, ps2, len, text_end) == 0) \ | |
is_fail = 1; \ | |
else \ | |
is_fail = 0; \ | |
} while(0) | |
/* Position tests against the enclosing scope's `str` (subject start) and
 * `end` (subject end). */
#define IS_EMPTY_STR (str == end) | |
#define ON_STR_BEGIN(s) ((s) == str) | |
#define ON_STR_END(s) ((s) == end) | |
/* Bounds checks on the current position `s`.  DATA_ENSURE_CHECK1 and
 * DATA_ENSURE_CHECK(n) are expressions; DATA_ENSURE(n) jumps to `fail` when
 * fewer than `n` bytes are available.  The bound (also exposed as
 * ABSENT_END_POS) is right_range when
 * USE_MATCH_RANGE_MUST_BE_INSIDE_OF_SPECIFIED_RANGE is defined and `end`
 * otherwise.
 * NOTE(review): DATA_ENSURE expands to a bare `if` without braces, so it must
 * not be followed directly by an `else`. */
#ifdef USE_MATCH_RANGE_MUST_BE_INSIDE_OF_SPECIFIED_RANGE | |
# define DATA_ENSURE_CHECK1 (s < right_range) | |
# define DATA_ENSURE_CHECK(n) (s + (n) <= right_range) | |
# define DATA_ENSURE(n) if (s + (n) > right_range) goto fail | |
# define ABSENT_END_POS right_range | |
#else | |
# define DATA_ENSURE_CHECK1 (s < end) | |
# define DATA_ENSURE_CHECK(n) (s + (n) <= end) | |
# define DATA_ENSURE(n) if (s + (n) > end) goto fail | |
# define ABSENT_END_POS end | |
#endif /* USE_MATCH_RANGE_MUST_BE_INSIDE_OF_SPECIFIED_RANGE */ | |
#ifdef USE_CAPTURE_HISTORY | |
static int | |
make_capture_history_tree(OnigCaptureTreeNode* node, OnigStackType** kp, | |
OnigStackType* stk_top, UChar* str, regex_t* reg) | |
{ | |
int n, r; | |
OnigCaptureTreeNode* child; | |
OnigStackType* k = *kp; | |
while (k < stk_top) { | |
if (k->type == STK_MEM_START) { | |
n = k->u.mem.num; | |
if (n <= ONIG_MAX_CAPTURE_HISTORY_GROUP && | |
BIT_STATUS_AT(reg->capture_history, n) != 0) { | |
child = history_node_new(); | |
CHECK_NULL_RETURN_MEMERR(child); | |
child->group = n; | |
child->beg = k->u.mem.pstr - str; | |
r = history_tree_add_child(node, child); | |
if (r != 0) { | |
history_tree_free(child); | |
return r; | |
} | |
*kp = (k + 1); | |
r = make_capture_history_tree(child, kp, stk_top, str, reg); | |
if (r != 0) return r; | |
k = *kp; | |
child->end = k->u.mem.pstr - str; | |
} | |
} | |
else if (k->type == STK_MEM_END) { | |
if (k->u.mem.num == node->group) { | |
node->end = k->u.mem.pstr - str; | |
*kp = k; | |
return 0; | |
} | |
} | |
k++; | |
} | |
return 1; /* 1: root node ending. */ | |
} | |
#endif /* USE_CAPTURE_HISTORY */ | |
#ifdef USE_BACKREF_WITH_LEVEL | |
/* Return 1 if group number `mem` occurs among the `num` MemNumType values
   stored consecutively at memp, 0 otherwise. */
static int mem_is_in_memp(int mem, int num, UChar* memp)
{
  MemNumType entry;
  int remaining;

  for (remaining = num; remaining > 0; remaining--) {
    GET_MEMNUM_INC(entry, memp);
    if ((int )entry == mem) return 1;
  }

  return 0;
}
/*
 * Match a back-reference against a capture recorded at a given nesting
 * level.
 *
 * The stack is walked downward from the entry just below `top` to
 * stk_base.  `level` is lowered at each STK_CALL_FRAME entry and raised at
 * each STK_RETURN entry.  Only entries seen while level == nest are
 * considered: an STK_MEM_END entry for one of the mem_num groups listed at
 * memp records the capture end, and the next such STK_MEM_START entry
 * supplies its start.  That captured text is then compared with the text at
 * *s (case-insensitively via string_cmp_ic() when ignore_case is non-zero),
 * never reading past `send`.
 *
 * Returns 1 and advances *s past the matched text on success; returns 0 if
 * the text differs, is longer than what remains before `send`, or no
 * suitable capture is found.
 */
static int backref_match_at_nested_level(regex_t* reg,
    OnigStackType* top, OnigStackType* stk_base,
    int ignore_case, int case_fold_flag,
    int nest, int mem_num, UChar* memp, UChar** s, const UChar* send)
{
  UChar *cap_beg, *cap_end = NULL_UCHARP;
  UChar *src, *dst;
  OnigStackType* k;
  int level = 0;

  for (k = top - 1; k >= stk_base; k--) {
    if (k->type == STK_CALL_FRAME) {
      level--;
      continue;
    }
    if (k->type == STK_RETURN) {
      level++;
      continue;
    }
    if (level != nest) continue;

    if (k->type == STK_MEM_END) {
      if (mem_is_in_memp(k->u.mem.num, mem_num, memp))
        cap_end = k->u.mem.pstr;
      continue;
    }

    if (k->type != STK_MEM_START) continue;
    if (! mem_is_in_memp(k->u.mem.num, mem_num, memp)) continue;
    if (cap_end == NULL_UCHARP) continue;  /* no end recorded yet */

    cap_beg = k->u.mem.pstr;
    if (cap_end - cap_beg > send - *s) return 0; /* or goto next_mem; */

    dst = *s;
    if (ignore_case != 0) {
      if (! string_cmp_ic(reg->enc, case_fold_flag,
                          cap_beg, &dst, cap_end - cap_beg, send))
        return 0; /* or goto next_mem; */
    }
    else {
      for (src = cap_beg; src < cap_end; src++, dst++) {
        if (*src != *dst) return 0; /* or goto next_mem; */
      }
    }

    *s = dst;
    return 1;
  }

  return 0;
}
#endif /* USE_BACKREF_WITH_LEVEL */ | |
#ifdef ONIG_DEBUG_STATISTICS | |
/* Timer backend for the per-opcode statistics.  Every branch provides the
   `ts` / `te` timestamp variables, GETTIME(t) to sample the clock into t,
   and TIMEDIFF(stop,start) to compute the difference of two samples. */
# if defined(_WIN32)
#  include <windows.h>
static LARGE_INTEGER ts;
static LARGE_INTEGER te;
static LARGE_INTEGER freq;
#  define GETTIME(t)           QueryPerformanceCounter(&(t))
   /* counter difference scaled by 1000000 / freq */
#  define TIMEDIFF(stop,start) \
     (unsigned long )(((stop).QuadPart - (start).QuadPart) * 1000000 / freq.QuadPart)
# else /* _WIN32 */
#  define USE_TIMEOFDAY
#  if defined(USE_TIMEOFDAY)
#   if defined(HAVE_SYS_TIME_H)
#    include <sys/time.h>
#   endif
#   if defined(HAVE_UNISTD_H)
#    include <unistd.h>
#   endif
static struct timeval ts;
static struct timeval te;
#   define GETTIME(t)           gettimeofday(&(t), (struct timezone* )0)
    /* microsecond part plus the seconds part converted to microseconds */
#   define TIMEDIFF(stop,start) \
      (((stop).tv_usec - (start).tv_usec) + (((stop).tv_sec - (start).tv_sec)*1000000))
#  else /* USE_TIMEOFDAY */
#   if defined(HAVE_SYS_TIMES_H)
#    include <sys/times.h>
#   endif
static struct tms ts;
static struct tms te;
#   define GETTIME(t)           times(&(t))
#   define TIMEDIFF(stop,start) ((stop).tms_utime - (start).tms_utime)
#  endif /* USE_TIMEOFDAY */
# endif /* _WIN32 */
static int OpCounter[256]; | |
static int OpPrevCounter[256]; | |
static unsigned long OpTime[256]; | |
static int OpCurr = OP_FINISH; | |
static int OpPrevTarget = OP_FAIL; | |
static int MaxStackDepth = 0; | |
# define MOP_IN(opcode) do {\ | |
if (opcode == OpPrevTarget) OpPrevCounter[OpCurr]++;\ | |
OpCurr = opcode;\ | |
OpCounter[opcode]++;\ | |
GETTIME(ts);\ | |
} while(0) | |
# define MOP_OUT do {\ | |
GETTIME(te);\ | |
OpTime[OpCurr] += TIMEDIFF(te, ts);\ | |
} while(0) | |
extern void | |
onig_statistics_init(void) | |
{ | |
int i; | |
for (i = 0; i < 256; i++) { | |
OpCounter[i] = OpPrevCounter[i] = 0; OpTime[i] = 0; | |
} | |
MaxStackDepth = 0; | |
# ifdef _WIN32 | |
QueryPerformanceFrequency(&freq); | |
# endif | |
} | |
extern void | |
onig_print_statistics(FILE* f) | |
{ | |
int i; | |
fprintf(f, " count prev time\n"); | |
for (i = 0; OnigOpInfo[i].opcode >= 0; i++) { | |
fprintf(f, "%8d: %8d: %10lu: %s\n", | |
OpCounter[i], OpPrevCounter[i], OpTime[i], OnigOpInfo[i].name); | |
} | |
fprintf(f, "\nmax stack depth: %d\n", MaxStackDepth); | |
} | |
/* Statistics build: advance the stack pointer and remember the deepest
   stack (stk - stk_base) reached so far. */
# define STACK_INC do {\
  ++stk;\
  if (MaxStackDepth < stk - stk_base) \
    MaxStackDepth = stk - stk_base;\
} while(0)
#else /* ONIG_DEBUG_STATISTICS */ | |
/* Statistics disabled: STACK_INC only advances the stack pointer, and the
   MOP_IN / MOP_OUT profiling hooks expand to nothing. */
# define STACK_INC stk++ | |
# define MOP_IN(opcode) | |
# define MOP_OUT | |
#endif /* ONIG_DEBUG_STATISTICS */ | |
#ifdef ONIG_DEBUG_MATCH | |
static char * | |
stack_type_str(int stack_type) | |
{ | |
switch (stack_type) { | |
case STK_ALT: return "Alt "; | |
case STK_LOOK_BEHIND_NOT: return "LBNot "; | |
case STK_POS_NOT: return "PosNot"; | |
case STK_MEM_START: return "MemS "; | |
case STK_MEM_END: return "MemE "; | |
case STK_REPEAT_INC: return "RepInc"; | |
case STK_STATE_CHECK_MARK: return "StChMk"; | |
case STK_NULL_CHECK_START: return "NulChS"; | |
case STK_NULL_CHECK_END: return "NulChE"; | |
case STK_MEM_END_MARK: return "MemEMk"; | |
case STK_POS: return "Pos "; | |
case STK_STOP_BT: return "StopBt"; | |
case STK_REPEAT: return "Rep "; | |
case STK_CALL_FRAME: return "Call "; | |
case STK_RETURN: return "Ret "; | |
case STK_VOID: return "Void "; | |
case STK_ABSENT_POS: return "AbsPos"; | |
case STK_ABSENT: return "Absent"; | |
default: return " "; | |
} | |
} | |
#endif | |
/* match data(str - end) from position (sstart). */ | |
/* if sstart == str then set sprev to NULL. */ | |
static OnigPosition | |
match_at(regex_t* reg, const UChar* str, const UChar* end, | |
#ifdef USE_MATCH_RANGE_MUST_BE_INSIDE_OF_SPECIFIED_RANGE | |
const UChar* right_range, | |
#endif | |
const UChar* sstart, UChar* sprev, OnigMatchArg* msa) | |
{ | |
static const UChar FinishCode[] = { OP_FINISH }; | |
int i, num_mem, pop_level; | |
ptrdiff_t n, best_len; | |
LengthType tlen, tlen2; | |
MemNumType mem; | |
RelAddrType addr; | |
OnigOptionType option = reg->options; | |
OnigEncoding encode = reg->enc; | |
OnigCaseFoldType case_fold_flag = reg->case_fold_flag; | |
UChar *s, *q, *sbegin; | |
UChar *p = reg->p; | |
UChar *pkeep; | |
char *alloca_base; | |
char *xmalloc_base = NULL; | |
OnigStackType *stk_alloc, *stk_base, *stk, *stk_end; | |
OnigStackType *stkp; /* used as any purpose. */ | |
OnigStackIndex si; | |
OnigStackIndex *repeat_stk; | |
OnigStackIndex *mem_start_stk, *mem_end_stk; | |
#ifdef USE_COMBINATION_EXPLOSION_CHECK | |
int scv; | |
unsigned char* state_check_buff = msa->state_check_buff; | |
int num_comb_exp_check = reg->num_comb_exp_check; | |
#endif | |
#if USE_TOKEN_THREADED_VM | |
# define OP_OFFSET 1 | |
# define VM_LOOP JUMP; | |
# define VM_LOOP_END | |
# define CASE(x) L_##x: sbegin = s; OPCODE_EXEC_HOOK; | |
# define DEFAULT L_DEFAULT: | |
# define NEXT sprev = sbegin; JUMP | |
# define JUMP RB_GNUC_EXTENSION_BLOCK(goto *oplabels[*p++]) | |
RB_GNUC_EXTENSION static const void *oplabels[] = { | |
&&L_OP_FINISH, /* matching process terminator (no more alternative) */ | |
&&L_OP_END, /* pattern code terminator (success end) */ | |
&&L_OP_EXACT1, /* single byte, N = 1 */ | |
&&L_OP_EXACT2, /* single byte, N = 2 */ | |
&&L_OP_EXACT3, /* single byte, N = 3 */ | |
&&L_OP_EXACT4, /* single byte, N = 4 */ | |
&&L_OP_EXACT5, /* single byte, N = 5 */ | |
&&L_OP_EXACTN, /* single byte */ | |
&&L_OP_EXACTMB2N1, /* mb-length = 2 N = 1 */ | |
&&L_OP_EXACTMB2N2, /* mb-length = 2 N = 2 */ | |
&&L_OP_EXACTMB2N3, /* mb-length = 2 N = 3 */ | |
&&L_OP_EXACTMB2N, /* mb-length = 2 */ | |
&&L_OP_EXACTMB3N, /* mb-length = 3 */ | |
&&L_OP_EXACTMBN, /* other length */ | |
&&L_OP_EXACT1_IC, /* single byte, N = 1, ignore case */ | |
&&L_OP_EXACTN_IC, /* single byte, ignore case */ | |
&&L_OP_CCLASS, | |
&&L_OP_CCLASS_MB, | |
&&L_OP_CCLASS_MIX, | |
&&L_OP_CCLASS_NOT, | |
&&L_OP_CCLASS_MB_NOT, | |
&&L_OP_CCLASS_MIX_NOT, | |
&&L_OP_ANYCHAR, /* "." */ | |
&&L_OP_ANYCHAR_ML, /* "." multi-line */ | |
&&L_OP_ANYCHAR_STAR, /* ".*" */ | |
&&L_OP_ANYCHAR_ML_STAR, /* ".*" multi-line */ | |
&&L_OP_ANYCHAR_STAR_PEEK_NEXT, | |
&&L_OP_ANYCHAR_ML_STAR_PEEK_NEXT, | |
&&L_OP_WORD, | |
&&L_OP_NOT_WORD, | |
&&L_OP_WORD_BOUND, | |
&&L_OP_NOT_WORD_BOUND, | |
# ifdef USE_WORD_BEGIN_END | |
&&L_OP_WORD_BEGIN, | |
&&L_OP_WORD_END, | |
# else | |
&&L_DEFAULT, | |
&&L_DEFAULT, | |
# endif | |
&&L_OP_ASCII_WORD, | |
&&L_OP_NOT_ASCII_WORD, | |
&&L_OP_ASCII_WORD_BOUND, | |
&&L_OP_NOT_ASCII_WORD_BOUND, | |
# ifdef USE_WORD_BEGIN_END | |
&&L_OP_ASCII_WORD_BEGIN, | |
&&L_OP_ASCII_WORD_END, | |
# else | |
&&L_DEFAULT, | |
&&L_DEFAULT, | |
# endif | |
&&L_OP_BEGIN_BUF, | |
&&L_OP_END_BUF, | |
&&L_OP_BEGIN_LINE, | |
&&L_OP_END_LINE, | |
&&L_OP_SEMI_END_BUF, | |
&&L_OP_BEGIN_POSITION, | |
&&L_OP_BACKREF1, | |
&&L_OP_BACKREF2, | |
&&L_OP_BACKREFN, | |
&&L_OP_BACKREFN_IC, | |
&&L_OP_BACKREF_MULTI, | |
&&L_OP_BACKREF_MULTI_IC, | |
# ifdef USE_BACKREF_WITH_LEVEL | |
&&L_OP_BACKREF_WITH_LEVEL, /* \k<xxx+n>, \k<xxx-n> */ | |
# else | |
&&L_DEFAULT, | |
# endif | |
&&L_OP_MEMORY_START, | |
&&L_OP_MEMORY_START_PUSH, /* push back-tracker to stack */ | |
&&L_OP_MEMORY_END_PUSH, /* push back-tracker to stack */ | |
# ifdef USE_SUBEXP_CALL | |
&&L_OP_MEMORY_END_PUSH_REC, /* push back-tracker to stack */ | |
# else | |
&&L_DEFAULT, | |
# endif | |
&&L_OP_MEMORY_END, | |
# ifdef USE_SUBEXP_CALL | |
&&L_OP_MEMORY_END_REC, /* push marker to stack */ | |
# else | |
&&L_DEFAULT, | |
# endif | |
&&L_OP_KEEP, | |
&&L_OP_FAIL, /* pop stack and move */ | |
&&L_OP_JUMP, | |
&&L_OP_PUSH, | |
&&L_OP_POP, | |
# ifdef USE_OP_PUSH_OR_JUMP_EXACT | |
&&L_OP_PUSH_OR_JUMP_EXACT1, /* if match exact then push, else jump. */ | |
# else | |
&&L_DEFAULT, | |
# endif | |
&&L_OP_PUSH_IF_PEEK_NEXT, /* if match exact then push, else none. */ | |
&&L_OP_REPEAT, /* {n,m} */ | |
&&L_OP_REPEAT_NG, /* {n,m}? (non greedy) */ | |
&&L_OP_REPEAT_INC, | |
&&L_OP_REPEAT_INC_NG, /* non greedy */ | |
&&L_OP_REPEAT_INC_SG, /* search and get in stack */ | |
&&L_OP_REPEAT_INC_NG_SG, /* search and get in stack (non greedy) */ | |
&&L_OP_NULL_CHECK_START, /* null loop checker start */ | |
&&L_OP_NULL_CHECK_END, /* null loop checker end */ | |
# ifdef USE_MONOMANIAC_CHECK_CAPTURES_IN_ENDLESS_REPEAT | |
&&L_OP_NULL_CHECK_END_MEMST, /* null loop checker end (with capture status) */ | |
# else | |
&&L_DEFAULT, | |
# endif | |
# ifdef USE_SUBEXP_CALL | |
&&L_OP_NULL_CHECK_END_MEMST_PUSH, /* with capture status and push check-end */ | |
# else | |
&&L_DEFAULT, | |
# endif | |
&&L_OP_PUSH_POS, /* (?=...) start */ | |
&&L_OP_POP_POS, /* (?=...) end */ | |
&&L_OP_PUSH_POS_NOT, /* (?!...) start */ | |
&&L_OP_FAIL_POS, /* (?!...) end */ | |
&&L_OP_PUSH_STOP_BT, /* (?>...) start */ | |
&&L_OP_POP_STOP_BT, /* (?>...) end */ | |
&&L_OP_LOOK_BEHIND, /* (?<=...) start (no needs end opcode) */ | |
&&L_OP_PUSH_LOOK_BEHIND_NOT, /* (?<!...) start */ | |
&&L_OP_FAIL_LOOK_BEHIND_NOT, /* (?<!...) end */ | |
&&L_OP_PUSH_ABSENT_POS, /* (?~...) start */ | |
&&L_OP_ABSENT, /* (?~...) start of inner loop */ | |
&&L_OP_ABSENT_END, /* (?~...) end */ | |
# ifdef USE_SUBEXP_CALL | |
&&L_OP_CALL, /* \g<name> */ | |
&&L_OP_RETURN, | |
# else | |
&&L_DEFAULT, | |
&&L_DEFAULT, | |
# endif | |
&&L_OP_CONDITION, | |
# ifdef USE_COMBINATION_EXPLOSION_CHECK | |
&&L_OP_STATE_CHECK_PUSH, /* combination explosion check and push */ | |
&&L_OP_STATE_CHECK_PUSH_OR_JUMP, /* check ok -> push, else jump */ | |
&&L_OP_STATE_CHECK, /* check only */ | |
# else | |
&&L_DEFAULT, | |
&&L_DEFAULT, | |
&&L_DEFAULT, | |
# endif | |
# ifdef USE_COMBINATION_EXPLOSION_CHECK | |
&&L_OP_STATE_CHECK_ANYCHAR_STAR, | |
&&L_OP_STATE_CHECK_ANYCHAR_ML_STAR, | |
# else | |
&&L_DEFAULT, | |
&&L_DEFAULT, | |
# endif | |
/* no need: IS_DYNAMIC_OPTION() == 0 */ | |
# if 0 /* no need: IS_DYNAMIC_OPTION() == 0 */ | |
&&L_OP_SET_OPTION_PUSH, /* set option and push recover option */ | |
&&L_OP_SET_OPTION /* set option */ | |
# else | |
&&L_DEFAULT, | |
&&L_DEFAULT | |
# endif | |
}; | |
#else /* USE_TOKEN_THREADED_VM */ | |
# define OP_OFFSET 0 | |
# define VM_LOOP \ | |
while (1) { \ | |
OPCODE_EXEC_HOOK; \ | |
sbegin = s; \ | |
switch (*p++) { | |
# define VM_LOOP_END } sprev = sbegin; } | |
# define CASE(x) case x: | |
# define DEFAULT default: | |
# define NEXT break | |
# define JUMP continue; break | |
#endif /* USE_TOKEN_THREADED_VM */ | |
#ifdef USE_SUBEXP_CALL | |
/* Stack #0 is used to store the pattern itself and used for (?R), \g<0>, | |
etc. Additional space is required. */ | |
# define ADD_NUMMEM 1 | |
#else | |
/* Stack #0 is not used. */ | |
# define ADD_NUMMEM 0 | |
#endif | |
n = reg->num_repeat + (reg->num_mem + ADD_NUMMEM) * 2; | |
STACK_INIT(alloca_base, xmalloc_base, n, INIT_MATCH_STACK_SIZE); | |
pop_level = reg->stack_pop_level; | |
num_mem = reg->num_mem; | |
repeat_stk = (OnigStackIndex* )alloca_base; | |
mem_start_stk = (OnigStackIndex* )(repeat_stk + reg->num_repeat); | |
mem_end_stk = mem_start_stk + (num_mem + ADD_NUMMEM); | |
{ | |
OnigStackIndex *pp = mem_start_stk; | |
for (; pp < repeat_stk + n; pp += 2) { | |
pp[0] = INVALID_STACK_INDEX; | |
pp[1] = INVALID_STACK_INDEX; | |
} | |
} | |
#ifndef USE_SUBEXP_CALL | |
mem_start_stk--; /* for index start from 1, | |
mem_start_stk[1]..mem_start_stk[num_mem] */ | |
mem_end_stk--; /* for index start from 1, | |
mem_end_stk[1]..mem_end_stk[num_mem] */ | |
#endif | |
#ifdef ONIG_DEBUG_MATCH | |
fprintf(stderr, "match_at: str: %"PRIuPTR" (%p), end: %"PRIuPTR" (%p), start: %"PRIuPTR" (%p), sprev: %"PRIuPTR" (%p)\n", | |
(uintptr_t )str, str, (uintptr_t )end, end, (uintptr_t )sstart, sstart, (uintptr_t )sprev, sprev); | |
fprintf(stderr, "size: %d, start offset: %d\n", | |
(int )(end - str), (int )(sstart - str)); | |
fprintf(stderr, "\n ofs> str stk:type addr:opcode\n"); | |
#endif | |
STACK_PUSH_ENSURED(STK_ALT, (UChar* )FinishCode); /* bottom stack */ | |
best_len = ONIG_MISMATCH; | |
s = (UChar* )sstart; | |
pkeep = (UChar* )sstart; | |
#ifdef ONIG_DEBUG_MATCH | |
# define OPCODE_EXEC_HOOK \ | |
if (s) { \ | |
UChar *op, *q, *bp, buf[50]; \ | |
int len; \ | |
op = p - OP_OFFSET; \ | |
fprintf(stderr, "%4"PRIdPTR"> \"", (*op == OP_FINISH) ? (ptrdiff_t )-1 : s - str); \ | |
bp = buf; \ | |
q = s; \ | |
if (*op != OP_FINISH) { /* s may not be a valid pointer if OP_FINISH. */ \ | |
for (i = 0; i < 7 && q < end; i++) { \ | |
len = enclen(encode, q, end); \ | |
while (len-- > 0) *bp++ = *q++; \ | |
} \ | |
if (q < end) { xmemcpy(bp, "...", 3); bp += 3; } \ | |
} \ | |
xmemcpy(bp, "\"", 1); bp += 1; \ | |
*bp = 0; \ | |
fputs((char* )buf, stderr); \ | |
for (i = 0; i < 20 - (bp - buf); i++) fputc(' ', stderr); \ | |
fprintf(stderr, "%4"PRIdPTR":%s %4"PRIdPTR":", \ | |
stk - stk_base - 1, \ | |
(stk > stk_base) ? stack_type_str(stk[-1].type) : " ", \ | |
(op == FinishCode) ? (ptrdiff_t )-1 : op - reg->p); \ | |
onig_print_compiled_byte_code(stderr, op, reg->p+reg->used, NULL, encode); \ | |
fprintf(stderr, "\n"); \ | |
} | |
#else | |
# define OPCODE_EXEC_HOOK ((void) 0) | |
#endif | |
VM_LOOP { | |
CASE(OP_END) MOP_IN(OP_END); | |
n = s - sstart; | |
if (n > best_len) { | |
OnigRegion* region; | |
#ifdef USE_FIND_LONGEST_SEARCH_ALL_OF_RANGE | |
if (IS_FIND_LONGEST(option)) { | |
if (n > msa->best_len) { | |
msa->best_len = n; | |
msa->best_s = (UChar* )sstart; | |
} | |
else | |
goto end_best_len; | |
} | |
#endif | |
best_len = n; | |
region = msa->region; | |
if (region) { | |
region->beg[0] = ((pkeep > s) ? s : pkeep) - str; | |
region->end[0] = s - str; | |
for (i = 1; i <= num_mem; i++) { | |
if (mem_end_stk[i] != INVALID_STACK_INDEX) { | |
if (BIT_STATUS_AT(reg->bt_mem_start, i)) | |
region->beg[i] = STACK_AT(mem_start_stk[i])->u.mem.pstr - str; | |
else | |
region->beg[i] = (UChar* )((void* )mem_start_stk[i]) - str; | |
region->end[i] = (BIT_STATUS_AT(reg->bt_mem_end, i) | |
? STACK_AT(mem_end_stk[i])->u.mem.pstr | |
: (UChar* )((void* )mem_end_stk[i])) - str; | |
} | |
else { | |
region->beg[i] = region->end[i] = ONIG_REGION_NOTPOS; | |
} | |
} | |
#ifdef USE_CAPTURE_HISTORY | |
if (reg->capture_history != 0) { | |
int r; | |
OnigCaptureTreeNode* node; | |
if (IS_NULL(region->history_root)) { | |
region->history_root = node = history_node_new(); | |
CHECK_NULL_RETURN_MEMERR(node); | |
} | |
else { | |
node = region->history_root; | |
history_tree_clear(node); | |
} | |
node->group = 0; | |
node->beg = ((pkeep > s) ? s : pkeep) - str; | |
node->end = s - str; | |
stkp = stk_base; | |
r = make_capture_history_tree(region->history_root, &stkp, | |
stk, (UChar* )str, reg); | |
if (r < 0) { | |
best_len = r; /* error code */ | |
goto finish; | |
} | |
} | |
#endif /* USE_CAPTURE_HISTORY */ | |
} /* if (region) */ | |
} /* n > best_len */ | |
#ifdef USE_FIND_LONGEST_SEARCH_ALL_OF_RANGE | |
end_best_len: | |
#endif | |
MOP_OUT; | |
if (IS_FIND_CONDITION(option)) { | |
if (IS_FIND_NOT_EMPTY(option) && s == sstart) { | |
best_len = ONIG_MISMATCH; | |
goto fail; /* for retry */ | |
} | |
if (IS_FIND_LONGEST(option) && DATA_ENSURE_CHECK1) { | |
goto fail; /* for retry */ | |
} | |
} | |
/* default behavior: return first-matching result. */ | |
goto finish; | |
NEXT; | |
CASE(OP_EXACT1) MOP_IN(OP_EXACT1); | |
DATA_ENSURE(1); | |
if (*p != *s) goto fail; | |
p++; s++; | |
MOP_OUT; | |
NEXT; | |
CASE(OP_EXACT1_IC) MOP_IN(OP_EXACT1_IC); | |
{ | |
int len; | |
UChar *q, lowbuf[ONIGENC_MBC_CASE_FOLD_MAXLEN]; | |
DATA_ENSURE(1); | |
len = ONIGENC_MBC_CASE_FOLD(encode, | |
/* DISABLE_CASE_FOLD_MULTI_CHAR(case_fold_flag), */ | |
case_fold_flag, | |
&s, end, lowbuf); | |
DATA_ENSURE(0); | |
q = lowbuf; | |
while (len-- > 0) { | |
if (*p != *q) { | |
goto fail; | |
} | |
p++; q++; | |
} | |
} | |
MOP_OUT; | |
NEXT; | |
CASE(OP_EXACT2) MOP_IN(OP_EXACT2); | |
DATA_ENSURE(2); | |
if (*p != *s) goto fail; | |
p++; s++; | |
if (*p != *s) goto fail; | |
sprev = s; | |
p++; s++; | |
MOP_OUT; | |
JUMP; | |
CASE(OP_EXACT3) MOP_IN(OP_EXACT3); | |
DATA_ENSURE(3); | |
if (*p != *s) goto fail; | |
p++; s++; | |
if (*p != *s) goto fail; | |
p++; s++; | |
if (*p != *s) goto fail; | |
sprev = s; | |
p++; s++; | |
MOP_OUT; | |
JUMP; | |
CASE(OP_EXACT4) MOP_IN(OP_EXACT4); | |
DATA_ENSURE(4); | |
if (*p != *s) goto fail; | |
p++; s++; | |
if (*p != *s) goto fail; | |
p++; s++; | |
if (*p != *s) goto fail; | |
p++; s++; | |
if (*p != *s) goto fail; | |
sprev = s; | |
p++; s++; | |
MOP_OUT; | |
JUMP; | |
CASE(OP_EXACT5) MOP_IN(OP_EXACT5); | |
DATA_ENSURE(5); | |
if (*p != *s) goto fail; | |
p++; s++; | |
if (*p != *s) goto fail; | |
p++; s++; | |
if (*p != *s) goto fail; | |
p++; s++; | |
if (*p != *s) goto fail; | |
p++; s++; | |
if (*p != *s) goto fail; | |
sprev = s; | |
p++; s++; | |
MOP_OUT; | |
JUMP; | |
CASE(OP_EXACTN) MOP_IN(OP_EXACTN); | |
GET_LENGTH_INC(tlen, p); | |
DATA_ENSURE(tlen); | |
while (tlen-- > 0) { | |
if (*p++ != *s++) goto fail; | |
} | |
sprev = s - 1; | |
MOP_OUT; | |
JUMP; | |
CASE(OP_EXACTN_IC) MOP_IN(OP_EXACTN_IC); | |
{ | |
int len; | |
UChar *q, *endp, lowbuf[ONIGENC_MBC_CASE_FOLD_MAXLEN]; | |
GET_LENGTH_INC(tlen, p); | |
endp = p + tlen; | |
while (p < endp) { | |
sprev = s; | |
DATA_ENSURE(1); | |
len = ONIGENC_MBC_CASE_FOLD(encode, | |
/* DISABLE_CASE_FOLD_MULTI_CHAR(case_fold_flag), */ | |
case_fold_flag, | |
&s, end, lowbuf); | |
DATA_ENSURE(0); | |
q = lowbuf; | |
while (len-- > 0) { | |
if (*p != *q) goto fail; | |
p++; q++; | |
} | |
} | |
} | |
MOP_OUT; | |
JUMP; | |
CASE(OP_EXACTMB2N1) MOP_IN(OP_EXACTMB2N1); | |
DATA_ENSURE(2); | |
if (*p != *s) goto fail; | |
p++; s++; | |
if (*p != *s) goto fail; | |
p++; s++; | |
MOP_OUT; | |
NEXT; | |
CASE(OP_EXACTMB2N2) MOP_IN(OP_EXACTMB2N2); | |
DATA_ENSURE(4); | |
if (*p != *s) goto fail; | |
p++; s++; | |
if (*p != *s) goto fail; | |
p++; s++; | |
sprev = s; | |
if (*p != *s) goto fail; | |
p++; s++; | |
if (*p != *s) goto fail; | |
p++; s++; | |
MOP_OUT; | |
JUMP; | |
CASE(OP_EXACTMB2N3) MOP_IN(OP_EXACTMB2N3); | |
DATA_ENSURE(6); | |
if (*p != *s) goto fail; | |
p++; s++; | |
if (*p != *s) goto fail; | |
p++; s++; | |
if (*p != *s) goto fail; | |
p++; s++; | |
if (*p != *s) goto fail; | |
p++; s++; | |
sprev = s; | |
if (*p != *s) goto fail; | |
p++; s++; | |
if (*p != *s) goto fail; | |
p++; s++; | |
MOP_OUT; | |
JUMP; | |
CASE(OP_EXACTMB2N) MOP_IN(OP_EXACTMB2N); | |
GET_LENGTH_INC(tlen, p); | |
DATA_ENSURE(tlen * 2); | |
while (tlen-- > 0) { | |
if (*p != *s) goto fail; | |
p++; s++; | |
if (*p != *s) goto fail; | |
p++; s++; | |
} | |
sprev = s - 2; | |
MOP_OUT; | |
JUMP; | |
CASE(OP_EXACTMB3N) MOP_IN(OP_EXACTMB3N); | |
GET_LENGTH_INC(tlen, p); | |
DATA_ENSURE(tlen * 3); | |
while (tlen-- > 0) { | |
if (*p != *s) goto fail; | |
p++; s++; | |
if (*p != *s) goto fail; | |
p++; s++; | |
if (*p != *s) goto fail; | |
p++; s++; | |
} | |
sprev = s - 3; | |
MOP_OUT; | |
JUMP; | |
CASE(OP_EXACTMBN) MOP_IN(OP_EXACTMBN); | |
GET_LENGTH_INC(tlen, p); /* mb-len */ | |
GET_LENGTH_INC(tlen2, p); /* string len */ | |
tlen2 *= tlen; | |
DATA_ENSURE(tlen2); | |
while (tlen2-- > 0) { | |
if (*p != *s) goto fail; | |
p++; s++; | |
} | |
sprev = s - tlen; | |
MOP_OUT; | |
JUMP; | |
CASE(OP_CCLASS) MOP_IN(OP_CCLASS); | |
DATA_ENSURE(1); | |
if (BITSET_AT(((BitSetRef )p), *s) == 0) goto fail; | |
p += SIZE_BITSET; | |
s += enclen(encode, s, end); /* OP_CCLASS can match mb-code. \D, \S */ | |
MOP_OUT; | |
NEXT; | |
CASE(OP_CCLASS_MB) MOP_IN(OP_CCLASS_MB); | |
if (! ONIGENC_IS_MBC_HEAD(encode, s, end)) goto fail; | |
cclass_mb: | |
GET_LENGTH_INC(tlen, p); | |
{ | |
OnigCodePoint code; | |
UChar *ss; | |
int mb_len; | |
DATA_ENSURE(1); | |
mb_len = enclen(encode, s, end); | |
DATA_ENSURE(mb_len); | |
ss = s; | |
s += mb_len; | |
code = ONIGENC_MBC_TO_CODE(encode, ss, s); | |
#ifdef PLATFORM_UNALIGNED_WORD_ACCESS | |
if (! onig_is_in_code_range(p, code)) goto fail; | |
#else | |
q = p; | |
ALIGNMENT_RIGHT(q); | |
if (! onig_is_in_code_range(q, code)) goto fail; | |
#endif | |
} | |
p += tlen; | |
MOP_OUT; | |
NEXT; | |
CASE(OP_CCLASS_MIX) MOP_IN(OP_CCLASS_MIX); | |
DATA_ENSURE(1); | |
if (ONIGENC_IS_MBC_HEAD(encode, s, end)) { | |
p += SIZE_BITSET; | |
goto cclass_mb; | |
} | |
else { | |
if (BITSET_AT(((BitSetRef )p), *s) == 0) | |
goto fail; | |
p += SIZE_BITSET; | |
GET_LENGTH_INC(tlen, p); | |
p += tlen; | |
s++; | |
} | |
MOP_OUT; | |
NEXT; | |
CASE(OP_CCLASS_NOT) MOP_IN(OP_CCLASS_NOT); | |
DATA_ENSURE(1); | |
if (BITSET_AT(((BitSetRef )p), *s) != 0) goto fail; | |
p += SIZE_BITSET; | |
s += enclen(encode, s, end); | |
MOP_OUT; | |
NEXT; | |
CASE(OP_CCLASS_MB_NOT) MOP_IN(OP_CCLASS_MB_NOT); | |
DATA_ENSURE(1); | |
if (! ONIGENC_IS_MBC_HEAD(encode, s, end)) { | |
s++; | |
GET_LENGTH_INC(tlen, p); | |
p += tlen; | |
goto cc_mb_not_success; | |
} | |
cclass_mb_not: | |
GET_LENGTH_INC(tlen, p); | |
{ | |
OnigCodePoint code; | |
UChar *ss; | |
int mb_len = enclen(encode, s, end); | |
if (! DATA_ENSURE_CHECK(mb_len)) { | |
DATA_ENSURE(1); | |
s = (UChar* )end; | |
p += tlen; | |
goto cc_mb_not_success; | |
} | |
ss = s; | |
s += mb_len; | |
code = ONIGENC_MBC_TO_CODE(encode, ss, s); | |
#ifdef PLATFORM_UNALIGNED_WORD_ACCESS | |
if (onig_is_in_code_range(p, code)) goto fail; | |
#else | |
q = p; | |
ALIGNMENT_RIGHT(q); | |
if (onig_is_in_code_range(q, code)) goto fail; | |
#endif | |
} | |
p += tlen; | |
cc_mb_not_success: | |
MOP_OUT; | |
NEXT; | |
CASE(OP_CCLASS_MIX_NOT) MOP_IN(OP_CCLASS_MIX_NOT); | |
DATA_ENSURE(1); | |
if (ONIGENC_IS_MBC_HEAD(encode, s, end)) { | |
p += SIZE_BITSET; | |
goto cclass_mb_not; | |
} | |
else { | |
if (BITSET_AT(((BitSetRef )p), *s) != 0) | |
goto fail; | |
p += SIZE_BITSET; | |
GET_LENGTH_INC(tlen, p); | |
p += tlen; | |
s++; | |
} | |
MOP_OUT; | |
NEXT; | |
CASE(OP_ANYCHAR) MOP_IN(OP_ANYCHAR); | |
DATA_ENSURE(1); | |
n = enclen(encode, s, end); | |
DATA_ENSURE(n); | |
if (ONIGENC_IS_MBC_NEWLINE_EX(encode, s, str, end, option, 0)) goto fail; | |
s += n; | |
MOP_OUT; | |
NEXT; | |
CASE(OP_ANYCHAR_ML) MOP_IN(OP_ANYCHAR_ML); | |
DATA_ENSURE(1); | |
n = enclen(encode, s, end); | |
DATA_ENSURE(n); | |
s += n; | |
MOP_OUT; | |
NEXT; | |
CASE(OP_ANYCHAR_STAR) MOP_IN(OP_ANYCHAR_STAR); | |
while (DATA_ENSURE_CHECK1) { | |
STACK_PUSH_ALT(p, s, sprev, pkeep); | |
n = enclen(encode, s, end); | |
DATA_ENSURE(n); | |
if (ONIGENC_IS_MBC_NEWLINE_EX(encode, s, str, end, option, 0)) goto fail; | |
sprev = s; | |
s += n; | |
} | |
MOP_OUT; | |
JUMP; | |
CASE(OP_ANYCHAR_ML_STAR) MOP_IN(OP_ANYCHAR_ML_STAR); | |
while (DATA_ENSURE_CHECK1) { | |
STACK_PUSH_ALT(p, s, sprev, pkeep); | |
n = enclen(encode, s, end); | |
if (n > 1) { | |
DATA_ENSURE(n); | |
sprev = s; | |
s += n; | |
} | |
else { | |
sprev = s; | |
s++; | |
} | |
} | |
MOP_OUT; | |
JUMP; | |
CASE(OP_ANYCHAR_STAR_PEEK_NEXT) MOP_IN(OP_ANYCHAR_STAR_PEEK_NEXT); | |
while (DATA_ENSURE_CHECK1) { | |
if (*p == *s) { | |
STACK_PUSH_ALT(p + 1, s, sprev, pkeep); | |
} | |
n = enclen(encode, s, end); | |
DATA_ENSURE(n); | |
if (ONIGENC_IS_MBC_NEWLINE_EX(encode, s, str, end, option, 0)) goto fail; | |
sprev = s; | |
s += n; | |
} | |
p++; | |
MOP_OUT; | |
NEXT; | |
CASE(OP_ANYCHAR_ML_STAR_PEEK_NEXT)MOP_IN(OP_ANYCHAR_ML_STAR_PEEK_NEXT); | |
while (DATA_ENSURE_CHECK1) { | |
if (*p == *s) { | |
STACK_PUSH_ALT(p + 1, s, sprev, pkeep); | |
} | |
n = enclen(encode, s, end); | |
if (n > 1) { | |
DATA_ENSURE(n); | |
sprev = s; | |
s += n; | |
} | |
else { | |
sprev = s; | |
s++; | |
} | |
} | |
p++; | |
MOP_OUT; | |
NEXT; | |
#ifdef USE_COMBINATION_EXPLOSION_CHECK | |
CASE(OP_STATE_CHECK_ANYCHAR_STAR) MOP_IN(OP_STATE_CHECK_ANYCHAR_STAR); | |
GET_STATE_CHECK_NUM_INC(mem, p); | |
while (DATA_ENSURE_CHECK1) { | |
STATE_CHECK_VAL(scv, mem); | |
if (scv) goto fail; | |
STACK_PUSH_ALT_WITH_STATE_CHECK(p, s, sprev, mem, pkeep); | |
n = enclen(encode, s, end); | |
DATA_ENSURE(n); | |
if (ONIGENC_IS_MBC_NEWLINE_EX(encode, s, str, end, option, 0)) goto fail; | |
sprev = s; | |
s += n; | |
} | |
MOP_OUT; | |
NEXT; | |
CASE(OP_STATE_CHECK_ANYCHAR_ML_STAR) | |
MOP_IN(OP_STATE_CHECK_ANYCHAR_ML_STAR); | |
GET_STATE_CHECK_NUM_INC(mem, p); | |
while (DATA_ENSURE_CHECK1) { | |
STATE_CHECK_VAL(scv, mem); | |
if (scv) goto fail; | |
STACK_PUSH_ALT_WITH_STATE_CHECK(p, s, sprev, mem, pkeep); | |
n = enclen(encode, s, end); | |
if (n > 1) { | |
DATA_ENSURE(n); | |
sprev = s; | |
s += n; | |
} | |
else { | |
sprev = s; | |
s++; | |
} | |
} | |
MOP_OUT; | |
NEXT; | |
#endif /* USE_COMBINATION_EXPLOSION_CHECK */ | |
CASE(OP_WORD) MOP_IN(OP_WORD); | |
DATA_ENSURE(1); | |
if (! ONIGENC_IS_MBC_WORD(encode, s, end)) | |
goto fail; | |
s += enclen(encode, s, end); | |
MOP_OUT; | |
NEXT; | |
CASE(OP_ASCII_WORD) MOP_IN(OP_ASCII_WORD); | |
DATA_ENSURE(1); | |
if (! ONIGENC_IS_MBC_ASCII_WORD(encode, s, end)) | |
goto fail; | |
s += enclen(encode, s, end); | |
MOP_OUT; | |
NEXT; | |
CASE(OP_NOT_WORD) MOP_IN(OP_NOT_WORD); | |
DATA_ENSURE(1); | |
if (ONIGENC_IS_MBC_WORD(encode, s, end)) | |
goto fail; | |
s += enclen(encode, s, end); | |
MOP_OUT; | |
NEXT; | |
CASE(OP_NOT_ASCII_WORD) MOP_IN(OP_NOT_ASCII_WORD); | |
DATA_ENSURE(1); | |
if (ONIGENC_IS_MBC_ASCII_WORD(encode, s, end)) | |
goto fail; | |
s += enclen(encode, s, end); | |
MOP_OUT; | |
NEXT; | |
CASE(OP_WORD_BOUND) MOP_IN(OP_WORD_BOUND); | |
if (ON_STR_BEGIN(s)) { | |
DATA_ENSURE(1); | |
if (! ONIGENC_IS_MBC_WORD(encode, s, end)) | |
goto fail; | |
} | |
else if (ON_STR_END(s)) { | |
if (! ONIGENC_IS_MBC_WORD(encode, sprev, end)) | |
goto fail; | |
} | |
else { | |
if (ONIGENC_IS_MBC_WORD(encode, s, end) | |
== ONIGENC_IS_MBC_WORD(encode, sprev, end)) | |
goto fail; | |
} | |
MOP_OUT; | |
JUMP; | |
CASE(OP_ASCII_WORD_BOUND) MOP_IN(OP_ASCII_WORD_BOUND); | |
if (ON_STR_BEGIN(s)) { | |
DATA_ENSURE(1); | |
if (! ONIGENC_IS_MBC_ASCII_WORD(encode, s, end)) | |
goto fail; | |
} | |
else if (ON_STR_END(s)) { | |
if (! ONIGENC_IS_MBC_ASCII_WORD(encode, sprev, end)) | |
goto fail; | |
} | |
else { | |
if (ONIGENC_IS_MBC_ASCII_WORD(encode, s, end) | |
== ONIGENC_IS_MBC_ASCII_WORD(encode, sprev, end)) | |
goto fail; | |
} | |
MOP_OUT; | |
JUMP; | |
CASE(OP_NOT_WORD_BOUND) MOP_IN(OP_NOT_WORD_BOUND); | |
if (ON_STR_BEGIN(s)) { | |
if (DATA_ENSURE_CHECK1 && ONIGENC_IS_MBC_WORD(encode, s, end)) | |
goto fail; | |
} | |
else if (ON_STR_END(s)) { | |
if (ONIGENC_IS_MBC_WORD(encode, sprev, end)) | |
goto fail; | |
} | |
else { | |
if (ONIGENC_IS_MBC_WORD(encode, s, end) | |
!= ONIGENC_IS_MBC_WORD(encode, sprev, end)) | |
goto fail; | |
} | |
MOP_OUT; | |
JUMP; | |
CASE(OP_NOT_ASCII_WORD_BOUND) MOP_IN(OP_NOT_ASCII_WORD_BOUND); | |
if (ON_STR_BEGIN(s)) { | |
if (DATA_ENSURE_CHECK1 && ONIGENC_IS_MBC_ASCII_WORD(encode, s, end)) | |
goto fail; | |
} | |
else if (ON_STR_END(s)) { | |
if (ONIGENC_IS_MBC_ASCII_WORD(encode, sprev, end)) | |
goto fail; | |
} | |
else { | |
if (ONIGENC_IS_MBC_ASCII_WORD(encode, s, end) | |
!= ONIGENC_IS_MBC_ASCII_WORD(encode, sprev, end)) | |
goto fail; | |
} | |
MOP_OUT; | |
JUMP; | |
#ifdef USE_WORD_BEGIN_END | |
CASE(OP_WORD_BEGIN) MOP_IN(OP_WORD_BEGIN); | |
if (DATA_ENSURE_CHECK1 && ONIGENC_IS_MBC_WORD(encode, s, end)) { | |
if (ON_STR_BEGIN(s) || !ONIGENC_IS_MBC_WORD(encode, sprev, end)) { | |
MOP_OUT; | |
JUMP; | |
} | |
} | |
goto fail; | |
NEXT; | |
CASE(OP_ASCII_WORD_BEGIN) MOP_IN(OP_ASCII_WORD_BEGIN); | |
if (DATA_ENSURE_CHECK1 && ONIGENC_IS_MBC_ASCII_WORD(encode, s, end)) { | |
if (ON_STR_BEGIN(s) || !ONIGENC_IS_MBC_ASCII_WORD(encode, sprev, end)) { | |
MOP_OUT; | |
JUMP; | |
} | |
} | |
goto fail; | |
NEXT; | |
CASE(OP_WORD_END) MOP_IN(OP_WORD_END); | |
if (!ON_STR_BEGIN(s) && ONIGENC_IS_MBC_WORD(encode, sprev, end)) { | |
if (ON_STR_END(s) || !ONIGENC_IS_MBC_WORD(encode, s, end)) { | |
MOP_OUT; | |
JUMP; | |
} | |
} | |
goto fail; | |
NEXT; | |
CASE(OP_ASCII_WORD_END) MOP_IN(OP_ASCII_WORD_END); | |
if (!ON_STR_BEGIN(s) && ONIGENC_IS_MBC_ASCII_WORD(encode, sprev, end)) { | |
if (ON_STR_END(s) || !ONIGENC_IS_MBC_ASCII_WORD(encode, s, end)) { | |
MOP_OUT; | |
JUMP; | |
} | |
} | |
goto fail; | |
NEXT; | |
#endif | |
CASE(OP_BEGIN_BUF) MOP_IN(OP_BEGIN_BUF); | |
if (! ON_STR_BEGIN(s)) goto fail; | |
if (IS_NOTBOS(msa->options)) goto fail; | |
MOP_OUT; | |
JUMP; | |
CASE(OP_END_BUF) MOP_IN(OP_END_BUF); | |
if (! ON_STR_END(s)) goto fail; | |
if (IS_NOTEOS(msa->options)) goto fail; | |
MOP_OUT; | |
JUMP; | |
CASE(OP_BEGIN_LINE) MOP_IN(OP_BEGIN_LINE); | |
if (ON_STR_BEGIN(s)) { | |
if (IS_NOTBOL(msa->options)) goto fail; | |
MOP_OUT; | |
JUMP; | |
} | |
else if (ONIGENC_IS_MBC_NEWLINE(encode, sprev, end) | |
#ifdef USE_CRNL_AS_LINE_TERMINATOR | |
&& !(IS_NEWLINE_CRLF(option) | |
&& ONIGENC_IS_MBC_CRNL(encode, sprev, end)) | |
#endif | |
&& !ON_STR_END(s)) { | |
MOP_OUT; | |
JUMP; | |
} | |
goto fail; | |
NEXT; | |
CASE(OP_END_LINE) MOP_IN(OP_END_LINE); | |
if (ON_STR_END(s)) { | |
#ifndef USE_NEWLINE_AT_END_OF_STRING_HAS_EMPTY_LINE | |
if (IS_EMPTY_STR || !ONIGENC_IS_MBC_NEWLINE_EX(encode, sprev, str, end, option, 1)) { | |
#endif | |
if (IS_NOTEOL(msa->options)) goto fail; | |
MOP_OUT; | |
JUMP; | |
#ifndef USE_NEWLINE_AT_END_OF_STRING_HAS_EMPTY_LINE | |
} | |
#endif | |
} | |
else if (ONIGENC_IS_MBC_NEWLINE_EX(encode, s, str, end, option, 1)) { | |
MOP_OUT; | |
JUMP; | |
} | |
goto fail; | |
NEXT; | |
CASE(OP_SEMI_END_BUF) MOP_IN(OP_SEMI_END_BUF); | |
if (ON_STR_END(s)) { | |
#ifndef USE_NEWLINE_AT_END_OF_STRING_HAS_EMPTY_LINE | |
if (IS_EMPTY_STR || !ONIGENC_IS_MBC_NEWLINE_EX(encode, sprev, str, end, option, 1)) { | |
#endif | |
if (IS_NOTEOL(msa->options)) goto fail; | |
MOP_OUT; | |
JUMP; | |
#ifndef USE_NEWLINE_AT_END_OF_STRING_HAS_EMPTY_LINE | |
} | |
#endif | |
} | |
else if (ONIGENC_IS_MBC_NEWLINE_EX(encode, s, str, end, option, 1)) { | |
UChar* ss = s + enclen(encode, s, end); | |
if (ON_STR_END(ss)) { | |
MOP_OUT; | |
JUMP; | |
} | |
#ifdef USE_CRNL_AS_LINE_TERMINATOR | |
else if (IS_NEWLINE_CRLF(option) | |
&& ONIGENC_IS_MBC_CRNL(encode, s, end)) { | |
ss += enclen(encode, ss, end); | |
if (ON_STR_END(ss)) { | |
MOP_OUT; | |
JUMP; | |
} | |
} | |
#endif | |
} | |
goto fail; | |
NEXT; | |
CASE(OP_BEGIN_POSITION) MOP_IN(OP_BEGIN_POSITION); | |
if (s != msa->gpos) | |
goto fail; | |
MOP_OUT; | |
JUMP; | |
CASE(OP_MEMORY_START_PUSH) MOP_IN(OP_MEMORY_START_PUSH); | |
GET_MEMNUM_INC(mem, p); | |
STACK_PUSH_MEM_START(mem, s); | |
MOP_OUT; | |
JUMP; | |
CASE(OP_MEMORY_START) MOP_IN(OP_MEMORY_START); | |
GET_MEMNUM_INC(mem, p); | |
mem_start_stk[mem] = (OnigStackIndex )((void* )s); | |
mem_end_stk[mem] = INVALID_STACK_INDEX; | |
MOP_OUT; | |
JUMP; | |
CASE(OP_MEMORY_END_PUSH) MOP_IN(OP_MEMORY_END_PUSH); | |
GET_MEMNUM_INC(mem, p); | |
STACK_PUSH_MEM_END(mem, s); | |
MOP_OUT; | |
JUMP; | |
CASE(OP_MEMORY_END) MOP_IN(OP_MEMORY_END); | |
GET_MEMNUM_INC(mem, p); | |
mem_end_stk[mem] = (OnigStackIndex )((void* )s); | |
MOP_OUT; | |
JUMP; | |
CASE(OP_KEEP) MOP_IN(OP_KEEP); | |
pkeep = s; | |
MOP_OUT; | |
JUMP; | |
#ifdef USE_SUBEXP_CALL | |
CASE(OP_MEMORY_END_PUSH_REC) MOP_IN(OP_MEMORY_END_PUSH_REC); | |
GET_MEMNUM_INC(mem, p); | |
STACK_GET_MEM_START(mem, stkp); /* should be before push mem-end. */ | |
STACK_PUSH_MEM_END(mem, s); | |
mem_start_stk[mem] = GET_STACK_INDEX(stkp); | |
MOP_OUT; | |
JUMP; | |
CASE(OP_MEMORY_END_REC) MOP_IN(OP_MEMORY_END_REC); | |
GET_MEMNUM_INC(mem, p); | |
mem_end_stk[mem] = (OnigStackIndex )((void* )s); | |
STACK_GET_MEM_START(mem, stkp); | |
if (BIT_STATUS_AT(reg->bt_mem_start, mem)) | |
mem_start_stk[mem] = GET_STACK_INDEX(stkp); | |
else | |
mem_start_stk[mem] = (OnigStackIndex )((void* )stkp->u.mem.pstr); | |
STACK_PUSH_MEM_END_MARK(mem); | |
MOP_OUT; | |
JUMP; | |
#endif | |
CASE(OP_BACKREF1) MOP_IN(OP_BACKREF1); | |
mem = 1; | |
goto backref; | |
NEXT; | |
CASE(OP_BACKREF2) MOP_IN(OP_BACKREF2); | |
mem = 2; | |
goto backref; | |
NEXT; | |
CASE(OP_BACKREFN) MOP_IN(OP_BACKREFN); | |
GET_MEMNUM_INC(mem, p); | |
backref: | |
{ | |
int len; | |
UChar *pstart, *pend; | |
/* if you want to remove following line, | |
you should check in parse and compile time. */ | |
if (mem > num_mem) goto fail; | |
if (mem_end_stk[mem] == INVALID_STACK_INDEX) goto fail; | |
if (mem_start_stk[mem] == INVALID_STACK_INDEX) goto fail; | |
if (BIT_STATUS_AT(reg->bt_mem_start, mem)) | |
pstart = STACK_AT(mem_start_stk[mem])->u.mem.pstr; | |
else | |
pstart = (UChar* )((void* )mem_start_stk[mem]); | |
pend = (BIT_STATUS_AT(reg->bt_mem_end, mem) | |
? STACK_AT(mem_end_stk[mem])->u.mem.pstr | |
: (UChar* )((void* )mem_end_stk[mem])); | |
n = pend - pstart; | |
DATA_ENSURE(n); | |
sprev = s; | |
STRING_CMP(pstart, s, n); | |
while (sprev + (len = enclen(encode, sprev, end)) < s) | |
sprev += len; | |
MOP_OUT; | |
JUMP; | |
} | |
CASE(OP_BACKREFN_IC) MOP_IN(OP_BACKREFN_IC); | |
GET_MEMNUM_INC(mem, p); | |
{ | |
int len; | |
UChar *pstart, *pend; | |
/* if you want to remove following line, | |
you should check in parse and compile time. */ | |
if (mem > num_mem) goto fail; | |
if (mem_end_stk[mem] == INVALID_STACK_INDEX) goto fail; | |
if (mem_start_stk[mem] == INVALID_STACK_INDEX) goto fail; | |
if (BIT_STATUS_AT(reg->bt_mem_start, mem)) | |
pstart = STACK_AT(mem_start_stk[mem])->u.mem.pstr; | |
else | |
pstart = (UChar* )((void* )mem_start_stk[mem]); | |
pend = (BIT_STATUS_AT(reg->bt_mem_end, mem) | |
? STACK_AT(mem_end_stk[mem])->u.mem.pstr | |
: (UChar* )((void* )mem_end_stk[mem])); | |
n = pend - pstart; | |
DATA_ENSURE(n); | |
sprev = s; | |
STRING_CMP_IC(case_fold_flag, pstart, &s, (int)n, end); | |
while (sprev + (len = enclen(encode, sprev, end)) < s) | |
sprev += len; | |
MOP_OUT; | |
JUMP; | |
} | |
NEXT; | |
CASE(OP_BACKREF_MULTI) MOP_IN(OP_BACKREF_MULTI); | |
{ | |
int len, is_fail; | |
UChar *pstart, *pend, *swork; | |
GET_LENGTH_INC(tlen, p); | |
for (i = 0; i < tlen; i++) { | |
GET_MEMNUM_INC(mem, p); | |
if (mem_end_stk[mem] == INVALID_STACK_INDEX) continue; | |
if (mem_start_stk[mem] == INVALID_STACK_INDEX) continue; | |
if (BIT_STATUS_AT(reg->bt_mem_start, mem)) | |
pstart = STACK_AT(mem_start_stk[mem])->u.mem.pstr; | |
else | |
pstart = (UChar* )((void* )mem_start_stk[mem]); | |
pend = (BIT_STATUS_AT(reg->bt_mem_end, mem) | |
? STACK_AT(mem_end_stk[mem])->u.mem.pstr | |
: (UChar* )((void* )mem_end_stk[mem])); | |
n = pend - pstart; | |
DATA_ENSURE(n); | |
sprev = s; | |
swork = s; | |
STRING_CMP_VALUE(pstart, swork, n, is_fail); | |
if (is_fail) continue; | |
s = swork; | |
while (sprev + (len = enclen(encode, sprev, end)) < s) | |
sprev += len; | |
p += (SIZE_MEMNUM * (tlen - i - 1)); | |
break; /* success */ | |
} | |
if (i == tlen) goto fail; | |
MOP_OUT; | |
JUMP; | |
} | |
NEXT; | |
CASE(OP_BACKREF_MULTI_IC) MOP_IN(OP_BACKREF_MULTI_IC); | |
{ | |
int len, is_fail; | |
UChar *pstart, *pend, *swork; | |
GET_LENGTH_INC(tlen, p); | |
for (i = 0; i < tlen; i++) { | |
GET_MEMNUM_INC(mem, p); | |
if (mem_end_stk[mem] == INVALID_STACK_INDEX) continue; | |
if (mem_start_stk[mem] == INVALID_STACK_INDEX) continue; | |
if (BIT_STATUS_AT(reg->bt_mem_start, mem)) | |
pstart = STACK_AT(mem_start_stk[mem])->u.mem.pstr; | |
else | |
pstart = (UChar* )((void* )mem_start_stk[mem]); | |
pend = (BIT_STATUS_AT(reg->bt_mem_end, mem) | |
? STACK_AT(mem_end_stk[mem])->u.mem.pstr | |
: (UChar* )((void* )mem_end_stk[mem])); | |
n = pend - pstart; | |
DATA_ENSURE(n); | |
sprev = s; | |
swork = s; | |
STRING_CMP_VALUE_IC(case_fold_flag, pstart, &swork, n, end, is_fail); | |
if (is_fail) continue; | |
s = swork; | |
while (sprev + (len = enclen(encode, sprev, end)) < s) | |
sprev += len; | |
p += (SIZE_MEMNUM * (tlen - i - 1)); | |
break; /* success */ | |
} | |
if (i == tlen) goto fail; | |
MOP_OUT; | |
JUMP; | |
} | |
#ifdef USE_BACKREF_WITH_LEVEL | |
CASE(OP_BACKREF_WITH_LEVEL) | |
{ | |
int len; | |
OnigOptionType ic; | |
LengthType level; | |
GET_OPTION_INC(ic, p); | |
GET_LENGTH_INC(level, p); | |
GET_LENGTH_INC(tlen, p); | |
sprev = s; | |
if (backref_match_at_nested_level(reg, stk, stk_base, ic, | |
case_fold_flag, (int )level, (int )tlen, p, &s, end)) { | |
while (sprev + (len = enclen(encode, sprev, end)) < s) | |
sprev += len; | |
p += (SIZE_MEMNUM * tlen); | |
} | |
else | |
goto fail; | |
MOP_OUT; | |
JUMP; | |
} | |
#endif | |
#if 0 /* no need: IS_DYNAMIC_OPTION() == 0 */ | |
CASE(OP_SET_OPTION_PUSH) MOP_IN(OP_SET_OPTION_PUSH); | |
GET_OPTION_INC(option, p); | |
STACK_PUSH_ALT(p, s, sprev, pkeep); | |
p += SIZE_OP_SET_OPTION + SIZE_OP_FAIL; | |
MOP_OUT; | |
JUMP; | |
CASE(OP_SET_OPTION) MOP_IN(OP_SET_OPTION); | |
GET_OPTION_INC(option, p); | |
MOP_OUT; | |
JUMP; | |
#endif | |
CASE(OP_NULL_CHECK_START) MOP_IN(OP_NULL_CHECK_START); | |
GET_MEMNUM_INC(mem, p); /* mem: null check id */ | |
STACK_PUSH_NULL_CHECK_START(mem, s); | |
MOP_OUT; | |
JUMP; | |
CASE(OP_NULL_CHECK_END) MOP_IN(OP_NULL_CHECK_END); | |
{ | |
int isnull; | |
GET_MEMNUM_INC(mem, p); /* mem: null check id */ | |
STACK_NULL_CHECK(isnull, mem, s); | |
if (isnull) { | |
#ifdef ONIG_DEBUG_MATCH | |
fprintf(stderr, "NULL_CHECK_END: skip id:%d, s:%"PRIuPTR" (%p)\n", | |
(int )mem, (uintptr_t )s, s); | |
#endif | |
null_check_found: | |
/* empty loop founded, skip next instruction */ | |
switch (*p++) { | |
case OP_JUMP: | |
case OP_PUSH: | |
p += SIZE_RELADDR; | |
break; | |
case OP_REPEAT_INC: | |
case OP_REPEAT_INC_NG: | |
case OP_REPEAT_INC_SG: | |
case OP_REPEAT_INC_NG_SG: | |
p += SIZE_MEMNUM; | |
break; | |
default: | |
goto unexpected_bytecode_error; | |
break; | |
} | |
} | |
} | |
MOP_OUT; | |
JUMP; | |
#ifdef USE_MONOMANIAC_CHECK_CAPTURES_IN_ENDLESS_REPEAT | |
CASE(OP_NULL_CHECK_END_MEMST) MOP_IN(OP_NULL_CHECK_END_MEMST); | |
{ | |
int isnull; | |
GET_MEMNUM_INC(mem, p); /* mem: null check id */ | |
STACK_NULL_CHECK_MEMST(isnull, mem, s, reg); | |
if (isnull) { | |
# ifdef ONIG_DEBUG_MATCH | |
fprintf(stderr, "NULL_CHECK_END_MEMST: skip id:%d, s:%"PRIuPTR" (%p)\n", | |
(int )mem, (uintptr_t )s, s); | |
# endif | |
if (isnull == -1) goto fail; | |
goto null_check_found; | |
} | |
} | |
MOP_OUT; | |
JUMP; | |
#endif | |
#ifdef USE_SUBEXP_CALL | |
CASE(OP_NULL_CHECK_END_MEMST_PUSH) | |
MOP_IN(OP_NULL_CHECK_END_MEMST_PUSH); | |
{ | |
int isnull; | |
GET_MEMNUM_INC(mem, p); /* mem: null check id */ | |
# ifdef USE_MONOMANIAC_CHECK_CAPTURES_IN_ENDLESS_REPEAT | |
STACK_NULL_CHECK_MEMST_REC(isnull, mem, s, reg); | |
# else | |
STACK_NULL_CHECK_REC(isnull, mem, s); | |
# endif | |
if (isnull) { | |
# ifdef ONIG_DEBUG_MATCH | |
fprintf(stderr, "NULL_CHECK_END_MEMST_PUSH: skip id:%d, s:%"PRIuPTR" (%p)\n", | |
(int )mem, (uintptr_t )s, s); | |
# endif | |
if (isnull == -1) goto fail; | |
goto null_check_found; | |
} | |
else { | |
STACK_PUSH_NULL_CHECK_END(mem); | |
} | |
} | |
MOP_OUT; | |
JUMP; | |
#endif | |
CASE(OP_JUMP) MOP_IN(OP_JUMP); | |
GET_RELADDR_INC(addr, p); | |
p += addr; | |
MOP_OUT; | |
CHECK_INTERRUPT_IN_MATCH_AT; | |
JUMP; | |
CASE(OP_PUSH) MOP_IN(OP_PUSH); | |
GET_RELADDR_INC(addr, p); | |
STACK_PUSH_ALT(p + addr, s, sprev, pkeep); | |
MOP_OUT; | |
JUMP; | |
#ifdef USE_COMBINATION_EXPLOSION_CHECK | |
CASE(OP_STATE_CHECK_PUSH) MOP_IN(OP_STATE_CHECK_PUSH); | |
GET_STATE_CHECK_NUM_INC(mem, p); | |
STATE_CHECK_VAL(scv, mem); | |
if (scv) goto fail; | |
GET_RELADDR_INC(addr, p); | |
STACK_PUSH_ALT_WITH_STATE_CHECK(p + addr, s, sprev, mem, pkeep); | |
MOP_OUT; | |
JUMP; | |
CASE(OP_STATE_CHECK_PUSH_OR_JUMP) MOP_IN(OP_STATE_CHECK_PUSH_OR_JUMP); | |
GET_STATE_CHECK_NUM_INC(mem, p); | |
GET_RELADDR_INC(addr, p); | |
STATE_CHECK_VAL(scv, mem); | |
if (scv) { | |
p += addr; | |
} | |
else { | |
STACK_PUSH_ALT_WITH_STATE_CHECK(p + addr, s, sprev, mem, pkeep); | |
} | |
MOP_OUT; | |
JUMP; | |
CASE(OP_STATE_CHECK) MOP_IN(OP_STATE_CHECK); | |
GET_STATE_CHECK_NUM_INC(mem, p); | |
STATE_CHECK_VAL(scv, mem); | |
if (scv) goto fail; | |
STACK_PUSH_STATE_CHECK(s, mem); | |
MOP_OUT; | |
JUMP; | |
#endif /* USE_COMBINATION_EXPLOSION_CHECK */ | |
CASE(OP_POP) MOP_IN(OP_POP); | |
STACK_POP_ONE; | |
MOP_OUT; | |
JUMP; | |
#ifdef USE_OP_PUSH_OR_JUMP_EXACT | |
CASE(OP_PUSH_OR_JUMP_EXACT1) MOP_IN(OP_PUSH_OR_JUMP_EXACT1); | |
GET_RELADDR_INC(addr, p); | |
if (*p == *s && DATA_ENSURE_CHECK1) { | |
p++; | |
STACK_PUSH_ALT(p + addr, s, sprev, pkeep); | |
MOP_OUT; | |
JUMP; | |
} | |
p += (addr + 1); | |
MOP_OUT; | |
JUMP; | |
#endif | |
CASE(OP_PUSH_IF_PEEK_NEXT) MOP_IN(OP_PUSH_IF_PEEK_NEXT); | |
GET_RELADDR_INC(addr, p); | |
if (*p == *s) { | |
p++; | |
STACK_PUSH_ALT(p + addr, s, sprev, pkeep); | |
MOP_OUT; | |
JUMP; | |
} | |
p++; | |
MOP_OUT; | |
JUMP; | |
CASE(OP_REPEAT) MOP_IN(OP_REPEAT); | |
{ | |
GET_MEMNUM_INC(mem, p); /* mem: OP_REPEAT ID */ | |
GET_RELADDR_INC(addr, p); | |
STACK_ENSURE(1); | |
repeat_stk[mem] = GET_STACK_INDEX(stk); | |
STACK_PUSH_REPEAT(mem, p); | |
if (reg->repeat_range[mem].lower == 0) { | |
STACK_PUSH_ALT(p + addr, s, sprev, pkeep); | |
} | |
} | |
MOP_OUT; | |
JUMP; | |
CASE(OP_REPEAT_NG) MOP_IN(OP_REPEAT_NG); | |
{ | |
GET_MEMNUM_INC(mem, p); /* mem: OP_REPEAT ID */ | |
GET_RELADDR_INC(addr, p); | |
STACK_ENSURE(1); | |
repeat_stk[mem] = GET_STACK_INDEX(stk); | |
STACK_PUSH_REPEAT(mem, p); | |
if (reg->repeat_range[mem].lower == 0) { | |
STACK_PUSH_ALT(p, s, sprev, pkeep); | |
p += addr; | |
} | |
} | |
MOP_OUT; | |
JUMP; | |
CASE(OP_REPEAT_INC) MOP_IN(OP_REPEAT_INC); | |
GET_MEMNUM_INC(mem, p); /* mem: OP_REPEAT ID */ | |
si = repeat_stk[mem]; | |
stkp = STACK_AT(si); | |
repeat_inc: | |
stkp->u.repeat.count++; | |
if (stkp->u.repeat.count >= reg->repeat_range[mem].upper) { | |
/* end of repeat. Nothing to do. */ | |
} | |
else if (stkp->u.repeat.count >= reg->repeat_range[mem].lower) { | |
STACK_PUSH_ALT(p, s, sprev, pkeep); | |
p = STACK_AT(si)->u.repeat.pcode; /* Don't use stkp after PUSH. */ | |
} | |
else { | |
p = stkp->u.repeat.pcode; | |
} | |
STACK_PUSH_REPEAT_INC(si); | |
MOP_OUT; | |
CHECK_INTERRUPT_IN_MATCH_AT; | |
JUMP; | |
CASE(OP_REPEAT_INC_SG) MOP_IN(OP_REPEAT_INC_SG); | |
GET_MEMNUM_INC(mem, p); /* mem: OP_REPEAT ID */ | |
STACK_GET_REPEAT(mem, stkp); | |
si = GET_STACK_INDEX(stkp); | |
goto repeat_inc; | |
NEXT; | |
CASE(OP_REPEAT_INC_NG) MOP_IN(OP_REPEAT_INC_NG); | |
GET_MEMNUM_INC(mem, p); /* mem: OP_REPEAT ID */ | |
si = repeat_stk[mem]; | |
stkp = STACK_AT(si); | |
repeat_inc_ng: | |
stkp->u.repeat.count++; | |
if (stkp->u.repeat.count < reg->repeat_range[mem].upper) { | |
if (stkp->u.repeat.count >= reg->repeat_range[mem].lower) { | |
UChar* pcode = stkp->u.repeat.pcode; | |
STACK_PUSH_REPEAT_INC(si); | |
STACK_PUSH_ALT(pcode, s, sprev, pkeep); | |
} | |
else { | |
p = stkp->u.repeat.pcode; | |
STACK_PUSH_REPEAT_INC(si); | |
} | |
} | |
else if (stkp->u.repeat.count == reg->repeat_range[mem].upper) { | |
STACK_PUSH_REPEAT_INC(si); | |
} | |
MOP_OUT; | |
CHECK_INTERRUPT_IN_MATCH_AT; | |
JUMP; | |
CASE(OP_REPEAT_INC_NG_SG) MOP_IN(OP_REPEAT_INC_NG_SG); | |
GET_MEMNUM_INC(mem, p); /* mem: OP_REPEAT ID */ | |
STACK_GET_REPEAT(mem, stkp); | |
si = GET_STACK_INDEX(stkp); | |
goto repeat_inc_ng; | |
NEXT; | |
CASE(OP_PUSH_POS) MOP_IN(OP_PUSH_POS); | |
STACK_PUSH_POS(s, sprev, pkeep); | |
MOP_OUT; | |
JUMP; | |
CASE(OP_POP_POS) MOP_IN(OP_POP_POS); | |
{ | |
STACK_POS_END(stkp); | |
s = stkp->u.state.pstr; | |
sprev = stkp->u.state.pstr_prev; | |
} | |
MOP_OUT; | |
JUMP; | |
CASE(OP_PUSH_POS_NOT) MOP_IN(OP_PUSH_POS_NOT); | |
GET_RELADDR_INC(addr, p); | |
STACK_PUSH_POS_NOT(p + addr, s, sprev, pkeep); | |
MOP_OUT; | |
JUMP; | |
CASE(OP_FAIL_POS) MOP_IN(OP_FAIL_POS); | |
STACK_POP_TIL_POS_NOT; | |
goto fail; | |
NEXT; | |
CASE(OP_PUSH_STOP_BT) MOP_IN(OP_PUSH_STOP_BT); | |
STACK_PUSH_STOP_BT; | |
MOP_OUT; | |
JUMP; | |
CASE(OP_POP_STOP_BT) MOP_IN(OP_POP_STOP_BT); | |
STACK_STOP_BT_END; | |
MOP_OUT; | |
JUMP; | |
CASE(OP_LOOK_BEHIND) MOP_IN(OP_LOOK_BEHIND); | |
GET_LENGTH_INC(tlen, p); | |
s = (UChar* )ONIGENC_STEP_BACK(encode, str, s, end, (int )tlen); | |
if (IS_NULL(s)) goto fail; | |
sprev = (UChar* )onigenc_get_prev_char_head(encode, str, s, end); | |
MOP_OUT; | |
JUMP; | |
CASE(OP_PUSH_LOOK_BEHIND_NOT) MOP_IN(OP_PUSH_LOOK_BEHIND_NOT); | |
GET_RELADDR_INC(addr, p); | |
GET_LENGTH_INC(tlen, p); | |
q = (UChar* )ONIGENC_STEP_BACK(encode, str, s, end, (int )tlen); | |
if (IS_NULL(q)) { | |
/* too short case -> success. ex. /(?<!XXX)a/.match("a") | |
If you want to change to fail, replace following line. */ | |
p += addr; | |
/* goto fail; */ | |
} | |
else { | |
STACK_PUSH_LOOK_BEHIND_NOT(p + addr, s, sprev, pkeep); | |
s = q; | |
sprev = (UChar* )onigenc_get_prev_char_head(encode, str, s, end); | |
} | |
MOP_OUT; | |
JUMP; | |
CASE(OP_FAIL_LOOK_BEHIND_NOT) MOP_IN(OP_FAIL_LOOK_BEHIND_NOT); | |
STACK_POP_TIL_LOOK_BEHIND_NOT; | |
goto fail; | |
NEXT; | |
CASE(OP_PUSH_ABSENT_POS) MOP_IN(OP_PUSH_ABSENT_POS); | |
/* Save the absent-start-pos and the original end-pos. */ | |
STACK_PUSH_ABSENT_POS(s, ABSENT_END_POS); | |
MOP_OUT; | |
JUMP; | |
CASE(OP_ABSENT) MOP_IN(OP_ABSENT); | |
{ | |
const UChar* aend = ABSENT_END_POS; | |
UChar* absent; | |
UChar* selfp = p - 1; | |
STACK_POP_ABSENT_POS(absent, ABSENT_END_POS); /* Restore end-pos. */ | |
GET_RELADDR_INC(addr, p); | |
#ifdef ONIG_DEBUG_MATCH | |
fprintf(stderr, "ABSENT: s:%p, end:%p, absent:%p, aend:%p\n", s, end, absent, aend); | |
#endif | |
if ((absent > aend) && (s > absent)) { | |
/* An empty match occurred in (?~...) at the start point. | |
* Never match. */ | |
STACK_POP; | |
goto fail; | |
} | |
else if ((s >= aend) && (s > absent)) { | |
if (s > aend) { | |
/* Only one (or less) character matched in the last iteration. | |
* This is not a possible point. */ | |
goto fail; | |
} | |
/* All possible points were found. Try matching after (?~...). */ | |
DATA_ENSURE(0); | |
p += addr; | |
} | |
else { | |
STACK_PUSH_ALT(p + addr, s, sprev, pkeep); /* Push possible point. */ | |
n = enclen(encode, s, end); | |
STACK_PUSH_ABSENT_POS(absent, ABSENT_END_POS); /* Save the original pos. */ | |
STACK_PUSH_ALT(selfp, s + n, s, pkeep); /* Next iteration. */ | |
STACK_PUSH_ABSENT; | |
ABSENT_END_POS = aend; | |
} | |
} | |
MOP_OUT; | |
JUMP; | |
CASE(OP_ABSENT_END) MOP_IN(OP_ABSENT_END); | |
/* The pattern inside (?~...) was matched. | |
* Set the end-pos temporary and go to next iteration. */ | |
if (sprev < ABSENT_END_POS) | |
ABSENT_END_POS = sprev; | |
#ifdef ONIG_DEBUG_MATCH | |
fprintf(stderr, "ABSENT_END: end:%p\n", ABSENT_END_POS); | |
#endif | |
STACK_POP_TIL_ABSENT; | |
goto fail; | |
NEXT; | |
#ifdef USE_SUBEXP_CALL | |
CASE(OP_CALL) MOP_IN(OP_CALL); | |
GET_ABSADDR_INC(addr, p); | |
STACK_PUSH_CALL_FRAME(p); | |
p = reg->p + addr; | |
MOP_OUT; | |
JUMP; | |
CASE(OP_RETURN) MOP_IN(OP_RETURN); | |
STACK_RETURN(p); | |
STACK_PUSH_RETURN; | |
MOP_OUT; | |
JUMP; | |
#endif | |
CASE(OP_CONDITION) MOP_IN(OP_CONDITION); | |
GET_MEMNUM_INC(mem, p); | |
GET_RELADDR_INC(addr, p); | |
if ((mem > num_mem) || | |
(mem_end_stk[mem] == INVALID_STACK_INDEX) || | |
(mem_start_stk[mem] == INVALID_STACK_INDEX)) { | |
p += addr; | |
} | |
MOP_OUT; | |
JUMP; | |
CASE(OP_FINISH) | |
goto finish; | |
NEXT; | |
CASE(OP_FAIL) | |
if (0) { | |
/* fall */ | |
fail: | |
MOP_OUT; | |
} | |
MOP_IN(OP_FAIL); | |
STACK_POP; | |
p = stk->u.state.pcode; | |
s = stk->u.state.pstr; | |
sprev = stk->u.state.pstr_prev; | |
pkeep = stk->u.state.pkeep; | |
#ifdef USE_COMBINATION_EXPLOSION_CHECK | |
if (stk->u.state.state_check != 0) { | |
stk->type = STK_STATE_CHECK_MARK; | |
stk++; | |
} | |
#endif | |
MOP_OUT; | |
JUMP; | |
DEFAULT | |
goto bytecode_error; | |
} VM_LOOP_END | |
finish: | |
STACK_SAVE; | |
if (xmalloc_base) xfree(xmalloc_base); | |
return best_len; | |
#ifdef ONIG_DEBUG | |
stack_error: | |
STACK_SAVE; | |
if (xmalloc_base) xfree(xmalloc_base); | |
return ONIGERR_STACK_BUG; | |
#endif | |
bytecode_error: | |
STACK_SAVE; | |
if (xmalloc_base) xfree(xmalloc_base); | |
return ONIGERR_UNDEFINED_BYTECODE; | |
unexpected_bytecode_error: | |
STACK_SAVE; | |
if (xmalloc_base) xfree(xmalloc_base); | |
return ONIGERR_UNEXPECTED_BYTECODE; | |
} | |
static UChar* | |
slow_search(OnigEncoding enc, UChar* target, UChar* target_end, | |
const UChar* text, const UChar* text_end, UChar* text_range) | |
{ | |
UChar *t, *p, *s, *end; | |
end = (UChar* )text_end; | |
end -= target_end - target - 1; | |
if (end > text_range) | |
end = text_range; | |
s = (UChar* )text; | |
if (enc->max_enc_len == enc->min_enc_len) { | |
int n = enc->max_enc_len; | |
while (s < end) { | |
if (*s == *target) { | |
p = s + 1; | |
t = target + 1; | |
if (target_end == t || memcmp(t, p, target_end - t) == 0) | |
return s; | |
} | |
s += n; | |
} | |
return (UChar* )NULL; | |
} | |
while (s < end) { | |
if (*s == *target) { | |
p = s + 1; | |
t = target + 1; | |
if (target_end == t || memcmp(t, p, target_end - t) == 0) | |
return s; | |
} | |
s += enclen(enc, s, text_end); | |
} | |
return (UChar* )NULL; | |
} | |
static int | |
str_lower_case_match(OnigEncoding enc, int case_fold_flag, | |
const UChar* t, const UChar* tend, | |
const UChar* p, const UChar* end) | |
{ | |
int lowlen; | |
UChar *q, lowbuf[ONIGENC_MBC_CASE_FOLD_MAXLEN]; | |
while (t < tend) { | |
lowlen = ONIGENC_MBC_CASE_FOLD(enc, case_fold_flag, &p, end, lowbuf); | |
q = lowbuf; | |
while (lowlen > 0) { | |
if (*t++ != *q++) return 0; | |
lowlen--; | |
} | |
} | |
return 1; | |
} | |
static UChar* | |
slow_search_ic(OnigEncoding enc, int case_fold_flag, | |
UChar* target, UChar* target_end, | |
const UChar* text, const UChar* text_end, UChar* text_range) | |
{ | |
UChar *s, *end; | |
end = (UChar* )text_end; | |
end -= target_end - target - 1; | |
if (end > text_range) | |
end = text_range; | |
s = (UChar* )text; | |
while (s < end) { | |
if (str_lower_case_match(enc, case_fold_flag, target, target_end, | |
s, text_end)) | |
return s; | |
s += enclen(enc, s, text_end); | |
} | |
return (UChar* )NULL; | |
} | |
static UChar* | |
slow_search_backward(OnigEncoding enc, UChar* target, UChar* target_end, | |
const UChar* text, const UChar* adjust_text, | |
const UChar* text_end, const UChar* text_start) | |
{ | |
UChar *t, *p, *s; | |
s = (UChar* )text_end; | |
s -= (target_end - target); | |
if (s > text_start) | |
s = (UChar* )text_start; | |
else | |
s = ONIGENC_LEFT_ADJUST_CHAR_HEAD(enc, adjust_text, s, text_end); | |
while (s >= text) { | |
if (*s == *target) { | |
p = s + 1; | |
t = target + 1; | |
while (t < target_end) { | |
if (*t != *p++) | |
break; | |
t++; | |
} | |
if (t == target_end) | |
return s; | |
} | |
s = (UChar* )onigenc_get_prev_char_head(enc, adjust_text, s, text_end); | |
} | |
return (UChar* )NULL; | |
} | |
static UChar* | |
slow_search_backward_ic(OnigEncoding enc, int case_fold_flag, | |
UChar* target, UChar* target_end, | |
const UChar* text, const UChar* adjust_text, | |
const UChar* text_end, const UChar* text_start) | |
{ | |
UChar *s; | |
s = (UChar* )text_end; | |
s -= (target_end - target); | |
if (s > text_start) | |
s = (UChar* )text_start; | |
else | |
s = ONIGENC_LEFT_ADJUST_CHAR_HEAD(enc, adjust_text, s, text_end); | |
while (s >= text) { | |
if (str_lower_case_match(enc, case_fold_flag, | |
target, target_end, s, text_end)) | |
return s; | |
s = (UChar* )onigenc_get_prev_char_head(enc, adjust_text, s, text_end); | |
} | |
return (UChar* )NULL; | |
} | |
#ifndef USE_SUNDAY_QUICK_SEARCH | |
/* Boyer-Moore-Horspool search applied to a multibyte string */ | |
static UChar* | |
bm_search_notrev(regex_t* reg, const UChar* target, const UChar* target_end, | |
const UChar* text, const UChar* text_end, | |
const UChar* text_range) | |
{ | |
const UChar *s, *se, *t, *p, *end; | |
const UChar *tail; | |
ptrdiff_t skip, tlen1; | |
# ifdef ONIG_DEBUG_SEARCH | |
fprintf(stderr, "bm_search_notrev: text: %"PRIuPTR" (%p), text_end: %"PRIuPTR" (%p), text_range: %"PRIuPTR" (%p)\n", | |
(uintptr_t )text, text, (uintptr_t )text_end, text_end, (uintptr_t )text_range, text_range); | |
# endif | |
tail = target_end - 1; | |
tlen1 = tail - target; | |
end = text_range; | |
if (end + tlen1 > text_end) | |
end = text_end - tlen1; | |
s = text; | |
if (IS_NULL(reg->int_map)) { | |
while (s < end) { | |
p = se = s + tlen1; | |
t = tail; | |
while (*p == *t) { | |
if (t == target) return (UChar* )s; | |
p--; t--; | |
} | |
skip = reg->map[*se]; | |
t = s; | |
do { | |
s += enclen(reg->enc, s, end); | |
} while ((s - t) < skip && s < end); | |
} | |
} | |
else { | |
# if OPT_EXACT_MAXLEN >= ONIG_CHAR_TABLE_SIZE | |
while (s < end) { | |
p = se = s + tlen1; | |
t = tail; | |
while (*p == *t) { | |
if (t == target) return (UChar* )s; | |
p--; t--; | |
} | |
skip = reg->int_map[*se]; | |
t = s; | |
do { | |
s += enclen(reg->enc, s, end); | |
} while ((s - t) < skip && s < end); | |
} | |
# endif | |
} | |
return (UChar* )NULL; | |
} | |
/* Boyer-Moore-Horspool search */ | |
static UChar* | |
bm_search(regex_t* reg, const UChar* target, const UChar* target_end, | |
const UChar* text, const UChar* text_end, const UChar* text_range) | |
{ | |
const UChar *s, *t, *p, *end; | |
const UChar *tail; | |
# ifdef ONIG_DEBUG_SEARCH | |
fprintf(stderr, "bm_search: text: %"PRIuPTR" (%p), text_end: %"PRIuPTR" (%p), text_range: %"PRIuPTR" (%p)\n", | |
(uintptr_t )text, text, (uintptr_t )text_end, text_end, (uintptr_t )text_range, text_range); | |
# endif | |
end = text_range + (target_end - target) - 1; | |
if (end > text_end) | |
end = text_end; | |
tail = target_end - 1; | |
s = text + (target_end - target) - 1; | |
if (IS_NULL(reg->int_map)) { | |
while (s < end) { | |
p = s; | |
t = tail; | |
# ifdef ONIG_DEBUG_SEARCH | |
fprintf(stderr, "bm_search_loop: pos: %"PRIdPTR" %s\n", | |
(intptr_t )(s - text), s); | |
# endif | |
while (*p == *t) { | |
if (t == target) return (UChar* )p; | |
p--; t--; | |
} | |
s += reg->map[*s]; | |
} | |
} | |
else { /* see int_map[] */ | |
# if OPT_EXACT_MAXLEN >= ONIG_CHAR_TABLE_SIZE | |
while (s < end) { | |
p = s; | |
t = tail; | |
while (*p == *t) { | |
if (t == target) return (UChar* )p; | |
p--; t--; | |
} | |
s += reg->int_map[*s]; | |
} | |
# endif | |
} | |
return (UChar* )NULL; | |
} | |
/* Boyer-Moore-Horspool search applied to a multibyte string (ignore case) */ | |
static UChar* | |
bm_search_notrev_ic(regex_t* reg, const UChar* target, const UChar* target_end, | |
const UChar* text, const UChar* text_end, | |
const UChar* text_range) | |
{ | |
const UChar *s, *se, *t, *end; | |
const UChar *tail; | |
ptrdiff_t skip, tlen1; | |
OnigEncoding enc = reg->enc; | |
int case_fold_flag = reg->case_fold_flag; | |
# ifdef ONIG_DEBUG_SEARCH | |
fprintf(stderr, "bm_search_notrev_ic: text: %d (%p), text_end: %d (%p), text_range: %d (%p)\n", | |
(int )text, text, (int )text_end, text_end, (int )text_range, text_range); | |
# endif | |
tail = target_end - 1; | |
tlen1 = tail - target; | |
end = text_range; | |
if (end + tlen1 > text_end) | |
end = text_end - tlen1; | |
s = text; | |
if (IS_NULL(reg->int_map)) { | |
while (s < end) { | |
se = s + tlen1; | |
if (str_lower_case_match(enc, case_fold_flag, target, target_end, | |
s, se + 1)) | |
return (UChar* )s; | |
skip = reg->map[*se]; | |
t = s; | |
do { | |
s += enclen(reg->enc, s, end); | |
} while ((s - t) < skip && s < end); | |
} | |
} | |
else { | |
# if OPT_EXACT_MAXLEN >= ONIG_CHAR_TABLE_SIZE | |
while (s < end) { | |
se = s + tlen1; | |
if (str_lower_case_match(enc, case_fold_flag, target, target_end, | |
s, se + 1)) | |
return (UChar* )s; | |
skip = reg->int_map[*se]; | |
t = s; | |
do { | |
s += enclen(reg->enc, s, end); | |
} while ((s - t) < skip && s < end); | |
} | |
# endif | |
} | |
return (UChar* )NULL; | |
} | |
/* Boyer-Moore-Horspool search (ignore case) */ | |
static UChar* | |
bm_search_ic(regex_t* reg, const UChar* target, const UChar* target_end, | |
const UChar* text, const UChar* text_end, const UChar* text_range) | |
{ | |
const UChar *s, *p, *end; | |
const UChar *tail; | |
OnigEncoding enc = reg->enc; | |
int case_fold_flag = reg->case_fold_flag; | |
# ifdef ONIG_DEBUG_SEARCH | |
fprintf(stderr, "bm_search_ic: text: %d (%p), text_end: %d (%p), text_range: %d (%p)\n", | |
(int )text, text, (int )text_end, text_end, (int )text_range, text_range); | |
# endif | |
end = text_range + (target_end - target) - 1; | |
if (end > text_end) | |
end = text_end; | |
tail = target_end - 1; | |
s = text + (target_end - target) - 1; | |
if (IS_NULL(reg->int_map)) { | |
while (s < end) { | |
p = s - (target_end - target) + 1; | |
if (str_lower_case_match(enc, case_fold_flag, target, target_end, | |
p, s + 1)) | |
return (UChar* )p; | |
s += reg->map[*s]; | |
} | |
} | |
else { /* see int_map[] */ | |
# if OPT_EXACT_MAXLEN >= ONIG_CHAR_TABLE_SIZE | |
while (s < end) { | |
p = s - (target_end - target) + 1; | |
if (str_lower_case_match(enc, case_fold_flag, target, target_end, | |
p, s + 1)) | |
return (UChar* )p; | |
s += reg->int_map[*s]; | |
} | |
# endif | |
} | |
return (UChar* )NULL; | |
} | |
#else /* USE_SUNDAY_QUICK_SEARCH */ | |
/* Sunday's quick search applied to a multibyte string */ | |
static UChar* | |
bm_search_notrev(regex_t* reg, const UChar* target, const UChar* target_end, | |
const UChar* text, const UChar* text_end, | |
const UChar* text_range) | |
{ | |
const UChar *s, *se, *t, *p, *end; | |
const UChar *tail; | |
ptrdiff_t skip, tlen1; | |
OnigEncoding enc = reg->enc; | |
# ifdef ONIG_DEBUG_SEARCH | |
fprintf(stderr, "bm_search_notrev: text: %"PRIuPTR" (%p), text_end: %"PRIuPTR" (%p), text_range: %"PRIuPTR" (%p)\n", | |
(uintptr_t )text, text, (uintptr_t )text_end, text_end, (uintptr_t )text_range, text_range); | |
# endif | |
tail = target_end - 1; | |
tlen1 = tail - target; | |
end = text_range; | |
if (end + tlen1 > text_end) | |
end = text_end - tlen1; | |
s = text; | |
if (IS_NULL(reg->int_map)) { | |
while (s < end) { | |
p = se = s + tlen1; | |
t = tail; | |
while (*p == *t) { | |
if (t == target) return (UChar* )s; | |
p--; t--; | |
} | |
if (s + 1 >= end) break; | |
skip = reg->map[se[1]]; | |
t = s; | |
do { | |
s += enclen(enc, s, end); | |
} while ((s - t) < skip && s < end); | |
} | |
} | |
else { | |
# if OPT_EXACT_MAXLEN >= ONIG_CHAR_TABLE_SIZE | |
while (s < end) { | |
p = se = s + tlen1; | |
t = tail; | |
while (*p == *t) { | |
if (t == target) return (UChar* )s; | |
p--; t--; | |
} | |
if (s + 1 >= end) break; | |
skip = reg->int_map[se[1]]; | |
t = s; | |
do { | |
s += enclen(enc, s, end); | |
} while ((s - t) < skip && s < end); | |
} | |
# endif | |
} | |
return (UChar* )NULL; | |
} | |
/* Sunday's quick search */ | |
static UChar* | |
bm_search(regex_t* reg, const UChar* target, const UChar* target_end, | |
const UChar* text, const UChar* text_end, const UChar* text_range) | |
{ | |
const UChar *s, *t, *p, *end; | |
const UChar *tail; | |
ptrdiff_t tlen1; | |
# ifdef ONIG_DEBUG_SEARCH | |
fprintf(stderr, "bm_search: text: %"PRIuPTR" (%p), text_end: %"PRIuPTR" (%p), text_range: %"PRIuPTR" (%p)\n", | |
(uintptr_t )text, text, (uintptr_t )text_end, text_end, (uintptr_t )text_range, text_range); | |
# endif | |
tail = target_end - 1; | |
tlen1 = tail - target; | |
end = text_range + tlen1; | |
if (end > text_end) | |
end = text_end; | |
s = text + tlen1; | |
if (IS_NULL(reg->int_map)) { | |
while (s < end) { | |
p = s; | |
t = tail; | |
while (*p == *t) { | |
if (t == target) return (UChar* )p; | |
p--; t--; | |
} | |
if (s + 1 >= end) break; | |
s += reg->map[s[1]]; | |
} | |
} | |
else { /* see int_map[] */ | |
# if OPT_EXACT_MAXLEN >= ONIG_CHAR_TABLE_SIZE | |
while (s < end) { | |
p = s; | |
t = tail; | |
while (*p == *t) { | |
if (t == target) return (UChar* )p; | |
p--; t--; | |
} | |
if (s + 1 >= end) break; | |
s += reg->int_map[s[1]]; | |
} | |
# endif | |
} | |
return (UChar* )NULL; | |
} | |
/* Sunday's quick search applied to a multibyte string (ignore case) */ | |
static UChar* | |
bm_search_notrev_ic(regex_t* reg, const UChar* target, const UChar* target_end, | |
const UChar* text, const UChar* text_end, | |
const UChar* text_range) | |
{ | |
const UChar *s, *se, *t, *end; | |
const UChar *tail; | |
ptrdiff_t skip, tlen1; | |
OnigEncoding enc = reg->enc; | |
int case_fold_flag = reg->case_fold_flag; | |
# ifdef ONIG_DEBUG_SEARCH | |
fprintf(stderr, "bm_search_notrev_ic: text: %"PRIuPTR" (%p), text_end: %"PRIuPTR" (%p), text_range: %"PRIuPTR" (%p)\n", | |
(uintptr_t )text, text, (uintptr_t )text_end, text_end, (uintptr_t )text_range, text_range); | |
# endif | |
tail = target_end - 1; | |
tlen1 = tail - target; | |
end = text_range; | |
if (end + tlen1 > text_end) | |
end = text_end - tlen1; | |
s = text; | |
if (IS_NULL(reg->int_map)) { | |
while (s < end) { | |
se = s + tlen1; | |
if (str_lower_case_match(enc, case_fold_flag, target, target_end, | |
s, se + 1)) | |
return (UChar* )s; | |
if (s + 1 >= end) break; | |
skip = reg->map[se[1]]; | |
t = s; | |
do { | |
s += enclen(enc, s, end); | |
} while ((s - t) < skip && s < end); | |
} | |
} | |
else { | |
# if OPT_EXACT_MAXLEN >= ONIG_CHAR_TABLE_SIZE | |
while (s < end) { | |
se = s + tlen1; | |
if (str_lower_case_match(enc, case_fold_flag, target, target_end, | |
s, se + 1)) | |
return (UChar* )s; | |
if (s + 1 >= end) break; | |
skip = reg->int_map[se[1]]; | |
t = s; | |
do { | |
s += enclen(enc, s, end); | |
} while ((s - t) < skip && s < end); | |
} | |
# endif | |
} | |
return (UChar* )NULL; | |
} | |
/* Sunday's quick search (ignore case) */ | |
static UChar* | |
bm_search_ic(regex_t* reg, const UChar* target, const UChar* target_end, | |
const UChar* text, const UChar* text_end, const UChar* text_range) | |
{ | |
const UChar *s, *p, *end; | |
const UChar *tail; | |
ptrdiff_t tlen1; | |
OnigEncoding enc = reg->enc; | |
int case_fold_flag = reg->case_fold_flag; | |
# ifdef ONIG_DEBUG_SEARCH | |
fprintf(stderr, "bm_search_ic: text: %"PRIuPTR" (%p), text_end: %"PRIuPTR" (%p), text_range: %"PRIuPTR" (%p)\n", | |
(uintptr_t )text, text, (uintptr_t )text_end, text_end, (uintptr_t )text_range, text_range); | |
# endif | |
tail = target_end - 1; | |
tlen1 = tail - target; | |
end = text_range + tlen1; | |
if (end > text_end) | |
end = text_end; | |
s = text + tlen1; | |
if (IS_NULL(reg->int_map)) { | |
while (s < end) { | |
p = s - tlen1; | |
if (str_lower_case_match(enc, case_fold_flag, target, target_end, | |
p, s + 1)) | |
return (UChar* )p; | |
if (s + 1 >= end) break; | |
s += reg->map[s[1]]; | |
} | |
} | |
else { /* see int_map[] */ | |
# if OPT_EXACT_MAXLEN >= ONIG_CHAR_TABLE_SIZE | |
while (s < end) { | |
p = s - tlen1; | |
if (str_lower_case_match(enc, case_fold_flag, target, target_end, | |
p, s + 1)) | |
return (UChar* )p; | |
if (s + 1 >= end) break; | |
s += reg->int_map[s[1]]; | |
} | |
# endif | |
} | |
return (UChar* )NULL; | |
} | |
#endif /* USE_SUNDAY_QUICK_SEARCH */ | |
#ifdef USE_INT_MAP_BACKWARD | |
static int | |
set_bm_backward_skip(UChar* s, UChar* end, OnigEncoding enc ARG_UNUSED, | |
int** skip) | |
{ | |
int i, len; | |
if (IS_NULL(*skip)) { | |
*skip = (int* )xmalloc(sizeof(int) * ONIG_CHAR_TABLE_SIZE); | |
if (IS_NULL(*skip)) return ONIGERR_MEMORY; | |
} | |
len = (int )(end - s); | |
for (i = 0; i < ONIG_CHAR_TABLE_SIZE; i++) | |
(*skip)[i] = len; | |
for (i = len - 1; i > 0; i--) | |
(*skip)[s[i]] = i; | |
return 0; | |
} | |
static UChar* | |
bm_search_backward(regex_t* reg, const UChar* target, const UChar* target_end, | |
const UChar* text, const UChar* adjust_text, | |
const UChar* text_end, const UChar* text_start) | |
{ | |
const UChar *s, *t, *p; | |
s = text_end - (target_end - target); | |
if (text_start < s) | |
s = text_start; | |
else | |
s = ONIGENC_LEFT_ADJUST_CHAR_HEAD(reg->enc, adjust_text, s, text_end); | |
while (s >= text) { | |
p = s; | |
t = target; | |
while (t < target_end && *p == *t) { | |
p++; t++; | |
} | |
if (t == target_end) | |
return (UChar* )s; | |
s -= reg->int_map_backward[*s]; | |
s = ONIGENC_LEFT_ADJUST_CHAR_HEAD(reg->enc, adjust_text, s, text_end); | |
} | |
return (UChar* )NULL; | |
} | |
#endif | |
static UChar* | |
map_search(OnigEncoding enc, UChar map[], | |
const UChar* text, const UChar* text_range, const UChar* text_end) | |
{ | |
const UChar *s = text; | |
while (s < text_range) { | |
if (map[*s]) return (UChar* )s; | |
s += enclen(enc, s, text_end); | |
} | |
return (UChar* )NULL; | |
} | |
static UChar* | |
map_search_backward(OnigEncoding enc, UChar map[], | |
const UChar* text, const UChar* adjust_text, | |
const UChar* text_start, const UChar* text_end) | |
{ | |
const UChar *s = text_start; | |
while (s >= text) { | |
if (map[*s]) return (UChar* )s; | |
s = onigenc_get_prev_char_head(enc, adjust_text, s, text_end); | |
} | |
return (UChar* )NULL; | |
} | |
extern OnigPosition | |
onig_match(regex_t* reg, const UChar* str, const UChar* end, const UChar* at, OnigRegion* region, | |
OnigOptionType option) | |
{ | |
ptrdiff_t r; | |
UChar *prev; | |
OnigMatchArg msa; | |
MATCH_ARG_INIT(msa, option, region, at, at); | |
#ifdef USE_COMBINATION_EXPLOSION_CHECK | |
{ | |
ptrdiff_t offset = at - str; | |
STATE_CHECK_BUFF_INIT(msa, end - str, offset, reg->num_comb_exp_check); | |
} | |
#endif | |
if (region) { | |
r = onig_region_resize_clear(region, reg->num_mem + 1); | |
} | |
else | |
r = 0; | |
if (r == 0) { | |
prev = (UChar* )onigenc_get_prev_char_head(reg->enc, str, at, end); | |
r = match_at(reg, str, end, | |
#ifdef USE_MATCH_RANGE_MUST_BE_INSIDE_OF_SPECIFIED_RANGE | |
end, | |
#endif | |
at, prev, &msa); | |
} | |
MATCH_ARG_FREE(msa); | |
return r; | |
} | |
static int | |
forward_search_range(regex_t* reg, const UChar* str, const UChar* end, UChar* s, | |
UChar* range, UChar** low, UChar** high, UChar** low_prev) | |
{ | |
UChar *p, *pprev = (UChar* )NULL; | |
#ifdef ONIG_DEBUG_SEARCH | |
fprintf(stderr, "forward_search_range: str: %"PRIuPTR" (%p), end: %"PRIuPTR" (%p), s: %"PRIuPTR" (%p), range: %"PRIuPTR" (%p)\n", | |
(uintptr_t )str, str, (uintptr_t )end, end, (uintptr_t )s, s, (uintptr_t )range, range); | |
#endif | |
p = s; | |
if (reg->dmin > 0) { | |
if (ONIGENC_IS_SINGLEBYTE(reg->enc)) { | |
p += reg->dmin; | |
} | |
else { | |
UChar *q = p + reg->dmin; | |
if (q >= end) return 0; /* fail */ | |
while (p < q) p += enclen(reg->enc, p, end); | |
} | |
} | |
retry: | |
switch (reg->optimize) { | |
case ONIG_OPTIMIZE_EXACT: | |
p = slow_search(reg->enc, reg->exact, reg->exact_end, p, end, range); | |
break; | |
case ONIG_OPTIMIZE_EXACT_IC: | |
p = slow_search_ic(reg->enc, reg->case_fold_flag, | |
reg->exact, reg->exact_end, p, end, range); | |
break; | |
case ONIG_OPTIMIZE_EXACT_BM: | |
p = bm_search(reg, reg->exact, reg->exact_end, p, end, range); | |
break; | |
case ONIG_OPTIMIZE_EXACT_BM_NOT_REV: | |
p = bm_search_notrev(reg, reg->exact, reg->exact_end, p, end, range); | |
break; | |
case ONIG_OPTIMIZE_EXACT_BM_IC: | |
p = bm_search_ic(reg, reg->exact, reg->exact_end, p, end, range); | |
break; | |
case ONIG_OPTIMIZE_EXACT_BM_NOT_REV_IC: | |
p = bm_search_notrev_ic(reg, reg->exact, reg->exact_end, p, end, range); | |
break; | |
case ONIG_OPTIMIZE_MAP: | |
p = map_search(reg->enc, reg->map, p, range, end); | |
break; | |
} | |
if (p && p < range) { | |
if (p - reg->dmin < s) { | |
retry_gate: | |
pprev = p; | |
p += enclen(reg->enc, p, end); | |
goto retry; | |
} | |
if (reg->sub_anchor) { | |
UChar* prev; | |
switch (reg->sub_anchor) { | |
case ANCHOR_BEGIN_LINE: | |
if (!ON_STR_BEGIN(p)) { | |
prev = onigenc_get_prev_char_head(reg->enc, | |
(pprev ? pprev : str), p, end); | |
if (!ONIGENC_IS_MBC_NEWLINE_EX(reg->enc, prev, str, end, reg->options, 0)) | |
goto retry_gate; | |
} | |
break; | |
case ANCHOR_END_LINE: | |
if (ON_STR_END(p)) { | |
#ifndef USE_NEWLINE_AT_END_OF_STRING_HAS_EMPTY_LINE | |
prev = (UChar* )onigenc_get_prev_char_head(reg->enc, | |
(pprev ? pprev : str), p); | |
if (prev && ONIGENC_IS_MBC_NEWLINE_EX(reg->enc, prev, str, end, reg->options, 1)) | |
goto retry_gate; | |
#endif | |
} | |
else if (! ONIGENC_IS_MBC_NEWLINE_EX(reg->enc, p, str, end, reg->options, 1)) | |
goto retry_gate; | |
break; | |
} | |
} | |
if (reg->dmax == 0) { | |
*low = p; | |
if (low_prev) { | |
if (*low > s) | |
*low_prev = onigenc_get_prev_char_head(reg->enc, s, p, end); | |
else | |
*low_prev = onigenc_get_prev_char_head(reg->enc, | |
(pprev ? pprev : str), p, end); | |
} | |
} | |
else { | |
if (reg->dmax != ONIG_INFINITE_DISTANCE) { | |
if (p < str + reg->dmax) { | |
*low = (UChar* )str; | |
if (low_prev) | |
*low_prev = onigenc_get_prev_char_head(reg->enc, str, *low, end); | |
} | |
else { | |
*low = p - reg->dmax; | |
if (*low > s) { | |
*low = onigenc_get_right_adjust_char_head_with_prev(reg->enc, s, | |
*low, end, (const UChar** )low_prev); | |
if (low_prev && IS_NULL(*low_prev)) | |
*low_prev = onigenc_get_prev_char_head(reg->enc, | |
(pprev ? pprev : s), *low, end); | |
} | |
else { | |
if (low_prev) | |
*low_prev = onigenc_get_prev_char_head(reg->enc, | |
(pprev ? pprev : str), *low, end); | |
} | |
} | |
} | |
} | |
/* no needs to adjust *high, *high is used as range check only */ | |
*high = p - reg->dmin; | |
#ifdef ONIG_DEBUG_SEARCH | |
fprintf(stderr, | |
"forward_search_range success: low: %"PRIdPTR", high: %"PRIdPTR", dmin: %"PRIdPTR", dmax: %"PRIdPTR"\n", | |
*low - str, *high - str, reg->dmin, reg->dmax); | |
#endif | |
return 1; /* success */ | |
} | |
return 0; /* fail */ | |
} | |
#define BM_BACKWARD_SEARCH_LENGTH_THRESHOLD 100 | |
static int | |
backward_search_range(regex_t* reg, const UChar* str, const UChar* end, | |
UChar* s, const UChar* range, UChar* adjrange, | |
UChar** low, UChar** high) | |
{ | |
UChar *p; | |
range += reg->dmin; | |
p = s; | |
retry: | |
switch (reg->optimize) { | |
case ONIG_OPTIMIZE_EXACT: | |
exact_method: | |
p = slow_search_backward(reg->enc, reg->exact, reg->exact_end, | |
range, adjrange, end, p); | |
break; | |
case ONIG_OPTIMIZE_EXACT_IC: | |
case ONIG_OPTIMIZE_EXACT_BM_IC: | |
case ONIG_OPTIMIZE_EXACT_BM_NOT_REV_IC: | |
p = slow_search_backward_ic(reg->enc, reg->case_fold_flag, | |
reg->exact, reg->exact_end, | |
range, adjrange, end, p); | |
break; | |
case ONIG_OPTIMIZE_EXACT_BM: | |
case ONIG_OPTIMIZE_EXACT_BM_NOT_REV: | |
#ifdef USE_INT_MAP_BACKWARD | |
if (IS_NULL(reg->int_map_backward)) { | |
int r; | |
if (s - range < BM_BACKWARD_SEARCH_LENGTH_THRESHOLD) | |
goto exact_method; | |
r = set_bm_backward_skip(reg->exact, reg->exact_end, reg->enc, | |
&(reg->int_map_backward)); | |
if (r) return r; | |
} | |
p = bm_search_backward(reg, reg->exact, reg->exact_end, range, adjrange, | |
end, p); | |
#else | |
goto exact_method; | |
#endif | |
break; | |
case ONIG_OPTIMIZE_MAP: | |
p = map_search_backward(reg->enc, reg->map, range, adjrange, p, end); | |
break; | |
} | |
if (p) { | |
if (reg->sub_anchor) { | |
UChar* prev; | |
switch (reg->sub_anchor) { | |
case ANCHOR_BEGIN_LINE: | |
if (!ON_STR_BEGIN(p)) { | |
prev = onigenc_get_prev_char_head(reg->enc, str, p, end); | |
if (!ONIGENC_IS_MBC_NEWLINE_EX(reg->enc, prev, str, end, reg->options, 0)) { | |
p = prev; | |
goto retry; | |
} | |
} | |
break; | |
case ANCHOR_END_LINE: | |
if (ON_STR_END(p)) { | |
#ifndef USE_NEWLINE_AT_END_OF_STRING_HAS_EMPTY_LINE | |
prev = onigenc_get_prev_char_head(reg->enc, adjrange, p); | |
if (IS_NULL(prev)) goto fail; | |
if (ONIGENC_IS_MBC_NEWLINE_EX(reg->enc, prev, str, end, reg->options, 1)) { | |
p = prev; | |
goto retry; | |
} | |
#endif | |
} | |
else if (! ONIGENC_IS_MBC_NEWLINE_EX(reg->enc, p, str, end, reg->options, 1)) { | |
p = onigenc_get_prev_char_head(reg->enc, adjrange, p, end); | |
if (IS_NULL(p)) goto fail; | |
goto retry; | |
} | |
break; | |
} | |
} | |
/* no needs to adjust *high, *high is used as range check only */ | |
if (reg->dmax != ONIG_INFINITE_DISTANCE) { | |
*low = p - reg->dmax; | |
*high = p - reg->dmin; | |
*high = onigenc_get_right_adjust_char_head(reg->enc, adjrange, *high, end); | |
} | |
#ifdef ONIG_DEBUG_SEARCH | |
fprintf(stderr, "backward_search_range: low: %d, high: %d\n", | |
(int )(*low - str), (int )(*high - str)); | |
#endif | |
return 1; /* success */ | |
} | |
fail: | |
#ifdef ONIG_DEBUG_SEARCH | |
fprintf(stderr, "backward_search_range: fail.\n"); | |
#endif | |
return 0; /* fail */ | |
} | |
extern OnigPosition | |
onig_search(regex_t* reg, const UChar* str, const UChar* end, | |
const UChar* start, const UChar* range, OnigRegion* region, OnigOptionType option) | |
{ | |
return onig_search_gpos(reg, str, end, start, start, range, region, option); | |
} | |
/*
 * Search str..end for a match of reg, attempting match_at() at successive
 * positions that begin at `start` and are bounded by `range`.  The scan runs
 * forward when range > start and backward otherwise.  `global_pos` is handed
 * to MATCH_ARG_INIT and, for ANCHOR_BEGIN_POSITION patterns, is used to
 * narrow `range`.
 *
 * Returns the match offset (s - str) on success, ONIG_MISMATCH when nothing
 * matches, the non-zero status of onig_region_resize_clear() if preparing
 * the region fails, or the negative result of match_at() on error.
 */
extern OnigPosition | |
onig_search_gpos(regex_t* reg, const UChar* str, const UChar* end, | |
const UChar* global_pos, | |
const UChar* start, const UChar* range, OnigRegion* region, OnigOptionType option) | |
{ | |
ptrdiff_t r; | |
UChar *s, *prev; | |
OnigMatchArg msa; | |
#ifdef USE_MATCH_RANGE_MUST_BE_INSIDE_OF_SPECIFIED_RANGE | |
/* Caller-supplied bounds, kept because start/range may be narrowed below;
   they are passed to match_at() as the match's right bound. */
const UChar *orig_start = start; | |
const UChar *orig_range = range; | |
#endif | |
#ifdef ONIG_DEBUG_SEARCH | |
fprintf(stderr, | |
"onig_search (entry point): str: %"PRIuPTR" (%p), end: %"PRIuPTR", start: %"PRIuPTR", range: %"PRIuPTR"\n", | |
(uintptr_t )str, str, end - str, start - str, range - str); | |
#endif | |
if (region) { | |
r = onig_region_resize_clear(region, reg->num_mem + 1); | |
if (r) goto finish_no_msa; | |
} | |
/* start must lie inside [str, end]. */
if (start > end || start < str) goto mismatch_no_msa; | |
/*
 * MATCH_AND_RETURN_CHECK runs match_at() at the current position.  It uses
 * the locals r, s, prev and msa directly.  On a match it jumps to `match`
 * (in the USE_FIND_LONGEST_SEARCH_ALL_OF_RANGE variants only when
 * FIND_LONGEST is not set), on an error it jumps to `finish`, and on
 * ONIG_MISMATCH it falls through.  The argument is forwarded to match_at()
 * only when USE_MATCH_RANGE_MUST_BE_INSIDE_OF_SPECIFIED_RANGE is defined.
 */
#ifdef USE_MATCH_RANGE_MUST_BE_INSIDE_OF_SPECIFIED_RANGE | |
# ifdef USE_FIND_LONGEST_SEARCH_ALL_OF_RANGE | |
# define MATCH_AND_RETURN_CHECK(upper_range) \ | |
r = match_at(reg, str, end, (upper_range), s, prev, &msa); \ | |
if (r != ONIG_MISMATCH) {\ | |
if (r >= 0) {\ | |
if (! IS_FIND_LONGEST(reg->options)) {\ | |
goto match;\ | |
}\ | |
}\ | |
else goto finish; /* error */ \ | |
} | |
# else | |
# define MATCH_AND_RETURN_CHECK(upper_range) \ | |
r = match_at(reg, str, end, (upper_range), s, prev, &msa); \ | |
if (r != ONIG_MISMATCH) {\ | |
if (r >= 0) {\ | |
goto match;\ | |
}\ | |
else goto finish; /* error */ \ | |
} | |
# endif /* USE_FIND_LONGEST_SEARCH_ALL_OF_RANGE */ | |
#else | |
# ifdef USE_FIND_LONGEST_SEARCH_ALL_OF_RANGE | |
# define MATCH_AND_RETURN_CHECK(none) \ | |
r = match_at(reg, str, end, s, prev, &msa);\ | |
if (r != ONIG_MISMATCH) {\ | |
if (r >= 0) {\ | |
if (! IS_FIND_LONGEST(reg->options)) {\ | |
goto match;\ | |
}\ | |
}\ | |
else goto finish; /* error */ \ | |
} | |
# else | |
# define MATCH_AND_RETURN_CHECK(none) \ | |
r = match_at(reg, str, end, s, prev, &msa);\ | |
if (r != ONIG_MISMATCH) {\ | |
if (r >= 0) {\ | |
goto match;\ | |
}\ | |
else goto finish; /* error */ \ | |
} | |
# endif /* USE_FIND_LONGEST_SEARCH_ALL_OF_RANGE */ | |
#endif /* USE_MATCH_RANGE_MUST_BE_INSIDE_OF_SPECIFIED_RANGE */ | |
/* anchor optimize: resume search range */ | |
if (reg->anchor != 0 && str < end) { | |
UChar *min_semi_end, *max_semi_end; | |
if (reg->anchor & ANCHOR_BEGIN_POSITION) { | |
/* search start-position only */ | |
begin_position: | |
if (range > start) | |
{ | |
if (global_pos > start) | |
{ | |
if (global_pos < range) | |
range = global_pos + 1; | |
} | |
else | |
range = start + 1; | |
} | |
else | |
range = start; | |
} | |
else if (reg->anchor & ANCHOR_BEGIN_BUF) { | |
/* search str-position only */ | |
if (range > start) { | |
if (start != str) goto mismatch_no_msa; | |
range = str + 1; | |
} | |
else { | |
if (range <= str) { | |
start = str; | |
range = str; | |
} | |
else | |
goto mismatch_no_msa; | |
} | |
} | |
else if (reg->anchor & ANCHOR_END_BUF) { | |
min_semi_end = max_semi_end = (UChar* )end; | |
/* Clamp start/range so that candidate positions lie between anchor_dmax
   before min_semi_end and anchor_dmin before max_semi_end.  Also entered
   from the ANCHOR_SEMI_END_BUF branch below. */
end_buf: | |
if ((OnigDistance )(max_semi_end - str) < reg->anchor_dmin) | |
goto mismatch_no_msa; | |
if (range > start) { | |
if ((OnigDistance )(min_semi_end - start) > reg->anchor_dmax) { | |
start = min_semi_end - reg->anchor_dmax; | |
if (start < end) | |
start = onigenc_get_right_adjust_char_head(reg->enc, str, start, end); | |
} | |
if ((OnigDistance )(max_semi_end - (range - 1)) < reg->anchor_dmin) { | |
range = max_semi_end - reg->anchor_dmin + 1; | |
} | |
if (start > range) goto mismatch_no_msa; | |
/* If start == range, match with empty at end. | |
Backward search is used. */ | |
} | |
else { | |
if ((OnigDistance )(min_semi_end - range) > reg->anchor_dmax) { | |
range = min_semi_end - reg->anchor_dmax; | |
} | |
if ((OnigDistance )(max_semi_end - start) < reg->anchor_dmin) { | |
start = max_semi_end - reg->anchor_dmin; | |
start = ONIGENC_LEFT_ADJUST_CHAR_HEAD(reg->enc, str, start, end); | |
} | |
if (range > start) goto mismatch_no_msa; | |
} | |
} | |
else if (reg->anchor & ANCHOR_SEMI_END_BUF) { | |
/* When the last character is a newline, the earliest acceptable end
   (min_semi_end) is placed before it; with USE_CRNL_AS_LINE_TERMINATOR it
   moves one more step back when CRLF newlines are enabled and a CR NL
   pair is found there. */
UChar* pre_end = ONIGENC_STEP_BACK(reg->enc, str, end, end, 1); | |
max_semi_end = (UChar* )end; | |
if (ONIGENC_IS_MBC_NEWLINE(reg->enc, pre_end, end)) { | |
min_semi_end = pre_end; | |
#ifdef USE_CRNL_AS_LINE_TERMINATOR | |
pre_end = ONIGENC_STEP_BACK(reg->enc, str, pre_end, end, 1); | |
if (IS_NOT_NULL(pre_end) && | |
IS_NEWLINE_CRLF(reg->options) && | |
ONIGENC_IS_MBC_CRNL(reg->enc, pre_end, end)) { | |
min_semi_end = pre_end; | |
} | |
#endif | |
if (min_semi_end > str && start <= min_semi_end) { | |
goto end_buf; | |
} | |
} | |
else { | |
min_semi_end = (UChar* )end; | |
goto end_buf; | |
} | |
} | |
else if ((reg->anchor & ANCHOR_ANYCHAR_STAR_ML)) { | |
goto begin_position; | |
} | |
} | |
else if (str == end) { /* empty string */ | |
static const UChar address_for_empty_string[] = ""; | |
#ifdef ONIG_DEBUG_SEARCH | |
fprintf(stderr, "onig_search: empty string.\n"); | |
#endif | |
/* Only a pattern with threshold_len == 0 is tried against an empty
   subject; a single attempt is made at a static empty buffer. */
if (reg->threshold_len == 0) { | |
start = end = str = address_for_empty_string; | |
s = (UChar* )start; | |
prev = (UChar* )NULL; | |
MATCH_ARG_INIT(msa, option, region, start, start); | |
#ifdef USE_COMBINATION_EXPLOSION_CHECK | |
msa.state_check_buff = (void* )0; | |
msa.state_check_buff_size = 0; /* NO NEED, for valgrind */ | |
#endif | |
MATCH_AND_RETURN_CHECK(end); | |
goto mismatch; | |
} | |
goto mismatch_no_msa; | |
} | |
#ifdef ONIG_DEBUG_SEARCH | |
fprintf(stderr, "onig_search(apply anchor): end: %d, start: %d, range: %d\n", | |
(int )(end - str), (int )(start - str), (int )(range - str)); | |
#endif | |
/* From here on msa is initialised, so exits must go through the labels
   that call MATCH_ARG_FREE (mismatch / finish / match). */
MATCH_ARG_INIT(msa, option, region, start, global_pos); | |
#ifdef USE_COMBINATION_EXPLOSION_CHECK | |
{ | |
ptrdiff_t offset = (MIN(start, range) - str); | |
STATE_CHECK_BUFF_INIT(msa, end - str, offset, reg->num_comb_exp_check); | |
} | |
#endif | |
s = (UChar* )start; | |
if (range > start) { /* forward search */ | |
if (s > str) | |
prev = onigenc_get_prev_char_head(reg->enc, str, s, end); | |
else | |
prev = (UChar* )NULL; | |
if (reg->optimize != ONIG_OPTIMIZE_NONE) { | |
UChar *sch_range, *low, *high, *low_prev; | |
/* sch_range: limit for the pre-filter search, i.e. range extended by
   dmax (capped at end), or end itself when dmax is infinite. */
sch_range = (UChar* )range; | |
if (reg->dmax != 0) { | |
if (reg->dmax == ONIG_INFINITE_DISTANCE) | |
sch_range = (UChar* )end; | |
else { | |
sch_range += reg->dmax; | |
if (sch_range > end) sch_range = (UChar* )end; | |
} | |
} | |
/* Fewer bytes remain than threshold_len. */
if ((end - start) < reg->threshold_len) | |
goto mismatch; | |
if (reg->dmax != ONIG_INFINITE_DISTANCE) { | |
/* Finite dmax: each pre-filter hit yields a [low, high] window of
   candidate positions; only those are handed to match_at(). */
do { | |
if (! forward_search_range(reg, str, end, s, sch_range, | |
&low, &high, &low_prev)) goto mismatch; | |
if (s < low) { | |
s = low; | |
prev = low_prev; | |
} | |
while (s <= high) { | |
MATCH_AND_RETURN_CHECK(orig_range); | |
prev = s; | |
s += enclen(reg->enc, s, end); | |
} | |
} while (s < range); | |
goto mismatch; | |
} | |
else { /* check only. */ | |
if (! forward_search_range(reg, str, end, s, sch_range, | |
&low, &high, (UChar** )NULL)) goto mismatch; | |
if ((reg->anchor & ANCHOR_ANYCHAR_STAR) != 0) { | |
/* After a failed attempt, and unless the pattern has a look-behind or
   negative look-ahead anchor, advance until prev is a newline (or range
   is reached) before trying again. */
do { | |
MATCH_AND_RETURN_CHECK(orig_range); | |
prev = s; | |
s += enclen(reg->enc, s, end); | |
if ((reg->anchor & (ANCHOR_LOOK_BEHIND | ANCHOR_PREC_READ_NOT)) == 0) { | |
while (!ONIGENC_IS_MBC_NEWLINE_EX(reg->enc, prev, str, end, reg->options, 0) | |
&& s < range) { | |
prev = s; | |
s += enclen(reg->enc, s, end); | |
} | |
} | |
} while (s < range); | |
goto mismatch; | |
} | |
} | |
} | |
/* Plain scan: reached without optimization info, or after a successful
   "check only" pre-filter.  Try every character position below range. */
do { | |
MATCH_AND_RETURN_CHECK(orig_range); | |
prev = s; | |
s += enclen(reg->enc, s, end); | |
} while (s < range); | |
if (s == range) { /* because empty match with /$/. */ | |
MATCH_AND_RETURN_CHECK(orig_range); | |
} | |
} | |
else { /* backward search */ | |
if (reg->optimize != ONIG_OPTIMIZE_NONE) { | |
UChar *low, *high, *adjrange, *sch_start; | |
/* adjrange: range left-adjusted to a character head (or end). */
if (range < end) | |
adjrange = ONIGENC_LEFT_ADJUST_CHAR_HEAD(reg->enc, str, range, end); | |
else | |
adjrange = (UChar* )end; | |
if (reg->dmax != ONIG_INFINITE_DISTANCE && | |
(end - range) >= reg->threshold_len) { | |
/* Finite dmax: walk each [low, high] window from high down to low. */
do { | |
sch_start = s + reg->dmax; | |
if (sch_start > end) sch_start = (UChar* )end; | |
if (backward_search_range(reg, str, end, sch_start, range, adjrange, | |
&low, &high) <= 0) | |
goto mismatch; | |
if (s > high) | |
s = high; | |
while (s >= low) { | |
prev = onigenc_get_prev_char_head(reg->enc, str, s, end); | |
MATCH_AND_RETURN_CHECK(orig_start); | |
s = prev; | |
} | |
} while (s >= range); | |
goto mismatch; | |
} | |
else { /* check only. */ | |
if ((end - range) < reg->threshold_len) goto mismatch; | |
sch_start = s; | |
if (reg->dmax != 0) { | |
if (reg->dmax == ONIG_INFINITE_DISTANCE) | |
sch_start = (UChar* )end; | |
else { | |
sch_start += reg->dmax; | |
if (sch_start > end) sch_start = (UChar* )end; | |
else | |
sch_start = ONIGENC_LEFT_ADJUST_CHAR_HEAD(reg->enc, | |
start, sch_start, end); | |
} | |
} | |
if (backward_search_range(reg, str, end, sch_start, range, adjrange, | |
&low, &high) <= 0) goto mismatch; | |
} | |
} | |
/* Plain backward scan: try every character position from s down to
   range. */
do { | |
prev = onigenc_get_prev_char_head(reg->enc, str, s, end); | |
MATCH_AND_RETURN_CHECK(orig_start); | |
s = prev; | |
} while (s >= range); | |
} | |
mismatch: | |
#ifdef USE_FIND_LONGEST_SEARCH_ALL_OF_RANGE | |
/* With FIND_LONGEST, successful attempts did not jump to `match`;
   report the best one recorded in msa, if any. */
if (IS_FIND_LONGEST(reg->options)) { | |
if (msa.best_len >= 0) { | |
s = msa.best_s; | |
goto match; | |
} | |
} | |
#endif | |
r = ONIG_MISMATCH; | |
finish: | |
MATCH_ARG_FREE(msa); | |
/* If result is mismatch and no FIND_NOT_EMPTY option, | |
then the region is not set in match_at(). */ | |
if (IS_FIND_NOT_EMPTY(reg->options) && region) { | |
onig_region_clear(region); | |
} | |
#ifdef ONIG_DEBUG | |
if (r != ONIG_MISMATCH) | |
fprintf(stderr, "onig_search: error %"PRIdPTRDIFF"\n", r); | |
#endif | |
return r; | |
/* Exits taken before msa was initialised: nothing to free. */
mismatch_no_msa: | |
r = ONIG_MISMATCH; | |
finish_no_msa: | |
#ifdef ONIG_DEBUG | |
if (r != ONIG_MISMATCH) | |
fprintf(stderr, "onig_search: error %"PRIdPTRDIFF"\n", r); | |
#endif | |
return r; | |
match: | |
MATCH_ARG_FREE(msa); | |
return s - str; | |
} | |
extern OnigPosition | |
onig_scan(regex_t* reg, const UChar* str, const UChar* end, | |
OnigRegion* region, OnigOptionType option, | |
int (*scan_callback)(OnigPosition, OnigPosition, OnigRegion*, void*), | |
void* callback_arg) | |
{ | |
OnigPosition r; | |
OnigPosition n; | |
int rs; | |
const UChar* start; | |
n = 0; | |
start = str; | |
while (1) { | |
r = onig_search(reg, str, end, start, end, region, option); | |
if (r >= 0) { | |
rs = scan_callback(n, r, region, callback_arg); | |
n++; | |
if (rs != 0) | |
return rs; | |
if (region->end[0] == start - str) { | |
if (start >= end) break; | |
start += enclen(reg->enc, start, end); | |
} | |
else | |
start = str + region->end[0]; | |
if (start > end) | |
break; | |
} | |
else if (r == ONIG_MISMATCH) { | |
break; | |
} | |
else { /* error */ | |
return r; | |
} | |
} | |
return n; | |
} | |
extern OnigEncoding | |
onig_get_encoding(const regex_t* reg) | |
{ | |
return reg->enc; | |
} | |
extern OnigOptionType | |
onig_get_options(const regex_t* reg) | |
{ | |
return reg->options; | |
} | |
extern OnigCaseFoldType | |
onig_get_case_fold_flag(const regex_t* reg) | |
{ | |
return reg->case_fold_flag; | |
} | |
extern const OnigSyntaxType* | |
onig_get_syntax(const regex_t* reg) | |
{ | |
return reg->syntax; | |
} | |
extern int | |
onig_number_of_captures(const regex_t* reg) | |
{ | |
return reg->num_mem; | |
} | |
extern int | |
onig_number_of_capture_histories(const regex_t* reg) | |
{ | |
#ifdef USE_CAPTURE_HISTORY | |
int i, n; | |
n = 0; | |
for (i = 0; i <= ONIG_MAX_CAPTURE_HISTORY_GROUP; i++) { | |
if (BIT_STATUS_AT(reg->capture_history, i) != 0) | |
n++; | |
} | |
return n; | |
#else | |
return 0; | |
#endif | |
} | |
extern void | |
onig_copy_encoding(OnigEncodingType *to, OnigEncoding from) | |
{ | |
*to = *from; | |
} |