16# include RUBY_EXTCONF_H
19#ifdef HAVE_ONIG_REGION_MEMSIZE
25#define STRSCAN_VERSION "3.0.1"
31static VALUE StringScanner;
32static VALUE ScanError;
33static ID id_byteslice;
39#define FLAG_MATCHED (1 << 0)
58#define MATCHED_P(s) ((s)->flags & FLAG_MATCHED)
59#define MATCHED(s) (s)->flags |= FLAG_MATCHED
60#define CLEAR_MATCH_STATUS(s) (s)->flags &= ~FLAG_MATCHED
62#define S_PBEG(s) (RSTRING_PTR((s)->str))
63#define S_LEN(s) (RSTRING_LEN((s)->str))
64#define S_PEND(s) (S_PBEG(s) + S_LEN(s))
65#define CURPTR(s) (S_PBEG(s) + (s)->curr)
66#define S_RESTLEN(s) (S_LEN(s) - (s)->curr)
68#define EOS_P(s) ((s)->curr >= RSTRING_LEN(p->str))
70#define GET_SCANNER(obj,var) do {\
71 (var) = check_strscan(obj);\
72 if (NIL_P((var)->str)) rb_raise(rb_eArgError, "uninitialized StringScanner object");\
79static inline long minl
_((
const long n,
const long x));
84static void strscan_mark
_((
void *p));
85static void strscan_free
_((
void *p));
86static size_t strscan_memsize
_((
const void *p));
100 int succptr,
int getstr,
int headonly));
112static void adjust_registers_to_matched
_((
struct strscanner *p));
149minl(
const long x,
const long y)
151 return (x < y) ? x : y;
155extract_range(
struct strscanner *p,
long beg_i,
long end_i)
158 end_i = minl(end_i,
S_LEN(p));
159 return str_new(p,
S_PBEG(p) + beg_i, end_i - beg_i);
167 return str_new(p,
S_PBEG(p) + beg_i,
len);
175strscan_mark(
void *
ptr)
183strscan_free(
void *
ptr)
191strscan_memsize(
const void *
ptr)
194 size_t size =
sizeof(*p) -
sizeof(p->
regs);
195#ifdef HAVE_ONIG_REGION_MEMSIZE
203 {strscan_mark, strscan_free, strscan_memsize},
208strscan_s_allocate(
VALUE klass)
238 p = check_strscan(self);
241 if (!
NIL_P(options)) {
244 keyword_ids[0] =
rb_intern(
"fixed_anchor");
246 if (fixed_anchor ==
Qundef) {
263check_strscan(
VALUE obj)
280 self = check_strscan(vself);
281 orig = check_strscan(vorig);
305strscan_s_mustc(
VALUE self)
314strscan_reset(
VALUE self)
332strscan_terminate(
VALUE self)
347strscan_clear(
VALUE self)
349 rb_warning(
"StringScanner#clear is obsolete; use #terminate instead");
350 return strscan_terminate(self);
357strscan_get_string(
VALUE self)
423strscan_get_pos(
VALUE self)
445strscan_get_charpos(
VALUE self)
471 if (i < 0) i +=
S_LEN(p);
491set_registers(
struct strscanner *p,
size_t length)
532adjust_register_position(
struct strscanner *p,
long position)
538 return p->
prev + position;
543strscan_do_scan(
VALUE self,
VALUE pattern,
int succptr,
int getstr,
int headonly)
548 if (!RB_TYPE_P(pattern,
T_REGEXP)) {
571 if (!tmpreg)
RREGEXP(pattern)->usecnt++;
590 if (!tmpreg)
RREGEXP(pattern)->usecnt--;
592 if (
RREGEXP(pattern)->usecnt) {
601 if (ret == -2)
rb_raise(ScanError,
"regexp buffer overflow");
625 const long length = last_match_length(p);
627 return extract_beg_len(p, p->
prev, length);
654 return strscan_do_scan(self, re, 1, 1, 1);
672 return strscan_do_scan(self, re, 0, 0, 1);
696 return strscan_do_scan(self, re, 1, 0, 1);
717 return strscan_do_scan(self, re, 0, 1, 1);
733 return strscan_do_scan(self, re,
RTEST(s),
RTEST(
f), 1);
751 return strscan_do_scan(self, re, 1, 1, 0);
770 return strscan_do_scan(self, re, 0, 0, 0);
792 return strscan_do_scan(self, re, 1, 0, 0);
811 return strscan_do_scan(self, re, 0, 1, 0);
826 return strscan_do_scan(self, re,
RTEST(s),
RTEST(
f), 0);
830adjust_registers_to_matched(
struct strscanner *p)
855strscan_getch(
VALUE self)
870 adjust_registers_to_matched(p);
871 return extract_range(p,
872 adjust_register_position(p, p->
regs.
beg[0]),
873 adjust_register_position(p, p->
regs.
end[0]));
892strscan_get_byte(
VALUE self)
904 adjust_registers_to_matched(p);
905 return extract_range(p,
906 adjust_register_position(p, p->
regs.
beg[0]),
907 adjust_register_position(p, p->
regs.
end[0]));
915strscan_getbyte(
VALUE self)
917 rb_warning(
"StringScanner#getbyte is obsolete; use #get_byte instead");
918 return strscan_get_byte(self);
942 return str_new(p,
"", 0);
945 return extract_beg_len(p, p->
curr,
len);
955 rb_warning(
"StringScanner#peep is obsolete; use #peek instead");
956 return strscan_peek(self, vlen);
971strscan_unscan(
VALUE self)
977 rb_raise(ScanError,
"unscan failed: previous match record not exist");
996strscan_bol_p(
VALUE self)
1017strscan_eos_p(
VALUE self)
1030strscan_empty_p(
VALUE self)
1032 rb_warning(
"StringScanner#empty? is obsolete; use #eos? instead");
1033 return strscan_eos_p(self);
1045strscan_rest_p(
VALUE self)
1063strscan_matched_p(
VALUE self)
1079strscan_matched(
VALUE self)
1085 return extract_range(p,
1086 adjust_register_position(p, p->
regs.
beg[0]),
1087 adjust_register_position(p, p->
regs.
end[0]));
1102strscan_matched_size(
VALUE self)
1117 (
const unsigned char* )
name, (
const unsigned char* )name_end,
regs);
1165 switch (
TYPE(idx)) {
1180 if (i < 0)
return Qnil;
1184 return extract_range(p,
1185 adjust_register_position(p, p->
regs.
beg[i]),
1186 adjust_register_position(p, p->
regs.
end[i]));
1200strscan_size(
VALUE self)
1222strscan_captures(
VALUE self)
1234 for (i = 1; i < num_regs; i++) {
1236 adjust_register_position(p, p->
regs.
beg[i]),
1237 adjust_register_position(p, p->
regs.
end[i]));
1269 for (i = 0; i<
argc; i++) {
1286strscan_pre_match(
VALUE self)
1292 return extract_range(p,
1294 adjust_register_position(p, p->
regs.
beg[0]));
1307strscan_post_match(
VALUE self)
1313 return extract_range(p,
1314 adjust_register_position(p, p->
regs.
end[0]),
1323strscan_rest(
VALUE self)
1329 return str_new(p,
"", 0);
1331 return extract_range(p, p->
curr,
S_LEN(p));
1338strscan_rest_size(
VALUE self)
1356strscan_restsize(
VALUE self)
1358 rb_warning(
"StringScanner#restsize is obsolete; use #rest_size instead");
1359 return strscan_rest_size(self);
1362#define INSPECT_LENGTH 5
1376strscan_inspect(
VALUE self)
1381 p = check_strscan(self);
1454strscan_fixed_anchor_p(
VALUE self)
1457 p = check_strscan(self);
1571#ifdef HAVE_RB_EXT_RACTOR_SAFE
1652 rb_define_method(StringScanner,
"fixed_anchor?", strscan_fixed_anchor_p, 0);
VALUE rb_ary_push(VALUE ary, VALUE item)
#define rb_define_method(klass, mid, func, arity)
Defines klass#mid.
#define rb_define_singleton_method(klass, mid, func, arity)
Defines klass.mid.
#define rb_define_private_method(klass, mid, func, arity)
Defines klass#mid and makes it private.
rb_encoding * rb_enc_get(VALUE obj)
void rb_enc_copy(VALUE obj1, VALUE obj2)
rb_encoding * rb_enc_check(VALUE str1, VALUE str2)
int rb_enc_mbclen(const char *p, const char *e, rb_encoding *enc)
char str[HTML_ESCAPE_MAX_LEN+1]
#define RSTRING_LEN(string)
#define RSTRING_PTR(string)
void ruby_xfree(void *x)
Deallocates a storage instance.
void rb_gc_mark(VALUE ptr)
VALUE rb_define_class(const char *name, VALUE super)
Defines a top-level class.
VALUE rb_define_class_under(VALUE outer, const char *name, VALUE super)
Defines a class under the namespace of outer.
int rb_scan_args(int argc, const VALUE *argv, const char *fmt,...)
int rb_get_kwargs(VALUE keyword_hash, const ID *table, int required, int optional, VALUE *values)
void rb_raise(VALUE exc, const char *fmt,...)
void * rb_check_typeddata(VALUE obj, const rb_data_type_t *data_type)
void rb_warning(const char *fmt,...)
VALUE rb_cObject
Object class.
VALUE rb_obj_class(VALUE)
VALUE rb_obj_freeze(VALUE)
Make the object unmodifiable.
VALUE rb_check_hash_type(VALUE hash)
long rb_enc_strlen(const char *, const char *, rb_encoding *)
void rb_ext_ractor_safe(bool flag)
#define rb_str_new(str, len)
VALUE rb_str_cat(VALUE, const char *, long)
VALUE rb_str_append(VALUE, VALUE)
#define rb_str_new_cstr(str)
void rb_const_set(VALUE, ID, VALUE)
int rb_const_defined(VALUE, ID)
void rb_define_alloc_func(VALUE, rb_alloc_func_t)
void rb_alias(VALUE, ID, ID)
ID rb_intern(const char *)
int rb_reg_region_copy(struct re_registers *, const struct re_registers *)
regex_t * rb_reg_prepare_re(VALUE re, VALUE str)
int memcmp(const void *s1, const void *s2, size_t len)
ONIG_EXTERN int onig_region_set(OnigRegion *region, int at, int beg, int end)
ONIG_EXTERN void onig_region_init(OnigRegion *region)
ONIG_EXTERN void onig_region_free(OnigRegion *region, int free_self)
ONIG_EXTERN OnigPosition onig_search(OnigRegex, const OnigUChar *str, const OnigUChar *end, const OnigUChar *start, const OnigUChar *range, OnigRegion *region, OnigOptionType option)
ONIG_EXTERN void onig_free(OnigRegex)
ONIG_EXTERN OnigPosition onig_match(OnigRegex, const OnigUChar *str, const OnigUChar *end, const OnigUChar *at, OnigRegion *region, OnigOptionType option)
ONIG_EXTERN void onig_region_clear(OnigRegion *region)
ONIG_EXTERN int onig_name_to_backref_number(OnigRegex reg, const OnigUChar *name, const OnigUChar *name_end, const OnigRegion *region)
size_t onig_region_memsize(const OnigRegion *regs)
#define RSTRING_GETMEM(str, ptrvar, lenvar)
@ RUBY_TYPED_FREE_IMMEDIATELY
#define TypedData_Make_Struct(klass, type, data_type, sval)
VALUE rb_sprintf(const char *,...)
#define CLEAR_MATCH_STATUS(s)
#define GET_SCANNER(obj, var)