|
Packit |
b89d10 |
/*
|
|
Packit |
b89d10 |
* count.c
|
|
Packit |
b89d10 |
*/
|
|
Packit |
b89d10 |
#include <stdlib.h>
|
|
Packit |
b89d10 |
#include <stdio.h>
|
|
Packit |
b89d10 |
#include <string.h>
|
|
Packit |
b89d10 |
#include "oniguruma.h"
|
|
Packit |
b89d10 |
|
|
Packit |
b89d10 |
#define ulen(enc, p) onigenc_str_bytelen_null(enc, (UChar* )p)
|
|
Packit |
b89d10 |
|
|
Packit |
b89d10 |
static int
|
|
Packit |
b89d10 |
test(OnigEncoding enc, OnigMatchParam* mp, char* in_pattern, char* in_str)
|
|
Packit |
b89d10 |
{
|
|
Packit |
b89d10 |
int r;
|
|
Packit |
b89d10 |
unsigned char *start, *range, *end;
|
|
Packit |
b89d10 |
regex_t* reg;
|
|
Packit |
b89d10 |
OnigErrorInfo einfo;
|
|
Packit |
b89d10 |
OnigRegion *region;
|
|
Packit |
b89d10 |
UChar* pattern;
|
|
Packit |
b89d10 |
UChar* str;
|
|
Packit |
b89d10 |
|
|
Packit |
b89d10 |
pattern = (UChar* )in_pattern;
|
|
Packit |
b89d10 |
str = (UChar* )in_str;
|
|
Packit |
b89d10 |
|
|
Packit |
b89d10 |
r = onig_new(®, pattern, pattern + ulen(enc, pattern),
|
|
Packit |
b89d10 |
ONIG_OPTION_DEFAULT, enc, ONIG_SYNTAX_DEFAULT, &einfo);
|
|
Packit |
b89d10 |
if (r != ONIG_NORMAL) {
|
|
Packit |
b89d10 |
char s[ONIG_MAX_ERROR_MESSAGE_LEN];
|
|
Packit |
b89d10 |
onig_error_code_to_str((UChar* )s, r, &einfo);
|
|
Packit |
b89d10 |
fprintf(stderr, "COMPILE ERROR: %d: %s\n", r, s);
|
|
Packit |
b89d10 |
return -1;
|
|
Packit |
b89d10 |
}
|
|
Packit |
b89d10 |
|
|
Packit |
b89d10 |
region = onig_region_new();
|
|
Packit |
b89d10 |
|
|
Packit |
b89d10 |
end = str + ulen(enc, str);
|
|
Packit |
b89d10 |
start = str;
|
|
Packit |
b89d10 |
range = end;
|
|
Packit |
b89d10 |
r = onig_search_with_param(reg, str, end, start, range, region,
|
|
Packit |
b89d10 |
ONIG_OPTION_NONE, mp);
|
|
Packit |
b89d10 |
if (r >= 0) {
|
|
Packit |
b89d10 |
int slot;
|
|
Packit |
b89d10 |
OnigValue val;
|
|
Packit |
b89d10 |
char* tag;
|
|
Packit |
b89d10 |
int tag_len;
|
|
Packit |
b89d10 |
|
|
Packit |
b89d10 |
fprintf(stdout, "match at %d\n", r);
|
|
Packit |
b89d10 |
|
|
Packit |
b89d10 |
show_count:
|
|
Packit |
b89d10 |
if (enc == ONIG_ENCODING_UTF16_BE) {
|
|
Packit |
b89d10 |
tag = "\000x\000\000";
|
|
Packit |
b89d10 |
}
|
|
Packit |
b89d10 |
else if (enc == ONIG_ENCODING_UTF16_LE) {
|
|
Packit |
b89d10 |
tag = "x\000\000\000";
|
|
Packit |
b89d10 |
}
|
|
Packit |
b89d10 |
else {
|
|
Packit |
b89d10 |
tag = "x";
|
|
Packit |
b89d10 |
}
|
|
Packit |
b89d10 |
tag_len = ulen(enc, tag);
|
|
Packit |
b89d10 |
|
|
Packit |
b89d10 |
slot = 0;
|
|
Packit |
b89d10 |
r = onig_get_callout_data_by_tag(reg, mp, (UChar* )tag, (UChar* )tag + tag_len,
|
|
Packit |
b89d10 |
slot, 0, &val;;
|
|
Packit |
b89d10 |
if (r < ONIG_NORMAL) goto err;
|
|
Packit |
b89d10 |
else if (r > ONIG_NORMAL) {
|
|
Packit |
b89d10 |
fprintf(stdout, "COUNT[x]: NO DATA\n");
|
|
Packit |
b89d10 |
}
|
|
Packit |
b89d10 |
else {
|
|
Packit |
b89d10 |
fprintf(stdout, "COUNT[x]: %ld\n", val.l);
|
|
Packit |
b89d10 |
}
|
|
Packit |
b89d10 |
}
|
|
Packit |
b89d10 |
else if (r == ONIG_MISMATCH) {
|
|
Packit |
b89d10 |
fprintf(stdout, "search fail\n");
|
|
Packit |
b89d10 |
goto show_count;
|
|
Packit |
b89d10 |
}
|
|
Packit |
b89d10 |
else { /* error */
|
|
Packit |
b89d10 |
char s[ONIG_MAX_ERROR_MESSAGE_LEN];
|
|
Packit |
b89d10 |
err:
|
|
Packit |
b89d10 |
onig_error_code_to_str((UChar* )s, r);
|
|
Packit |
b89d10 |
fprintf(stdout, "SEARCH ERROR: %d: %s\n", r, s);
|
|
Packit |
b89d10 |
}
|
|
Packit |
b89d10 |
|
|
Packit |
b89d10 |
onig_region_free(region, 1 /* 1:free self, 0:free contents only */);
|
|
Packit |
b89d10 |
onig_free(reg);
|
|
Packit |
b89d10 |
return r;
|
|
Packit |
b89d10 |
}
|
|
Packit |
b89d10 |
|
|
Packit |
b89d10 |
extern int main(int argc, char* argv[])
|
|
Packit |
b89d10 |
{
|
|
Packit |
b89d10 |
int r;
|
|
Packit |
b89d10 |
OnigMatchParam* mp;
|
|
Packit |
b89d10 |
OnigEncoding encs[3];
|
|
Packit |
b89d10 |
|
|
Packit |
b89d10 |
encs[0] = ONIG_ENCODING_UTF8;
|
|
Packit |
b89d10 |
encs[1] = ONIG_ENCODING_UTF16_BE;
|
|
Packit |
b89d10 |
encs[2] = ONIG_ENCODING_UTF16_LE;
|
|
Packit |
b89d10 |
|
|
Packit |
b89d10 |
r = onig_initialize(encs, sizeof(encs)/sizeof(encs[0]));
|
|
Packit |
b89d10 |
if (r != ONIG_NORMAL) {
|
|
Packit |
b89d10 |
fprintf(stderr, "FAIL: onig_initialize(): %d\n", r);
|
|
Packit |
b89d10 |
return -1;
|
|
Packit |
b89d10 |
}
|
|
Packit |
b89d10 |
|
|
Packit |
b89d10 |
mp = onig_new_match_param();
|
|
Packit |
b89d10 |
|
|
Packit |
b89d10 |
test(encs[0], mp, "abc(.(*COUNT[x]))*(*FAIL)", "abcdefg");
|
|
Packit |
b89d10 |
test(encs[0], mp, "abc(.(*COUNT[_any_]))*(.(*COUNT[x]))*d", "abcdefg");
|
|
Packit |
b89d10 |
/* fail count */
|
|
Packit |
b89d10 |
test(encs[0], mp, "abc(.(*COUNT[x]{<}))*f", "abcdefg");
|
|
Packit |
b89d10 |
/* success count */
|
|
Packit |
b89d10 |
test(encs[0], mp, "abc(.(*COUNT[x]{X}))*f", "abcdefg");
|
|
Packit |
b89d10 |
/* passed count */
|
|
Packit |
b89d10 |
test(encs[0], mp, "abc(.(*COUNT[x]))*f", "abcdefg");
|
|
Packit |
b89d10 |
test(encs[0], mp, "a(.(*COUNT[x]))*z", "abcd\nabcdz");
|
|
Packit |
b89d10 |
/* total count */
|
|
Packit |
b89d10 |
test(encs[0], mp, "a(.(*TOTAL_COUNT[x]))*z", "abcd\nabcdz");
|
|
Packit |
b89d10 |
|
|
Packit |
b89d10 |
test(encs[1], mp, "\000a\000b\000c\000(\000.\000(\000*\000C\000O\000U\000N\000T\000[\000x\000]\000)\000)\000*\000(\000*\000F\000A\000I\000L\000)\000\000", "\000a\000b\000c\000d\000e\000f\000g\000\000");
|
|
Packit |
b89d10 |
|
|
Packit |
b89d10 |
test(encs[2], mp, "a\000b\000c\000(\000.\000(\000*\000C\000O\000U\000N\000T\000[\000x\000]\000)\000)\000*\000(\000*\000F\000A\000I\000L\000)\000\000\000", "a\000b\000c\000d\000e\000f\000g\000\000\000");
|
|
Packit |
b89d10 |
|
|
Packit |
b89d10 |
onig_free_match_param(mp);
|
|
Packit |
b89d10 |
onig_end();
|
|
Packit |
b89d10 |
return 0;
|
|
Packit |
b89d10 |
}
|