12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858 |
- #include "libbb.h"
- #include "common_bufsiz.h"
- #include "xregex.h"
/*
 * Option string handed to getopt32() by grep_main().
 *
 * The option letters are listed in the same order as the OPTBIT_*
 * enumerators, so each letter's position corresponds to its bit index
 * (presumably this is how getopt32 assigns bits -- confirm in libbb).
 * The context options (-A/-B/-C) and -z are only compiled in when the
 * corresponding build feature is enabled.
 */
#define OPTSTR_GREP \
	"lnqvscFiHhe:*f:*Lorm:+wx" \
	IF_FEATURE_GREP_CONTEXT("A:+B:+C:+") \
	"E" \
	IF_EXTRA_COMPAT("z") \
	"aI"
- enum {
- OPTBIT_l,
- OPTBIT_n,
- OPTBIT_q,
- OPTBIT_v,
- OPTBIT_s,
- OPTBIT_c,
- OPTBIT_F,
- OPTBIT_i,
- OPTBIT_H,
- OPTBIT_h,
- OPTBIT_e,
- OPTBIT_f,
- OPTBIT_L,
- OPTBIT_o,
- OPTBIT_r,
- OPTBIT_m,
- OPTBIT_w,
- OPTBIT_x,
- IF_FEATURE_GREP_CONTEXT( OPTBIT_A ,)
- IF_FEATURE_GREP_CONTEXT( OPTBIT_B ,)
- IF_FEATURE_GREP_CONTEXT( OPTBIT_C ,)
- OPTBIT_E,
- IF_EXTRA_COMPAT( OPTBIT_z ,)
- OPT_l = 1 << OPTBIT_l,
- OPT_n = 1 << OPTBIT_n,
- OPT_q = 1 << OPTBIT_q,
- OPT_v = 1 << OPTBIT_v,
- OPT_s = 1 << OPTBIT_s,
- OPT_c = 1 << OPTBIT_c,
- OPT_F = 1 << OPTBIT_F,
- OPT_i = 1 << OPTBIT_i,
- OPT_H = 1 << OPTBIT_H,
- OPT_h = 1 << OPTBIT_h,
- OPT_e = 1 << OPTBIT_e,
- OPT_f = 1 << OPTBIT_f,
- OPT_L = 1 << OPTBIT_L,
- OPT_o = 1 << OPTBIT_o,
- OPT_r = 1 << OPTBIT_r,
- OPT_m = 1 << OPTBIT_m,
- OPT_w = 1 << OPTBIT_w,
- OPT_x = 1 << OPTBIT_x,
- OPT_A = IF_FEATURE_GREP_CONTEXT( (1 << OPTBIT_A)) + 0,
- OPT_B = IF_FEATURE_GREP_CONTEXT( (1 << OPTBIT_B)) + 0,
- OPT_C = IF_FEATURE_GREP_CONTEXT( (1 << OPTBIT_C)) + 0,
- OPT_E = 1 << OPTBIT_E,
- OPT_z = IF_EXTRA_COMPAT( (1 << OPTBIT_z)) + 0,
- };
/*
 * Readable names for individual option tests.  Each expands to a
 * non-zero value when the corresponding option bit is set in
 * option_mask32.  NUL_DELIMITED is always 0 when OPT_z is compiled out.
 */
#define PRINT_FILES_WITH_MATCHES    (option_mask32 & OPT_l)
#define PRINT_LINE_NUM              (option_mask32 & OPT_n)
#define BE_QUIET                    (option_mask32 & OPT_q)
#define SUPPRESS_ERR_MSGS           (option_mask32 & OPT_s)
#define PRINT_MATCH_COUNTS          (option_mask32 & OPT_c)
#define FGREP_FLAG                  (option_mask32 & OPT_F)
#define PRINT_FILES_WITHOUT_MATCHES (option_mask32 & OPT_L)
#define NUL_DELIMITED               (option_mask32 & OPT_z)
- struct globals {
- int max_matches;
- #if !ENABLE_EXTRA_COMPAT
- int reflags;
- #else
- RE_TRANSLATE_TYPE case_fold;
- #endif
- smalluint invert_search;
- smalluint print_filename;
- smalluint open_errors;
- #if ENABLE_FEATURE_GREP_CONTEXT
- smalluint did_print_line;
- int lines_before;
- int lines_after;
- char **before_buf;
- IF_EXTRA_COMPAT(size_t *before_buf_size;)
- int last_line_printed;
- #endif
-
- llist_t *pattern_head;
- const char *cur_file;
- } FIX_ALIASING;
/* The globals live in the shared scratch buffer. */
#define G (*(struct globals*)bb_common_bufsiz1)
/* Prepare the buffer and verify at build time that the globals fit in it. */
#define INIT_G() do { \
	setup_common_bufsiz(); \
	BUILD_BUG_ON(sizeof(G) > COMMON_BUFSIZE); \
} while (0)

/* Accessor macros: let the code use plain names for members of G. */
#define max_matches       (G.max_matches         )
#if !ENABLE_EXTRA_COMPAT
# define reflags          (G.reflags             )
#else
# define case_fold        (G.case_fold           )
/*
 * EXTRA_COMPAT builds use the GNU regex interface: "reflags" aliases
 * re_syntax_options, and REG_EXTENDED is remapped to a GNU syntax mask.
 * REG_NOSUB and REG_ICASE are redefined to a token sequence that cannot
 * compile, so any accidental use in this configuration is a build error.
 */
# define reflags           re_syntax_options
# undef REG_NOSUB
# undef REG_EXTENDED
# undef REG_ICASE
# define REG_NOSUB    bug:is:here
# define REG_EXTENDED (RE_SYNTAX_EGREP | RE_INTERVALS | RE_NO_BK_BRACES)
# define REG_ICASE    bug:is:here
#endif
#define invert_search     (G.invert_search       )
#define print_filename    (G.print_filename      )
#define open_errors       (G.open_errors         )
#define did_print_line    (G.did_print_line      )
#define lines_before      (G.lines_before        )
#define lines_after       (G.lines_after         )
#define before_buf        (G.before_buf          )
#define before_buf_size   (G.before_buf_size     )
#define last_line_printed (G.last_line_printed   )
#define pattern_head      (G.pattern_head        )
#define cur_file          (G.cur_file            )
/*
 * One search pattern.  Instances are stored as the data pointer of the
 * pattern_head list nodes.
 */
typedef struct grep_list_data_t {
	char *pattern;                          /* pattern text as given by the user */
#if !ENABLE_EXTRA_COMPAT
	/* POSIX regex interface */
	regex_t compiled_regex;                 /* compiled on first use in grep_file() */
	regmatch_t matched_range;               /* offsets of the most recent match */
#else
	/* GNU regex interface */
	struct re_pattern_buffer compiled_regex;
	struct re_registers matched_range;
#endif
/* Bits of flg_mem_allocated_compiled: */
#define ALLOCATED 1                             /* pattern was malloc'ed and must be freed */
#define COMPILED  2                             /* compiled_regex holds a compiled pattern */
	int flg_mem_allocated_compiled;
} grep_list_data_t;
- #if !ENABLE_EXTRA_COMPAT
- #define print_line(line, line_len, linenum, decoration) \
- print_line(line, linenum, decoration)
- #endif
- static void print_line(const char *line, size_t line_len, int linenum, char decoration)
- {
- #if ENABLE_FEATURE_GREP_CONTEXT
-
- if (linenum < 1)
- return;
-
- if ((lines_before || lines_after) && did_print_line
- && last_line_printed != linenum - 1
- ) {
- puts("--");
- }
-
- did_print_line = 1;
- last_line_printed = linenum;
- #endif
- if (print_filename)
- printf("%s%c", cur_file, decoration);
- if (PRINT_LINE_NUM)
- printf("%i%c", linenum, decoration);
-
- if ((option_mask32 & (OPT_v|OPT_o)) != (OPT_v|OPT_o)) {
- #if !ENABLE_EXTRA_COMPAT
- puts(line);
- #else
- fwrite(line, 1, line_len, stdout);
- putchar(NUL_DELIMITED ? '\0' : '\n');
- #endif
- }
- }
#if ENABLE_EXTRA_COMPAT
/*
 * Read one record from file using getdelim().  Records end with '\n',
 * or with NUL when -z is in effect.
 *
 * On success the trailing delimiter, if present, is replaced by NUL and
 * the record length (without the delimiter) is returned; *line_ptr and
 * *line_alloc_len are managed as by getdelim().
 * When getdelim() yields nothing (result <= 0) the buffer is freed and
 * that result is returned unchanged; *line_ptr is left as it was, so the
 * caller must not use it afterwards.
 */
static ssize_t FAST_FUNC bb_getline(char **line_ptr, size_t *line_alloc_len, FILE *file)
{
	const int terminator = (NUL_DELIMITED ? '\0' : '\n');
	ssize_t nread = getdelim(line_ptr, line_alloc_len, terminator, file);
	char *buf = *line_ptr;

	if (nread <= 0) {
		/* EOF or error: release the buffer on behalf of the caller */
		free(buf);
		return nread;
	}

	/* Chop the delimiter (the last record of a file may lack one) */
	if (buf[nread - 1] == terminator) {
		nread--;
		buf[nread] = '\0';
	}
	return nread;
}
#endif
- static int grep_file(FILE *file)
- {
- smalluint found;
- int linenum = 0;
- int nmatches = 0;
- #if !ENABLE_EXTRA_COMPAT
- char *line;
- #else
- char *line = NULL;
- ssize_t line_len;
- size_t line_alloc_len;
- # define rm_so start[0]
- # define rm_eo end[0]
- #endif
- #if ENABLE_FEATURE_GREP_CONTEXT
- int print_n_lines_after = 0;
- int curpos = 0;
- int idx = 0;
- #else
- enum { print_n_lines_after = 0 };
- #endif
- while (
- #if !ENABLE_EXTRA_COMPAT
- (line = xmalloc_fgetline(file)) != NULL
- #else
- (line_len = bb_getline(&line, &line_alloc_len, file)) >= 0
- #endif
- ) {
- llist_t *pattern_ptr = pattern_head;
- grep_list_data_t *gl = gl;
- linenum++;
- found = 0;
- while (pattern_ptr) {
- gl = (grep_list_data_t *)pattern_ptr->data;
- if (FGREP_FLAG) {
- char *match;
- char *str = line;
- opt_f_again:
- match = ((option_mask32 & OPT_i)
- ? strcasestr(str, gl->pattern)
- : strstr(str, gl->pattern)
- );
- if (match) {
- if (option_mask32 & OPT_x) {
- if (match != str)
- goto opt_f_not_found;
- if (str[strlen(gl->pattern)] != '\0')
- goto opt_f_not_found;
- } else
- if (option_mask32 & OPT_w) {
- char c = (match != str) ? match[-1] : ' ';
- if (!isalnum(c) && c != '_') {
- c = match[strlen(gl->pattern)];
- if (!c || (!isalnum(c) && c != '_'))
- goto opt_f_found;
- }
- str = match + 1;
- goto opt_f_again;
- }
- opt_f_found:
- found = 1;
- opt_f_not_found: ;
- }
- } else {
- #if ENABLE_EXTRA_COMPAT
- unsigned start_pos;
- #else
- int match_flg;
- #endif
- char *match_at;
- if (!(gl->flg_mem_allocated_compiled & COMPILED)) {
- gl->flg_mem_allocated_compiled |= COMPILED;
- #if !ENABLE_EXTRA_COMPAT
- xregcomp(&gl->compiled_regex, gl->pattern, reflags);
- #else
- memset(&gl->compiled_regex, 0, sizeof(gl->compiled_regex));
- gl->compiled_regex.translate = case_fold;
- if (re_compile_pattern(gl->pattern, strlen(gl->pattern), &gl->compiled_regex))
- bb_error_msg_and_die("bad regex '%s'", gl->pattern);
- #endif
- }
- #if !ENABLE_EXTRA_COMPAT
- gl->matched_range.rm_so = 0;
- gl->matched_range.rm_eo = 0;
- match_flg = 0;
- #else
- start_pos = 0;
- #endif
- match_at = line;
- opt_w_again:
- if (
- #if !ENABLE_EXTRA_COMPAT
- regexec(&gl->compiled_regex, match_at, 1, &gl->matched_range, match_flg) == 0
- #else
- re_search(&gl->compiled_regex, match_at, line_len,
- start_pos, line_len,
- &gl->matched_range) >= 0
- #endif
- ) {
- if (option_mask32 & OPT_x) {
- found = (gl->matched_range.rm_so == 0
- && match_at[gl->matched_range.rm_eo] == '\0');
- } else
- if (!(option_mask32 & OPT_w)) {
- found = 1;
- } else {
- char c = ' ';
- if (match_at > line || gl->matched_range.rm_so != 0) {
- c = match_at[gl->matched_range.rm_so - 1];
- }
- if (!isalnum(c) && c != '_') {
- c = match_at[gl->matched_range.rm_eo];
- }
- if (!isalnum(c) && c != '_') {
- found = 1;
- } else {
-
- #if !ENABLE_EXTRA_COMPAT
- if (gl->matched_range.rm_eo != 0) {
- match_at += gl->matched_range.rm_eo;
- match_flg |= REG_NOTBOL;
- goto opt_w_again;
- }
- #else
- if (gl->matched_range.rm_eo > start_pos) {
- start_pos = gl->matched_range.rm_eo;
- goto opt_w_again;
- }
- #endif
- }
- }
- }
- }
-
- if (found && !invert_search)
- goto do_found;
- pattern_ptr = pattern_ptr->link;
- }
- if (found ^ invert_search) {
- do_found:
-
- nmatches++;
-
- if (option_mask32 & (OPT_q|OPT_l|OPT_L)) {
- free(line);
- if (BE_QUIET) {
-
- exit(EXIT_SUCCESS);
- }
-
- if (PRINT_FILES_WITH_MATCHES) {
- puts(cur_file);
-
- }
-
- return 1;
- }
- #if ENABLE_FEATURE_GREP_CONTEXT
-
- if ((option_mask32 & OPT_m) && nmatches > max_matches)
- break;
- #endif
-
- if (PRINT_MATCH_COUNTS == 0) {
- #if ENABLE_FEATURE_GREP_CONTEXT
- int prevpos = (curpos == 0) ? lines_before - 1 : curpos - 1;
-
- if (lines_before && before_buf[prevpos] != NULL) {
- int first_buf_entry_line_num = linenum - lines_before;
-
- idx = curpos;
- while (before_buf[idx] == NULL) {
- idx = (idx + 1) % lines_before;
- first_buf_entry_line_num++;
- }
-
- while (before_buf[idx] != NULL) {
- print_line(before_buf[idx], before_buf_size[idx], first_buf_entry_line_num, '-');
- free(before_buf[idx]);
- before_buf[idx] = NULL;
- idx = (idx + 1) % lines_before;
- first_buf_entry_line_num++;
- }
- }
-
- print_n_lines_after = lines_after;
- #endif
- if (option_mask32 & OPT_o) {
- if (FGREP_FLAG) {
-
- if (found)
- print_line(gl->pattern, strlen(gl->pattern), linenum, ':');
- } else while (1) {
- unsigned start = gl->matched_range.rm_so;
- unsigned end = gl->matched_range.rm_eo;
- unsigned len = end - start;
- char old = line[end];
- line[end] = '\0';
-
- if (len != 0)
- print_line(line + start, len, linenum, ':');
- if (old == '\0')
- break;
- line[end] = old;
- if (len == 0)
- end++;
- #if !ENABLE_EXTRA_COMPAT
- if (regexec(&gl->compiled_regex, line + end,
- 1, &gl->matched_range, REG_NOTBOL) != 0)
- break;
- gl->matched_range.rm_so += end;
- gl->matched_range.rm_eo += end;
- #else
- if (re_search(&gl->compiled_regex, line, line_len,
- end, line_len - end,
- &gl->matched_range) < 0)
- break;
- #endif
- }
- } else {
- print_line(line, line_len, linenum, ':');
- }
- }
- }
- #if ENABLE_FEATURE_GREP_CONTEXT
- else {
-
- if (print_n_lines_after) {
- print_line(line, strlen(line), linenum, '-');
- print_n_lines_after--;
- } else if (lines_before) {
-
- free(before_buf[curpos]);
- before_buf[curpos] = line;
- IF_EXTRA_COMPAT(before_buf_size[curpos] = line_len;)
- curpos = (curpos + 1) % lines_before;
-
- line = NULL;
- }
- }
- #endif
- #if !ENABLE_EXTRA_COMPAT
- free(line);
- #endif
-
- if ((option_mask32 & OPT_m)
- && !print_n_lines_after
- && nmatches == max_matches
- ) {
- break;
- }
- }
-
-
- if (PRINT_MATCH_COUNTS) {
- if (print_filename)
- printf("%s:", cur_file);
- printf("%d\n", nmatches);
- }
-
- if (PRINT_FILES_WITHOUT_MATCHES) {
-
- puts(cur_file);
- }
- return nmatches;
- }
- #if ENABLE_FEATURE_CLEAN_UP
- #define new_grep_list_data(p, m) add_grep_list_data(p, m)
- static char *add_grep_list_data(char *pattern, int flg_used_mem)
- #else
- #define new_grep_list_data(p, m) add_grep_list_data(p)
- static char *add_grep_list_data(char *pattern)
- #endif
- {
- grep_list_data_t *gl = xzalloc(sizeof(*gl));
- gl->pattern = pattern;
- #if ENABLE_FEATURE_CLEAN_UP
- gl->flg_mem_allocated_compiled = flg_used_mem;
- #else
-
- #endif
- return (char *)gl;
- }
- static void load_regexes_from_file(llist_t *fopt)
- {
- while (fopt) {
- char *line;
- FILE *fp;
- llist_t *cur = fopt;
- char *ffile = cur->data;
- fopt = cur->link;
- free(cur);
- fp = xfopen_stdin(ffile);
- while ((line = xmalloc_fgetline(fp)) != NULL) {
- llist_add_to(&pattern_head,
- new_grep_list_data(line, ALLOCATED));
- }
- fclose_if_not_stdin(fp);
- }
- }
- static int FAST_FUNC file_action_grep(const char *filename,
- struct stat *statbuf,
- void* matched,
- int depth UNUSED_PARAM)
- {
- FILE *file;
-
- if (S_ISLNK(statbuf->st_mode)) {
- struct stat sb;
- if (stat(filename, &sb) != 0) {
- if (!SUPPRESS_ERR_MSGS)
- bb_simple_perror_msg(filename);
- return 0;
- }
- if (S_ISDIR(sb.st_mode))
- return 1;
- }
- file = fopen_for_read(filename);
- if (file == NULL) {
- if (!SUPPRESS_ERR_MSGS)
- bb_simple_perror_msg(filename);
- open_errors = 1;
- return 0;
- }
- cur_file = filename;
- *(int*)matched += grep_file(file);
- fclose(file);
- return 1;
- }
- static int grep_dir(const char *dir)
- {
- int matched = 0;
- recursive_action(dir,
- ACTION_RECURSE |
- ACTION_FOLLOWLINKS_L0 |
- ACTION_DEPTHFIRST,
- file_action_grep,
- NULL,
- &matched,
- 0);
- return matched;
- }
- int grep_main(int argc, char **argv) MAIN_EXTERNALLY_VISIBLE;
- int grep_main(int argc UNUSED_PARAM, char **argv)
- {
- FILE *file;
- int matched;
- llist_t *fopt = NULL;
- #if ENABLE_FEATURE_GREP_CONTEXT
- int Copt, opts;
- #endif
- INIT_G();
-
- xfunc_error_retval = 2;
-
- #if ENABLE_FEATURE_GREP_CONTEXT
-
- opts = getopt32(argv,
- "^" OPTSTR_GREP "\0" "H-h:C-AB",
- &pattern_head, &fopt, &max_matches,
- &lines_after, &lines_before, &Copt);
- if (opts & OPT_C) {
-
- if (!(opts & OPT_A))
- lines_after = Copt;
- if (!(opts & OPT_B))
- lines_before = Copt;
- }
-
- if (opts & (OPT_c|OPT_q|OPT_l|OPT_L)) {
- option_mask32 &= ~OPT_n;
- lines_before = 0;
- lines_after = 0;
- } else if (lines_before > 0) {
- if (lines_before > INT_MAX / sizeof(long long))
- lines_before = INT_MAX / sizeof(long long);
-
- before_buf = xzalloc(lines_before * sizeof(before_buf[0]));
- IF_EXTRA_COMPAT(before_buf_size = xzalloc(lines_before * sizeof(before_buf_size[0]));)
- }
- #else
-
- getopt32(argv, "^" OPTSTR_GREP "\0" "H-h:c-n:q-n:l-n:",
- &pattern_head, &fopt, &max_matches);
- #endif
- invert_search = ((option_mask32 & OPT_v) != 0);
- {
- llist_t *cur;
- for (cur = pattern_head; cur; cur = cur->link)
- cur->data = new_grep_list_data(cur->data, 0);
- }
- if (option_mask32 & OPT_f) {
- load_regexes_from_file(fopt);
- if (!pattern_head) {
-
- llist_add_to(&pattern_head, new_grep_list_data((char*) "", 0));
- invert_search ^= 1;
- }
- }
- if (ENABLE_FGREP && applet_name[0] == 'f')
- option_mask32 |= OPT_F;
- #if !ENABLE_EXTRA_COMPAT
- if (!(option_mask32 & (OPT_o | OPT_w | OPT_x)))
- reflags = REG_NOSUB;
- #endif
- if ((ENABLE_EGREP && applet_name[0] == 'e')
- || (option_mask32 & OPT_E)
- ) {
- reflags |= REG_EXTENDED;
- }
- #if ENABLE_EXTRA_COMPAT
- else {
- reflags = RE_SYNTAX_GREP;
- }
- #endif
- if (option_mask32 & OPT_i) {
- #if !ENABLE_EXTRA_COMPAT
- reflags |= REG_ICASE;
- #else
- int i;
- case_fold = xmalloc(256);
- for (i = 0; i < 256; i++)
- case_fold[i] = (unsigned char)i;
- for (i = 'a'; i <= 'z'; i++)
- case_fold[i] = (unsigned char)(i - ('a' - 'A'));
- #endif
- }
- argv += optind;
-
- if (pattern_head == NULL) {
- char *pattern;
- if (*argv == NULL)
- bb_show_usage();
- pattern = new_grep_list_data(*argv++, 0);
- llist_add_to(&pattern_head, pattern);
- }
-
- if (argv[0] && argv[1])
- print_filename = 1;
-
- if (option_mask32 & OPT_H)
- print_filename = 1;
- if (option_mask32 & OPT_h)
- print_filename = 0;
-
- matched = 0;
- do {
- cur_file = *argv;
- file = stdin;
- if (!cur_file || LONE_DASH(cur_file)) {
- cur_file = "(standard input)";
- } else {
- if (option_mask32 & OPT_r) {
- struct stat st;
- if (stat(cur_file, &st) == 0 && S_ISDIR(st.st_mode)) {
- if (!(option_mask32 & OPT_h))
- print_filename = 1;
- matched += grep_dir(cur_file);
- goto grep_done;
- }
- }
-
- file = fopen_for_read(cur_file);
- if (file == NULL) {
- if (!SUPPRESS_ERR_MSGS)
- bb_simple_perror_msg(cur_file);
- open_errors = 1;
- continue;
- }
- }
- matched += grep_file(file);
- fclose_if_not_stdin(file);
- grep_done: ;
- } while (*argv && *++argv);
-
- if (ENABLE_FEATURE_CLEAN_UP) {
- while (pattern_head) {
- llist_t *pattern_head_ptr = pattern_head;
- grep_list_data_t *gl = (grep_list_data_t *)pattern_head_ptr->data;
- pattern_head = pattern_head->link;
- if (gl->flg_mem_allocated_compiled & ALLOCATED)
- free(gl->pattern);
- if (gl->flg_mem_allocated_compiled & COMPILED)
- regfree(&gl->compiled_regex);
- free(gl);
- free(pattern_head_ptr);
- }
- }
-
- if (open_errors)
- return 2;
- return !matched;
- }
|