1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22#include "libbb.h"
23#include "xregex.h"
24
25
26#define OPTSTR_GREP \
27 "lnqvscFiHhe:f:Lorm:" \
28 IF_FEATURE_GREP_CONTEXT("A:B:C:") \
29 IF_FEATURE_GREP_EGREP_ALIAS("E") \
30 IF_DESKTOP("w") \
31 IF_EXTRA_COMPAT("z") \
32 "aI"
33
34
35
36
37enum {
38 OPTBIT_l,
39 OPTBIT_n,
40 OPTBIT_q,
41 OPTBIT_v,
42 OPTBIT_s,
43 OPTBIT_c,
44 OPTBIT_F,
45 OPTBIT_i,
46 OPTBIT_H,
47 OPTBIT_h,
48 OPTBIT_e,
49 OPTBIT_f,
50 OPTBIT_L,
51 OPTBIT_o,
52 OPTBIT_r,
53 OPTBIT_m,
54 IF_FEATURE_GREP_CONTEXT( OPTBIT_A ,)
55 IF_FEATURE_GREP_CONTEXT( OPTBIT_B ,)
56 IF_FEATURE_GREP_CONTEXT( OPTBIT_C ,)
57 IF_FEATURE_GREP_EGREP_ALIAS(OPTBIT_E ,)
58 IF_DESKTOP( OPTBIT_w ,)
59 IF_EXTRA_COMPAT( OPTBIT_z ,)
60 OPT_l = 1 << OPTBIT_l,
61 OPT_n = 1 << OPTBIT_n,
62 OPT_q = 1 << OPTBIT_q,
63 OPT_v = 1 << OPTBIT_v,
64 OPT_s = 1 << OPTBIT_s,
65 OPT_c = 1 << OPTBIT_c,
66 OPT_F = 1 << OPTBIT_F,
67 OPT_i = 1 << OPTBIT_i,
68 OPT_H = 1 << OPTBIT_H,
69 OPT_h = 1 << OPTBIT_h,
70 OPT_e = 1 << OPTBIT_e,
71 OPT_f = 1 << OPTBIT_f,
72 OPT_L = 1 << OPTBIT_L,
73 OPT_o = 1 << OPTBIT_o,
74 OPT_r = 1 << OPTBIT_r,
75 OPT_m = 1 << OPTBIT_m,
76 OPT_A = IF_FEATURE_GREP_CONTEXT( (1 << OPTBIT_A)) + 0,
77 OPT_B = IF_FEATURE_GREP_CONTEXT( (1 << OPTBIT_B)) + 0,
78 OPT_C = IF_FEATURE_GREP_CONTEXT( (1 << OPTBIT_C)) + 0,
79 OPT_E = IF_FEATURE_GREP_EGREP_ALIAS((1 << OPTBIT_E)) + 0,
80 OPT_w = IF_DESKTOP( (1 << OPTBIT_w)) + 0,
81 OPT_z = IF_EXTRA_COMPAT( (1 << OPTBIT_z)) + 0,
82};
83
84#define PRINT_FILES_WITH_MATCHES (option_mask32 & OPT_l)
85#define PRINT_LINE_NUM (option_mask32 & OPT_n)
86#define BE_QUIET (option_mask32 & OPT_q)
87#define SUPPRESS_ERR_MSGS (option_mask32 & OPT_s)
88#define PRINT_MATCH_COUNTS (option_mask32 & OPT_c)
89#define FGREP_FLAG (option_mask32 & OPT_F)
90#define PRINT_FILES_WITHOUT_MATCHES (option_mask32 & OPT_L)
91#define NUL_DELIMITED (option_mask32 & OPT_z)
92
93struct globals {
94 int max_matches;
95#if !ENABLE_EXTRA_COMPAT
96 int reflags;
97#else
98 RE_TRANSLATE_TYPE case_fold;
99#endif
100 smalluint invert_search;
101 smalluint print_filename;
102 smalluint open_errors;
103#if ENABLE_FEATURE_GREP_CONTEXT
104 smalluint did_print_line;
105 int lines_before;
106 int lines_after;
107 char **before_buf;
108 IF_EXTRA_COMPAT(size_t *before_buf_size;)
109 int last_line_printed;
110#endif
111
112 llist_t *pattern_head;
113 const char *cur_file;
114};
115#define G (*(struct globals*)&bb_common_bufsiz1)
116#define INIT_G() do { \
117 struct G_sizecheck { \
118 char G_sizecheck[sizeof(G) > COMMON_BUFSIZE ? -1 : 1]; \
119 }; \
120} while (0)
121#define max_matches (G.max_matches )
122#if !ENABLE_EXTRA_COMPAT
123# define reflags (G.reflags )
124#else
125# define case_fold (G.case_fold )
126
127# define reflags re_syntax_options
128# undef REG_NOSUB
129# undef REG_EXTENDED
130# undef REG_ICASE
131# define REG_NOSUB bug:is:here
132
133# define REG_EXTENDED (RE_SYNTAX_EGREP | RE_INTERVALS | RE_NO_BK_BRACES)
134# define REG_ICASE bug:is:here
135#endif
136#define invert_search (G.invert_search )
137#define print_filename (G.print_filename )
138#define open_errors (G.open_errors )
139#define did_print_line (G.did_print_line )
140#define lines_before (G.lines_before )
141#define lines_after (G.lines_after )
142#define before_buf (G.before_buf )
143#define before_buf_size (G.before_buf_size )
144#define last_line_printed (G.last_line_printed )
145#define pattern_head (G.pattern_head )
146#define cur_file (G.cur_file )
147
148
149typedef struct grep_list_data_t {
150 char *pattern;
151
152#if !ENABLE_EXTRA_COMPAT
153 regex_t compiled_regex;
154 regmatch_t matched_range;
155#else
156 struct re_pattern_buffer compiled_regex;
157 struct re_registers matched_range;
158#endif
159#define ALLOCATED 1
160#define COMPILED 2
161 int flg_mem_alocated_compiled;
162} grep_list_data_t;
163
164#if !ENABLE_EXTRA_COMPAT
165#define print_line(line, line_len, linenum, decoration) \
166 print_line(line, linenum, decoration)
167#endif
168static void print_line(const char *line, size_t line_len, int linenum, char decoration)
169{
170#if ENABLE_FEATURE_GREP_CONTEXT
171
172
173 if (linenum < 1)
174 return;
175
176 if ((lines_before || lines_after) && did_print_line
177 && last_line_printed != linenum - 1
178 ) {
179 puts("--");
180 }
181
182 did_print_line = 1;
183 last_line_printed = linenum;
184#endif
185 if (print_filename)
186 printf("%s%c", cur_file, decoration);
187 if (PRINT_LINE_NUM)
188 printf("%i%c", linenum, decoration);
189
190 if ((option_mask32 & (OPT_v|OPT_o)) != (OPT_v|OPT_o)) {
191#if !ENABLE_EXTRA_COMPAT
192 puts(line);
193#else
194 fwrite(line, 1, line_len, stdout);
195 putchar(NUL_DELIMITED ? '\0' : '\n');
196#endif
197 }
198}
199
200#if ENABLE_EXTRA_COMPAT
201
202static ssize_t FAST_FUNC bb_getline(char **line_ptr, size_t *line_alloc_len, FILE *file)
203{
204 ssize_t res_sz;
205 char *line;
206 int delim = (NUL_DELIMITED ? '\0' : '\n');
207
208 res_sz = getdelim(line_ptr, line_alloc_len, delim, file);
209 line = *line_ptr;
210
211 if (res_sz > 0) {
212 if (line[res_sz - 1] == delim)
213 line[--res_sz] = '\0';
214 } else {
215 free(line);
216 }
217 return res_sz;
218}
219#endif
220
221static int grep_file(FILE *file)
222{
223 smalluint found;
224 int linenum = 0;
225 int nmatches = 0;
226#if !ENABLE_EXTRA_COMPAT
227 char *line;
228#else
229 char *line = NULL;
230 ssize_t line_len;
231 size_t line_alloc_len;
232# define rm_so start[0]
233# define rm_eo end[0]
234#endif
235#if ENABLE_FEATURE_GREP_CONTEXT
236 int print_n_lines_after = 0;
237 int curpos = 0;
238 int idx = 0;
239#else
240 enum { print_n_lines_after = 0 };
241#endif
242
243 while (
244#if !ENABLE_EXTRA_COMPAT
245 (line = xmalloc_fgetline(file)) != NULL
246#else
247 (line_len = bb_getline(&line, &line_alloc_len, file)) >= 0
248#endif
249 ) {
250 llist_t *pattern_ptr = pattern_head;
251 grep_list_data_t *gl = gl;
252
253 linenum++;
254 found = 0;
255 while (pattern_ptr) {
256 gl = (grep_list_data_t *)pattern_ptr->data;
257 if (FGREP_FLAG) {
258 found |= (strstr(line, gl->pattern) != NULL);
259 } else {
260 if (!(gl->flg_mem_alocated_compiled & COMPILED)) {
261 gl->flg_mem_alocated_compiled |= COMPILED;
262#if !ENABLE_EXTRA_COMPAT
263 xregcomp(&gl->compiled_regex, gl->pattern, reflags);
264#else
265 memset(&gl->compiled_regex, 0, sizeof(gl->compiled_regex));
266 gl->compiled_regex.translate = case_fold;
267 if (re_compile_pattern(gl->pattern, strlen(gl->pattern), &gl->compiled_regex))
268 bb_error_msg_and_die("bad regex '%s'", gl->pattern);
269#endif
270 }
271#if !ENABLE_EXTRA_COMPAT
272 gl->matched_range.rm_so = 0;
273 gl->matched_range.rm_eo = 0;
274#endif
275 if (
276#if !ENABLE_EXTRA_COMPAT
277 regexec(&gl->compiled_regex, line, 1, &gl->matched_range, 0) == 0
278#else
279 re_search(&gl->compiled_regex, line, line_len,
280 0, line_len,
281 &gl->matched_range) >= 0
282#endif
283 ) {
284 if (!(option_mask32 & OPT_w))
285 found = 1;
286 else {
287 char c = ' ';
288 if (gl->matched_range.rm_so)
289 c = line[gl->matched_range.rm_so - 1];
290 if (!isalnum(c) && c != '_') {
291 c = line[gl->matched_range.rm_eo];
292 if (!c || (!isalnum(c) && c != '_'))
293 found = 1;
294 }
295 }
296 }
297 }
298
299
300 if (found && !invert_search)
301 goto do_found;
302 pattern_ptr = pattern_ptr->link;
303 }
304
305 if (found ^ invert_search) {
306 do_found:
307
308 nmatches++;
309
310
311 if (option_mask32 & (OPT_q|OPT_l|OPT_L)) {
312 free(line);
313 if (BE_QUIET) {
314
315
316
317
318 exit(EXIT_SUCCESS);
319 }
320
321 if (PRINT_FILES_WITH_MATCHES) {
322 puts(cur_file);
323
324 }
325
326 return 1;
327 }
328
329#if ENABLE_FEATURE_GREP_CONTEXT
330
331 if ((option_mask32 & OPT_m) && nmatches > max_matches)
332 break;
333#endif
334
335
336 if (PRINT_MATCH_COUNTS == 0) {
337#if ENABLE_FEATURE_GREP_CONTEXT
338 int prevpos = (curpos == 0) ? lines_before - 1 : curpos - 1;
339
340
341
342 if (lines_before && before_buf[prevpos] != NULL) {
343 int first_buf_entry_line_num = linenum - lines_before;
344
345
346
347
348 idx = curpos;
349 while (before_buf[idx] == NULL) {
350 idx = (idx + 1) % lines_before;
351 first_buf_entry_line_num++;
352 }
353
354
355 while (before_buf[idx] != NULL) {
356 print_line(before_buf[idx], before_buf_size[idx], first_buf_entry_line_num, '-');
357 free(before_buf[idx]);
358 before_buf[idx] = NULL;
359 idx = (idx + 1) % lines_before;
360 first_buf_entry_line_num++;
361 }
362 }
363
364
365 print_n_lines_after = lines_after;
366#endif
367 if (option_mask32 & OPT_o) {
368 if (FGREP_FLAG) {
369
370
371 if (found)
372 print_line(gl->pattern, strlen(gl->pattern), linenum, ':');
373 } else while (1) {
374 unsigned end = gl->matched_range.rm_eo;
375 char old = line[end];
376 line[end] = '\0';
377 print_line(line + gl->matched_range.rm_so,
378 end - gl->matched_range.rm_so,
379 linenum, ':');
380 if (old == '\0')
381 break;
382 line[end] = old;
383#if !ENABLE_EXTRA_COMPAT
384 if (regexec(&gl->compiled_regex, line + end,
385 1, &gl->matched_range, REG_NOTBOL) != 0)
386 break;
387 gl->matched_range.rm_so += end;
388 gl->matched_range.rm_eo += end;
389#else
390 if (re_search(&gl->compiled_regex, line, line_len,
391 end, line_len - end,
392 &gl->matched_range) < 0)
393 break;
394#endif
395 }
396 } else {
397 print_line(line, line_len, linenum, ':');
398 }
399 }
400 }
401#if ENABLE_FEATURE_GREP_CONTEXT
402 else {
403
404 if (print_n_lines_after) {
405 print_line(line, strlen(line), linenum, '-');
406 print_n_lines_after--;
407 } else if (lines_before) {
408
409 free(before_buf[curpos]);
410 before_buf[curpos] = line;
411 IF_EXTRA_COMPAT(before_buf_size[curpos] = line_len;)
412 curpos = (curpos + 1) % lines_before;
413
414 line = NULL;
415 }
416 }
417
418#endif
419#if !ENABLE_EXTRA_COMPAT
420 free(line);
421#endif
422
423 if ((option_mask32 & OPT_m)
424 && !print_n_lines_after
425 && nmatches == max_matches
426 ) {
427 break;
428 }
429 }
430
431
432
433
434
435 if (PRINT_MATCH_COUNTS) {
436 if (print_filename)
437 printf("%s:", cur_file);
438 printf("%d\n", nmatches);
439 }
440
441
442 if (PRINT_FILES_WITHOUT_MATCHES) {
443
444
445
446 puts(cur_file);
447 }
448
449 return nmatches;
450}
451
452#if ENABLE_FEATURE_CLEAN_UP
453#define new_grep_list_data(p, m) add_grep_list_data(p, m)
454static char *add_grep_list_data(char *pattern, int flg_used_mem)
455#else
456#define new_grep_list_data(p, m) add_grep_list_data(p)
457static char *add_grep_list_data(char *pattern)
458#endif
459{
460 grep_list_data_t *gl = xzalloc(sizeof(*gl));
461 gl->pattern = pattern;
462#if ENABLE_FEATURE_CLEAN_UP
463 gl->flg_mem_alocated_compiled = flg_used_mem;
464#else
465
466#endif
467 return (char *)gl;
468}
469
470static void load_regexes_from_file(llist_t *fopt)
471{
472 char *line;
473 FILE *f;
474
475 while (fopt) {
476 llist_t *cur = fopt;
477 char *ffile = cur->data;
478
479 fopt = cur->link;
480 free(cur);
481 f = xfopen_stdin(ffile);
482 while ((line = xmalloc_fgetline(f)) != NULL) {
483 llist_add_to(&pattern_head,
484 new_grep_list_data(line, ALLOCATED));
485 }
486 }
487}
488
489static int FAST_FUNC file_action_grep(const char *filename,
490 struct stat *statbuf UNUSED_PARAM,
491 void* matched,
492 int depth UNUSED_PARAM)
493{
494 FILE *file = fopen_for_read(filename);
495 if (file == NULL) {
496 if (!SUPPRESS_ERR_MSGS)
497 bb_simple_perror_msg(filename);
498 open_errors = 1;
499 return 0;
500 }
501 cur_file = filename;
502 *(int*)matched += grep_file(file);
503 fclose(file);
504 return 1;
505}
506
507static int grep_dir(const char *dir)
508{
509 int matched = 0;
510 recursive_action(dir,
511 ACTION_RECURSE |
512
513 ACTION_DEPTHFIRST,
514 file_action_grep,
515 NULL,
516 &matched,
517 0);
518 return matched;
519}
520
521int grep_main(int argc, char **argv) MAIN_EXTERNALLY_VISIBLE;
522int grep_main(int argc UNUSED_PARAM, char **argv)
523{
524 FILE *file;
525 int matched;
526 llist_t *fopt = NULL;
527
528
529#if ENABLE_FEATURE_GREP_CONTEXT
530 int Copt;
531
532
533
534 opt_complementary = "H-h:C-AB:e::f::m+:A+:B+:C+";
535 getopt32(argv,
536 OPTSTR_GREP,
537 &pattern_head, &fopt, &max_matches,
538 &lines_after, &lines_before, &Copt);
539
540 if (option_mask32 & OPT_C) {
541
542
543 if (!(option_mask32 & OPT_A))
544 lines_after = Copt;
545 if (!(option_mask32 & OPT_B))
546 lines_before = Copt;
547 }
548
549 if (option_mask32 & (OPT_c|OPT_q|OPT_l|OPT_L)) {
550 option_mask32 &= ~OPT_n;
551 lines_before = 0;
552 lines_after = 0;
553 } else if (lines_before > 0) {
554 before_buf = xzalloc(lines_before * sizeof(before_buf[0]));
555 IF_EXTRA_COMPAT(before_buf_size = xzalloc(lines_before * sizeof(before_buf_size[0]));)
556 }
557#else
558
559
560 opt_complementary = "H-h:c-n:q-n:l-n:e::f::m+";
561 getopt32(argv, OPTSTR_GREP,
562 &pattern_head, &fopt, &max_matches);
563#endif
564 invert_search = ((option_mask32 & OPT_v) != 0);
565
566 if (pattern_head != NULL) {
567
568 llist_t *cur;
569
570 for (cur = pattern_head; cur; cur = cur->link)
571 cur->data = new_grep_list_data(cur->data, 0);
572 }
573 if (option_mask32 & OPT_f)
574 load_regexes_from_file(fopt);
575
576 if (ENABLE_FEATURE_GREP_FGREP_ALIAS && applet_name[0] == 'f')
577 option_mask32 |= OPT_F;
578
579#if !ENABLE_EXTRA_COMPAT
580 if (!(option_mask32 & (OPT_o | OPT_w)))
581 reflags = REG_NOSUB;
582#endif
583
584 if (ENABLE_FEATURE_GREP_EGREP_ALIAS
585 && (applet_name[0] == 'e' || (option_mask32 & OPT_E))
586 ) {
587 reflags |= REG_EXTENDED;
588 }
589#if ENABLE_EXTRA_COMPAT
590 else {
591 reflags = RE_SYNTAX_GREP;
592 }
593#endif
594
595 if (option_mask32 & OPT_i) {
596#if !ENABLE_EXTRA_COMPAT
597 reflags |= REG_ICASE;
598#else
599 int i;
600 case_fold = xmalloc(256);
601 for (i = 0; i < 256; i++)
602 case_fold[i] = (unsigned char)i;
603 for (i = 'a'; i <= 'z'; i++)
604 case_fold[i] = (unsigned char)(i - ('a' - 'A'));
605#endif
606 }
607
608 argv += optind;
609
610
611
612 if (pattern_head == NULL) {
613 char *pattern;
614 if (*argv == NULL)
615 bb_show_usage();
616 pattern = new_grep_list_data(*argv++, 0);
617 llist_add_to(&pattern_head, pattern);
618 }
619
620
621
622 if (argv[0] && argv[1])
623 print_filename = 1;
624
625 if (option_mask32 & OPT_H)
626 print_filename = 1;
627 if (option_mask32 & OPT_h)
628 print_filename = 0;
629
630
631
632 matched = 0;
633 do {
634 cur_file = *argv;
635 file = stdin;
636 if (!cur_file || LONE_DASH(cur_file)) {
637 cur_file = "(standard input)";
638 } else {
639 if (option_mask32 & OPT_r) {
640 struct stat st;
641 if (stat(cur_file, &st) == 0 && S_ISDIR(st.st_mode)) {
642 if (!(option_mask32 & OPT_h))
643 print_filename = 1;
644 matched += grep_dir(cur_file);
645 goto grep_done;
646 }
647 }
648
649 file = fopen_for_read(cur_file);
650 if (file == NULL) {
651 if (!SUPPRESS_ERR_MSGS)
652 bb_simple_perror_msg(cur_file);
653 open_errors = 1;
654 continue;
655 }
656 }
657 matched += grep_file(file);
658 fclose_if_not_stdin(file);
659 grep_done: ;
660 } while (*argv && *++argv);
661
662
663 if (ENABLE_FEATURE_CLEAN_UP) {
664 while (pattern_head) {
665 llist_t *pattern_head_ptr = pattern_head;
666 grep_list_data_t *gl = (grep_list_data_t *)pattern_head_ptr->data;
667
668 pattern_head = pattern_head->link;
669 if (gl->flg_mem_alocated_compiled & ALLOCATED)
670 free(gl->pattern);
671 if (gl->flg_mem_alocated_compiled & COMPILED)
672 regfree(&gl->compiled_regex);
673 free(gl);
674 free(pattern_head_ptr);
675 }
676 }
677
678 if (open_errors)
679 return 2;
680 return !matched;
681}
682