/* vi: set sw=4 ts=4: */
/*
 * Mini grep implementation for busybox using libc regex.
 *
 * Copyright (C) 1999,2000,2001 by Lineo, inc. and Mark Whitley
 * Copyright (C) 1999,2000,2001 by Mark Whitley <markw@codepoet.org>
 *
 * Licensed under GPLv2 or later, see file LICENSE in this source tree.
 */
/* BB_AUDIT SUSv3 defects - formerly: unsupported option -x "match whole line only" (now implemented, see OPT_x). */
/* BB_AUDIT GNU defects - always acts as -a. */
/* http://www.opengroup.org/onlinepubs/007904975/utilities/grep.html */
/*
 * 2004,2006 (C) Vladimir Oleynik <dzo@simtreas.ru> -
 * correction "-e pattern1 -e pattern2" logic and more optimizations.
 * precompiled regex
 *
 * (C) 2006 Jac Goudsmit added -o option
 */
|
2010-05-09 04:22:48 +02:00
|
|
|
//config:config GREP
//config: bool "grep (8.6 kb)"
//config: default y
//config: help
//config: grep is used to search files for a specified pattern.
//config:
//config:config EGREP
//config: bool "egrep (7.8 kb)"
//config: default y
//config: help
//config: Alias to "grep -E".
//config:
//config:config FGREP
//config: bool "fgrep (7.8 kb)"
//config: default y
//config: help
//config: Alias to "grep -F".
//config:
//config:config FEATURE_GREP_CONTEXT
//config: bool "Enable before and after context flags (-A, -B and -C)"
//config: default y
//config: depends on GREP || EGREP || FGREP
//config: help
//config: Print the specified number of leading (-B) and/or trailing (-A)
//config: context surrounding our matching lines.
//config: Print the specified number of context lines (-C).
|
2010-05-09 04:22:48 +02:00
|
|
|
|
2016-11-14 05:09:48 +01:00
|
|
|
//applet:IF_GREP(APPLET(grep, BB_DIR_BIN, BB_SUID_DROP))
// APPLET_ODDNAME:name main location suid_type help
//applet:IF_EGREP(APPLET_ODDNAME(egrep, grep, BB_DIR_BIN, BB_SUID_DROP, egrep))
//applet:IF_FGREP(APPLET_ODDNAME(fgrep, grep, BB_DIR_BIN, BB_SUID_DROP, fgrep))

//kbuild:lib-$(CONFIG_GREP) += grep.o
//kbuild:lib-$(CONFIG_EGREP) += grep.o
//kbuild:lib-$(CONFIG_FGREP) += grep.o
|
|
|
|
|
2007-05-26 19:00:18 +00:00
|
|
|
#include "libbb.h"
|
2016-04-21 16:26:30 +02:00
|
|
|
#include "common_bufsiz.h"
|
2005-09-14 16:59:11 +00:00
|
|
|
#include "xregex.h"
|
2000-06-28 22:00:26 +00:00
|
|
|
|
2010-06-15 15:40:16 +02:00
|
|
|
|
2000-06-28 22:00:26 +00:00
|
|
|
/* options */
//usage:#define grep_trivial_usage
//usage: "[-HhnlLoqvsriwFE"
//usage: IF_EXTRA_COMPAT("z")
//usage: "] [-m N] "
//usage: IF_FEATURE_GREP_CONTEXT("[-A/B/C N] ")
//usage: "PATTERN/-e PATTERN.../-f FILE [FILE]..."
//usage:#define grep_full_usage "\n\n"
//usage: "Search for PATTERN in FILEs (or stdin)\n"
//usage: "\n -H Add 'filename:' prefix"
//usage: "\n -h Do not add 'filename:' prefix"
//usage: "\n -n Add 'line_no:' prefix"
//usage: "\n -l Show only names of files that match"
//usage: "\n -L Show only names of files that don't match"
//usage: "\n -c Show only count of matching lines"
//usage: "\n -o Show only the matching part of line"
//usage: "\n -q Quiet. Return 0 if PATTERN is found, 1 otherwise"
//usage: "\n -v Select non-matching lines"
//usage: "\n -s Suppress open and read errors"
//usage: "\n -r Recurse"
//usage: "\n -i Ignore case"
//usage: "\n -w Match whole words only"
//usage: "\n -x Match whole lines only"
//usage: "\n -F PATTERN is a literal (not regexp)"
//usage: "\n -E PATTERN is an extended regexp"
//usage: IF_EXTRA_COMPAT(
//usage: "\n -z Input is NUL terminated"
//usage: )
//usage: "\n -m N Match up to N times per file"
//usage: IF_FEATURE_GREP_CONTEXT(
//usage: "\n -A N Print N lines of trailing context"
//usage: "\n -B N Print N lines of leading context"
//usage: "\n -C N Same as '-A N -B N'"
//usage: )
//usage: "\n -e PTRN Pattern to match"
//usage: "\n -f FILE Read pattern from file"
//usage:
//usage:#define grep_example_usage
//usage: "$ grep root /etc/passwd\n"
//usage: "root:x:0:0:root:/root:/bin/bash\n"
//usage: "$ grep ^[rR]oo. /etc/passwd\n"
//usage: "root:x:0:0:root:/root:/bin/bash\n"
//usage:
//usage:#define egrep_trivial_usage NOUSAGE_STR
//usage:#define egrep_full_usage ""
//usage:#define fgrep_trivial_usage NOUSAGE_STR
//usage:#define fgrep_full_usage ""
|
|
|
|
|
2017-08-08 21:55:02 +02:00
|
|
|
/*
 * Option string for grep.
 * -e,-f are lists; -m,-A,-B,-C have numeric param.
 * The letters are listed in the same order as the OPTBIT_xxx enumerators
 * below; the two trailing letters (-a, -I) are accepted but have no
 * OPTBIT_xxx of their own.
 */
#define OPTSTR_GREP \
	"lnqvscFiHhe:*f:*Lorm:+wx" \
	IF_FEATURE_GREP_CONTEXT("A:+B:+C:+") \
	"E" \
	IF_EXTRA_COMPAT("z") \
	"aI"
/* ignored: -a "assume all files to be text" */
/* ignored: -I "assume binary files have no matches" */
|
2007-02-25 02:38:20 +00:00
|
|
|
enum {
|
2007-07-15 12:39:08 +00:00
|
|
|
OPTBIT_l, /* list matched file names only */
|
|
|
|
OPTBIT_n, /* print line# */
|
2008-05-19 09:29:47 +00:00
|
|
|
OPTBIT_q, /* quiet - exit(EXIT_SUCCESS) of first match */
|
2007-07-15 12:39:08 +00:00
|
|
|
OPTBIT_v, /* invert the match, to select non-matching lines */
|
|
|
|
OPTBIT_s, /* suppress errors about file open errors */
|
|
|
|
OPTBIT_c, /* count matches per file (suppresses normal output) */
|
|
|
|
OPTBIT_F, /* literal match */
|
|
|
|
OPTBIT_i, /* case-insensitive */
|
|
|
|
OPTBIT_H, /* force filename display */
|
|
|
|
OPTBIT_h, /* inhibit filename display */
|
|
|
|
OPTBIT_e, /* -e PATTERN */
|
|
|
|
OPTBIT_f, /* -f FILE_WITH_PATTERNS */
|
|
|
|
OPTBIT_L, /* list unmatched file names only */
|
|
|
|
OPTBIT_o, /* show only matching parts of lines */
|
|
|
|
OPTBIT_r, /* recurse dirs */
|
|
|
|
OPTBIT_m, /* -m MAX_MATCHES */
|
2010-04-26 08:45:44 +02:00
|
|
|
OPTBIT_w, /* -w whole word match */
|
2012-02-23 14:20:22 +00:00
|
|
|
OPTBIT_x, /* -x whole line match */
|
2009-04-21 11:09:40 +00:00
|
|
|
IF_FEATURE_GREP_CONTEXT( OPTBIT_A ,) /* -A NUM: after-match context */
|
|
|
|
IF_FEATURE_GREP_CONTEXT( OPTBIT_B ,) /* -B NUM: before-match context */
|
|
|
|
IF_FEATURE_GREP_CONTEXT( OPTBIT_C ,) /* -C NUM: -A and -B combined */
|
2016-11-14 05:09:48 +01:00
|
|
|
OPTBIT_E, /* extended regexp */
|
2009-04-21 11:09:40 +00:00
|
|
|
IF_EXTRA_COMPAT( OPTBIT_z ,) /* input is NUL terminated */
|
2007-02-25 02:38:20 +00:00
|
|
|
OPT_l = 1 << OPTBIT_l,
|
|
|
|
OPT_n = 1 << OPTBIT_n,
|
|
|
|
OPT_q = 1 << OPTBIT_q,
|
|
|
|
OPT_v = 1 << OPTBIT_v,
|
|
|
|
OPT_s = 1 << OPTBIT_s,
|
|
|
|
OPT_c = 1 << OPTBIT_c,
|
|
|
|
OPT_F = 1 << OPTBIT_F,
|
|
|
|
OPT_i = 1 << OPTBIT_i,
|
|
|
|
OPT_H = 1 << OPTBIT_H,
|
|
|
|
OPT_h = 1 << OPTBIT_h,
|
|
|
|
OPT_e = 1 << OPTBIT_e,
|
|
|
|
OPT_f = 1 << OPTBIT_f,
|
|
|
|
OPT_L = 1 << OPTBIT_L,
|
|
|
|
OPT_o = 1 << OPTBIT_o,
|
|
|
|
OPT_r = 1 << OPTBIT_r,
|
2007-07-15 12:39:08 +00:00
|
|
|
OPT_m = 1 << OPTBIT_m,
|
2010-04-26 08:45:44 +02:00
|
|
|
OPT_w = 1 << OPTBIT_w,
|
2012-02-23 14:20:22 +00:00
|
|
|
OPT_x = 1 << OPTBIT_x,
|
2009-04-21 11:09:40 +00:00
|
|
|
OPT_A = IF_FEATURE_GREP_CONTEXT( (1 << OPTBIT_A)) + 0,
|
|
|
|
OPT_B = IF_FEATURE_GREP_CONTEXT( (1 << OPTBIT_B)) + 0,
|
|
|
|
OPT_C = IF_FEATURE_GREP_CONTEXT( (1 << OPTBIT_C)) + 0,
|
2016-11-14 05:09:48 +01:00
|
|
|
OPT_E = 1 << OPTBIT_E,
|
2009-04-21 11:09:40 +00:00
|
|
|
OPT_z = IF_EXTRA_COMPAT( (1 << OPTBIT_z)) + 0,
|
2007-02-25 02:38:20 +00:00
|
|
|
};
|
|
|
|
|
2007-06-08 15:41:27 +00:00
|
|
|
/* Readable predicates over option_mask32; each is nonzero when the option is set */
#define PRINT_FILES_WITH_MATCHES    (option_mask32 & OPT_l)
#define PRINT_LINE_NUM              (option_mask32 & OPT_n)
#define BE_QUIET                    (option_mask32 & OPT_q)
#define SUPPRESS_ERR_MSGS           (option_mask32 & OPT_s)
#define PRINT_MATCH_COUNTS          (option_mask32 & OPT_c)
#define FGREP_FLAG                  (option_mask32 & OPT_F)
#define PRINT_FILES_WITHOUT_MATCHES (option_mask32 & OPT_L)
/* OPT_z is 0 unless EXTRA_COMPAT is enabled, so this is then constant-false */
#define NUL_DELIMITED               (option_mask32 & OPT_z)
|
2003-06-20 09:01:58 +00:00
|
|
|
|
2007-09-10 12:18:32 +00:00
|
|
|
struct globals {
|
|
|
|
int max_matches;
|
2008-09-19 21:29:21 +00:00
|
|
|
#if !ENABLE_EXTRA_COMPAT
|
2007-09-10 12:18:32 +00:00
|
|
|
int reflags;
|
2008-09-19 21:29:21 +00:00
|
|
|
#else
|
|
|
|
RE_TRANSLATE_TYPE case_fold; /* RE_TRANSLATE_TYPE is [[un]signed] char* */
|
|
|
|
#endif
|
2007-09-10 12:18:32 +00:00
|
|
|
smalluint invert_search;
|
|
|
|
smalluint print_filename;
|
|
|
|
smalluint open_errors;
|
2005-09-23 15:38:49 +00:00
|
|
|
#if ENABLE_FEATURE_GREP_CONTEXT
|
2007-09-10 12:18:32 +00:00
|
|
|
smalluint did_print_line;
|
|
|
|
int lines_before;
|
|
|
|
int lines_after;
|
|
|
|
char **before_buf;
|
2009-04-21 11:09:40 +00:00
|
|
|
IF_EXTRA_COMPAT(size_t *before_buf_size;)
|
2007-09-10 12:18:32 +00:00
|
|
|
int last_line_printed;
|
|
|
|
#endif
|
|
|
|
/* globals used internally */
|
|
|
|
llist_t *pattern_head; /* growable list of patterns to match */
|
|
|
|
const char *cur_file; /* the current file we are reading */
|
2010-02-04 15:00:15 +01:00
|
|
|
} FIX_ALIASING;
|
2016-04-21 16:26:30 +02:00
|
|
|
/* The globals live in the shared bb_common_bufsiz1 buffer */
#define G (*(struct globals*)bb_common_bufsiz1)
/* Prepare the shared buffer; fails the build if struct globals does not fit in it */
#define INIT_G() do { \
	setup_common_bufsiz(); \
	BUILD_BUG_ON(sizeof(G) > COMMON_BUFSIZE); \
} while (0)
/* Short names for the fields of G, so the code can use them like plain variables */
#define max_matches       (G.max_matches)
#if !ENABLE_EXTRA_COMPAT
# define reflags          (G.reflags)
#else
# define case_fold        (G.case_fold)
/* http://www.delorie.com/gnu/docs/regex/regex_46.html */
# define reflags          re_syntax_options
# undef REG_NOSUB
# undef REG_EXTENDED
# undef REG_ICASE
/* The two poisoned names below expand to invalid C on purpose */
# define REG_NOSUB    bug:is:here /* should not be used */
/* Just RE_SYNTAX_EGREP is not enough, need to enable {n[,[m]]} too */
# define REG_EXTENDED (RE_SYNTAX_EGREP | RE_INTERVALS | RE_NO_BK_BRACES)
# define REG_ICASE    bug:is:here /* should not be used */
#endif
#define invert_search     (G.invert_search)
#define print_filename    (G.print_filename)
#define open_errors       (G.open_errors)
#define did_print_line    (G.did_print_line)
#define lines_before      (G.lines_before)
#define lines_after       (G.lines_after)
#define before_buf        (G.before_buf)
#define before_buf_size   (G.before_buf_size)
#define last_line_printed (G.last_line_printed)
#define pattern_head      (G.pattern_head)
#define cur_file          (G.cur_file)
|
|
|
|
|
2000-06-28 22:00:26 +00:00
|
|
|
|
2007-02-25 02:37:49 +00:00
|
|
|
/*
 * One entry of the pattern list (stored as the data of a pattern_head node).
 * The regex is compiled lazily by grep_file() the first time the pattern is
 * used; the COMPILED bit records that this has happened.
 */
typedef struct grep_list_data_t {
	char *pattern;
/* for GNU regex, matched_range must be persistent across grep_file() calls */
#if !ENABLE_EXTRA_COMPAT
	regex_t compiled_regex;
	regmatch_t matched_range;
#else
	struct re_pattern_buffer compiled_regex;
	struct re_registers matched_range;
#endif
/* Bits of flg_mem_allocated_compiled */
#define ALLOCATED 1 /* passed for patterns read from a -f file (their text is malloc'ed) */
#define COMPILED 2  /* compiled_regex has been set up */
	int flg_mem_allocated_compiled;
} grep_list_data_t;
|
2001-05-24 18:36:18 +00:00
|
|
|
|
2008-08-09 16:15:14 +00:00
|
|
|
#if !ENABLE_EXTRA_COMPAT
|
|
|
|
#define print_line(line, line_len, linenum, decoration) \
|
|
|
|
print_line(line, linenum, decoration)
|
|
|
|
#endif
|
|
|
|
static void print_line(const char *line, size_t line_len, int linenum, char decoration)
|
2001-02-09 00:41:10 +00:00
|
|
|
{
|
2005-09-23 15:38:49 +00:00
|
|
|
#if ENABLE_FEATURE_GREP_CONTEXT
|
2007-07-15 12:38:18 +00:00
|
|
|
/* Happens when we go to next file, immediately hit match
|
|
|
|
* and try to print prev context... from prev file! Don't do it */
|
|
|
|
if (linenum < 1)
|
|
|
|
return;
|
2004-04-14 17:51:38 +00:00
|
|
|
/* possibly print the little '--' separator */
|
2008-08-09 16:15:14 +00:00
|
|
|
if ((lines_before || lines_after) && did_print_line
|
|
|
|
&& last_line_printed != linenum - 1
|
|
|
|
) {
|
2001-02-09 00:41:10 +00:00
|
|
|
puts("--");
|
|
|
|
}
|
2007-07-15 12:38:18 +00:00
|
|
|
/* guard against printing "--" before first line of first file */
|
|
|
|
did_print_line = 1;
|
2001-02-09 00:41:10 +00:00
|
|
|
last_line_printed = linenum;
|
|
|
|
#endif
|
2006-10-14 14:24:30 +00:00
|
|
|
if (print_filename)
|
2001-02-09 00:41:10 +00:00
|
|
|
printf("%s%c", cur_file, decoration);
|
2005-09-23 15:38:49 +00:00
|
|
|
if (PRINT_LINE_NUM)
|
2001-02-09 00:41:10 +00:00
|
|
|
printf("%i%c", linenum, decoration);
|
2006-09-29 20:58:53 +00:00
|
|
|
/* Emulate weird GNU grep behavior with -ov */
|
2008-08-09 16:15:14 +00:00
|
|
|
if ((option_mask32 & (OPT_v|OPT_o)) != (OPT_v|OPT_o)) {
|
|
|
|
#if !ENABLE_EXTRA_COMPAT
|
2006-09-29 20:58:53 +00:00
|
|
|
puts(line);
|
2008-08-09 16:15:14 +00:00
|
|
|
#else
|
|
|
|
fwrite(line, 1, line_len, stdout);
|
2009-03-20 22:17:13 +00:00
|
|
|
putchar(NUL_DELIMITED ? '\0' : '\n');
|
2008-08-09 16:15:14 +00:00
|
|
|
#endif
|
|
|
|
}
|
2001-02-09 00:41:10 +00:00
|
|
|
}
|
1999-11-08 17:00:52 +00:00
|
|
|
|
2008-08-09 16:15:14 +00:00
|
|
|
#if ENABLE_EXTRA_COMPAT
/*
 * Read one record from file using getdelim().
 * Unlike getline, this one removes the trailing delimiter
 * ('\n', or NUL when -z is in effect).
 *
 * line_ptr, line_alloc_len: buffer and its allocated size, as for getdelim()
 *
 * Returns the length of the record without the delimiter.
 * When getdelim() returns <= 0 (EOF or error), that value is returned,
 * the buffer is freed and *line_ptr is reset to NULL.
 */
static ssize_t FAST_FUNC bb_getline(char **line_ptr, size_t *line_alloc_len, FILE *file)
{
	ssize_t res_sz;
	char *line;
	int delim = (NUL_DELIMITED ? '\0' : '\n');

	res_sz = getdelim(line_ptr, line_alloc_len, delim, file);
	line = *line_ptr;

	if (res_sz > 0) {
		/* The last record of a file may lack the delimiter */
		if (line[res_sz - 1] == delim)
			line[--res_sz] = '\0';
	} else {
		free(line); /* uclibc allocates a buffer even on EOF. WTF? */
		/* Do not leave the caller with a pointer to freed memory */
		*line_ptr = NULL;
	}
	return res_sz;
}
#endif
|
|
|
|
|
|
|
|
static int grep_file(FILE *file)
|
|
|
|
{
|
2007-09-10 12:18:32 +00:00
|
|
|
smalluint found;
|
2000-06-28 22:00:26 +00:00
|
|
|
int linenum = 0;
|
2000-08-06 15:25:53 +00:00
|
|
|
int nmatches = 0;
|
2008-08-09 16:15:14 +00:00
|
|
|
#if !ENABLE_EXTRA_COMPAT
|
|
|
|
char *line;
|
|
|
|
#else
|
|
|
|
char *line = NULL;
|
|
|
|
ssize_t line_len;
|
|
|
|
size_t line_alloc_len;
|
2009-12-04 02:48:14 +01:00
|
|
|
# define rm_so start[0]
|
|
|
|
# define rm_eo end[0]
|
2008-08-09 16:15:14 +00:00
|
|
|
#endif
|
2005-09-23 15:38:49 +00:00
|
|
|
#if ENABLE_FEATURE_GREP_CONTEXT
|
2001-02-09 00:41:10 +00:00
|
|
|
int print_n_lines_after = 0;
|
|
|
|
int curpos = 0; /* track where we are in the circular 'before' buffer */
|
|
|
|
int idx = 0; /* used for iteration through the circular buffer */
|
2007-07-15 12:39:08 +00:00
|
|
|
#else
|
|
|
|
enum { print_n_lines_after = 0 };
|
2009-12-04 02:48:14 +01:00
|
|
|
#endif
|
2000-06-28 22:00:26 +00:00
|
|
|
|
2008-08-09 16:15:14 +00:00
|
|
|
while (
|
|
|
|
#if !ENABLE_EXTRA_COMPAT
|
|
|
|
(line = xmalloc_fgetline(file)) != NULL
|
|
|
|
#else
|
|
|
|
(line_len = bb_getline(&line, &line_alloc_len, file)) >= 0
|
|
|
|
#endif
|
|
|
|
) {
|
2003-04-27 01:50:57 +00:00
|
|
|
llist_t *pattern_ptr = pattern_head;
|
2007-11-04 00:46:03 +00:00
|
|
|
grep_list_data_t *gl = gl; /* for gcc */
|
2003-04-27 01:50:57 +00:00
|
|
|
|
2000-06-28 22:00:26 +00:00
|
|
|
linenum++;
|
2007-09-10 12:18:32 +00:00
|
|
|
found = 0;
|
2003-04-27 01:50:57 +00:00
|
|
|
while (pattern_ptr) {
|
2006-02-28 10:10:19 +00:00
|
|
|
gl = (grep_list_data_t *)pattern_ptr->data;
|
2005-09-23 15:38:49 +00:00
|
|
|
if (FGREP_FLAG) {
|
2013-01-20 16:57:19 +01:00
|
|
|
char *match;
|
|
|
|
char *str = line;
|
|
|
|
opt_f_again:
|
|
|
|
match = ((option_mask32 & OPT_i)
|
|
|
|
? strcasestr(str, gl->pattern)
|
|
|
|
: strstr(str, gl->pattern)
|
|
|
|
);
|
|
|
|
if (match) {
|
|
|
|
if (option_mask32 & OPT_x) {
|
|
|
|
if (match != str)
|
|
|
|
goto opt_f_not_found;
|
|
|
|
if (str[strlen(gl->pattern)] != '\0')
|
|
|
|
goto opt_f_not_found;
|
|
|
|
} else
|
|
|
|
if (option_mask32 & OPT_w) {
|
2018-03-29 18:03:50 +02:00
|
|
|
char c = (match != line) ? match[-1] : ' ';
|
2013-01-20 16:57:19 +01:00
|
|
|
if (!isalnum(c) && c != '_') {
|
|
|
|
c = match[strlen(gl->pattern)];
|
|
|
|
if (!c || (!isalnum(c) && c != '_'))
|
|
|
|
goto opt_f_found;
|
|
|
|
}
|
|
|
|
str = match + 1;
|
|
|
|
goto opt_f_again;
|
|
|
|
}
|
|
|
|
opt_f_found:
|
|
|
|
found = 1;
|
|
|
|
opt_f_not_found: ;
|
|
|
|
}
|
2003-04-27 01:50:57 +00:00
|
|
|
} else {
|
2014-01-07 14:57:42 +01:00
|
|
|
#if ENABLE_EXTRA_COMPAT
|
|
|
|
unsigned start_pos;
|
2014-02-07 17:14:37 +01:00
|
|
|
#else
|
|
|
|
int match_flg;
|
2014-01-07 14:57:42 +01:00
|
|
|
#endif
|
2013-05-15 03:53:26 +02:00
|
|
|
char *match_at;
|
|
|
|
|
2016-09-17 20:58:22 +02:00
|
|
|
if (!(gl->flg_mem_allocated_compiled & COMPILED)) {
|
|
|
|
gl->flg_mem_allocated_compiled |= COMPILED;
|
2008-08-09 16:15:14 +00:00
|
|
|
#if !ENABLE_EXTRA_COMPAT
|
|
|
|
xregcomp(&gl->compiled_regex, gl->pattern, reflags);
|
|
|
|
#else
|
|
|
|
memset(&gl->compiled_regex, 0, sizeof(gl->compiled_regex));
|
2008-09-19 21:29:21 +00:00
|
|
|
gl->compiled_regex.translate = case_fold; /* for -i */
|
2008-08-09 16:15:14 +00:00
|
|
|
if (re_compile_pattern(gl->pattern, strlen(gl->pattern), &gl->compiled_regex))
|
|
|
|
bb_error_msg_and_die("bad regex '%s'", gl->pattern);
|
|
|
|
#endif
|
2006-02-28 10:10:19 +00:00
|
|
|
}
|
2008-08-09 16:15:14 +00:00
|
|
|
#if !ENABLE_EXTRA_COMPAT
|
|
|
|
gl->matched_range.rm_so = 0;
|
|
|
|
gl->matched_range.rm_eo = 0;
|
2014-02-07 17:14:37 +01:00
|
|
|
match_flg = 0;
|
2014-01-07 14:57:42 +01:00
|
|
|
#else
|
|
|
|
start_pos = 0;
|
2008-08-09 16:15:14 +00:00
|
|
|
#endif
|
2013-05-15 03:53:26 +02:00
|
|
|
match_at = line;
|
|
|
|
opt_w_again:
|
2014-01-07 14:57:42 +01:00
|
|
|
//bb_error_msg("'%s' start_pos:%d line_len:%d", match_at, start_pos, line_len);
|
2008-08-09 16:15:14 +00:00
|
|
|
if (
|
|
|
|
#if !ENABLE_EXTRA_COMPAT
|
2014-02-07 17:14:37 +01:00
|
|
|
regexec(&gl->compiled_regex, match_at, 1, &gl->matched_range, match_flg) == 0
|
2008-08-09 16:15:14 +00:00
|
|
|
#else
|
2013-05-15 03:53:26 +02:00
|
|
|
re_search(&gl->compiled_regex, match_at, line_len,
|
2014-01-07 14:57:42 +01:00
|
|
|
start_pos, /*range:*/ line_len,
|
2008-08-09 16:15:14 +00:00
|
|
|
&gl->matched_range) >= 0
|
|
|
|
#endif
|
|
|
|
) {
|
2012-02-23 14:20:22 +00:00
|
|
|
if (option_mask32 & OPT_x) {
|
2019-01-29 14:42:57 +01:00
|
|
|
found |= (gl->matched_range.rm_so == 0
|
2013-05-15 03:53:26 +02:00
|
|
|
&& match_at[gl->matched_range.rm_eo] == '\0');
|
2013-01-20 16:57:19 +01:00
|
|
|
} else
|
|
|
|
if (!(option_mask32 & OPT_w)) {
|
2007-09-10 12:18:32 +00:00
|
|
|
found = 1;
|
2012-02-23 14:20:22 +00:00
|
|
|
} else {
|
2007-02-25 02:38:20 +00:00
|
|
|
char c = ' ';
|
2014-02-27 14:56:12 +01:00
|
|
|
if (match_at > line || gl->matched_range.rm_so != 0) {
|
2013-05-15 03:53:26 +02:00
|
|
|
c = match_at[gl->matched_range.rm_so - 1];
|
2014-02-27 14:56:12 +01:00
|
|
|
}
|
2007-02-25 02:38:20 +00:00
|
|
|
if (!isalnum(c) && c != '_') {
|
2013-05-15 03:53:26 +02:00
|
|
|
c = match_at[gl->matched_range.rm_eo];
|
2014-02-27 14:56:12 +01:00
|
|
|
}
|
|
|
|
if (!isalnum(c) && c != '_') {
|
|
|
|
found = 1;
|
|
|
|
} else {
|
2014-01-07 14:57:42 +01:00
|
|
|
/*
|
|
|
|
* Why check gl->matched_range.rm_eo?
|
|
|
|
* Zero-length match makes -w skip the line:
|
|
|
|
* "echo foo | grep ^" prints "foo",
|
|
|
|
* "echo foo | grep -w ^" prints nothing.
|
|
|
|
* Without such check, we can loop forever.
|
|
|
|
*/
|
|
|
|
#if !ENABLE_EXTRA_COMPAT
|
2014-02-27 14:56:12 +01:00
|
|
|
if (gl->matched_range.rm_eo != 0) {
|
|
|
|
match_at += gl->matched_range.rm_eo;
|
|
|
|
match_flg |= REG_NOTBOL;
|
|
|
|
goto opt_w_again;
|
|
|
|
}
|
2014-01-07 14:57:42 +01:00
|
|
|
#else
|
2014-02-27 14:56:12 +01:00
|
|
|
if (gl->matched_range.rm_eo > start_pos) {
|
|
|
|
start_pos = gl->matched_range.rm_eo;
|
|
|
|
goto opt_w_again;
|
2013-05-15 03:53:26 +02:00
|
|
|
}
|
2014-02-27 14:56:12 +01:00
|
|
|
#endif
|
2007-02-25 02:38:20 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2003-04-27 01:50:57 +00:00
|
|
|
}
|
2019-01-28 19:41:12 +02:00
|
|
|
/* If it's a non-inverted search, we can stop
|
|
|
|
* at first match and report it.
|
|
|
|
* If it's an inverted search, we can move on
|
|
|
|
* to the next line of input, ignoring the
|
|
|
|
* rest of the patterns.
|
|
|
|
*/
|
|
|
|
if (found) {
|
|
|
|
//if (invert_search)
|
|
|
|
// goto do_not_found;
|
|
|
|
//goto do_found;
|
|
|
|
break; // this accomplishes both
|
|
|
|
}
|
2003-06-20 09:01:58 +00:00
|
|
|
pattern_ptr = pattern_ptr->link;
|
|
|
|
} /* while (pattern_ptr) */
|
|
|
|
|
2007-09-10 12:18:32 +00:00
|
|
|
if (found ^ invert_search) {
|
2019-01-28 19:41:12 +02:00
|
|
|
//do_found:
|
2007-02-25 02:37:49 +00:00
|
|
|
/* keep track of matches */
|
|
|
|
nmatches++;
|
2001-05-24 18:36:18 +00:00
|
|
|
|
2007-07-15 12:38:18 +00:00
|
|
|
/* quiet/print (non)matching file names only? */
|
|
|
|
if (option_mask32 & (OPT_q|OPT_l|OPT_L)) {
|
|
|
|
free(line); /* we don't need line anymore */
|
|
|
|
if (BE_QUIET) {
|
|
|
|
/* manpage says about -q:
|
|
|
|
* "exit immediately with zero status
|
|
|
|
* if any match is found,
|
|
|
|
* even if errors were detected" */
|
2008-05-19 09:29:47 +00:00
|
|
|
exit(EXIT_SUCCESS);
|
2007-07-15 12:38:18 +00:00
|
|
|
}
|
|
|
|
/* if we're just printing filenames, we stop after the first match */
|
|
|
|
if (PRINT_FILES_WITH_MATCHES) {
|
|
|
|
puts(cur_file);
|
2008-02-11 11:44:38 +00:00
|
|
|
/* fall through to "return 1" */
|
2007-07-15 12:38:18 +00:00
|
|
|
}
|
|
|
|
/* OPT_L aka PRINT_FILES_WITHOUT_MATCHES: return early */
|
|
|
|
return 1; /* one match */
|
|
|
|
}
|
2001-05-24 18:36:18 +00:00
|
|
|
|
2007-07-15 12:39:08 +00:00
|
|
|
#if ENABLE_FEATURE_GREP_CONTEXT
|
|
|
|
/* Were we printing context and saw next (unwanted) match? */
|
|
|
|
if ((option_mask32 & OPT_m) && nmatches > max_matches)
|
|
|
|
break;
|
|
|
|
#endif
|
|
|
|
|
2007-02-25 02:37:49 +00:00
|
|
|
/* print the matched line */
|
|
|
|
if (PRINT_MATCH_COUNTS == 0) {
|
2005-09-23 15:38:49 +00:00
|
|
|
#if ENABLE_FEATURE_GREP_CONTEXT
|
2007-02-25 02:37:49 +00:00
|
|
|
int prevpos = (curpos == 0) ? lines_before - 1 : curpos - 1;
|
|
|
|
|
|
|
|
/* if we were told to print 'before' lines and there is at least
|
|
|
|
* one line in the circular buffer, print them */
|
|
|
|
if (lines_before && before_buf[prevpos] != NULL) {
|
|
|
|
int first_buf_entry_line_num = linenum - lines_before;
|
|
|
|
|
|
|
|
/* advance to the first entry in the circular buffer, and
|
|
|
|
* figure out the line number is of the first line in the
|
|
|
|
* buffer */
|
|
|
|
idx = curpos;
|
|
|
|
while (before_buf[idx] == NULL) {
|
|
|
|
idx = (idx + 1) % lines_before;
|
|
|
|
first_buf_entry_line_num++;
|
2001-02-09 00:41:10 +00:00
|
|
|
}
|
|
|
|
|
2007-02-25 02:37:49 +00:00
|
|
|
/* now print each line in the buffer, clearing them as we go */
|
|
|
|
while (before_buf[idx] != NULL) {
|
2008-08-09 16:15:14 +00:00
|
|
|
print_line(before_buf[idx], before_buf_size[idx], first_buf_entry_line_num, '-');
|
2007-02-25 02:37:49 +00:00
|
|
|
free(before_buf[idx]);
|
|
|
|
before_buf[idx] = NULL;
|
|
|
|
idx = (idx + 1) % lines_before;
|
|
|
|
first_buf_entry_line_num++;
|
2006-09-29 20:58:53 +00:00
|
|
|
}
|
2001-05-24 18:36:18 +00:00
|
|
|
}
|
2007-02-25 02:37:49 +00:00
|
|
|
|
|
|
|
/* make a note that we need to print 'after' lines */
|
|
|
|
print_n_lines_after = lines_after;
|
|
|
|
#endif
|
2007-02-25 02:38:20 +00:00
|
|
|
if (option_mask32 & OPT_o) {
|
2007-11-04 00:46:03 +00:00
|
|
|
if (FGREP_FLAG) {
|
|
|
|
/* -Fo just prints the pattern
|
2017-04-17 16:13:32 +02:00
|
|
|
* (unless -v: -Fov doesn't print anything at all) */
|
2007-11-04 00:46:03 +00:00
|
|
|
if (found)
|
2008-08-09 16:15:14 +00:00
|
|
|
print_line(gl->pattern, strlen(gl->pattern), linenum, ':');
|
2008-09-30 22:37:29 +00:00
|
|
|
} else while (1) {
|
2010-08-23 02:39:47 +02:00
|
|
|
unsigned start = gl->matched_range.rm_so;
|
2009-07-29 01:20:09 +02:00
|
|
|
unsigned end = gl->matched_range.rm_eo;
|
2010-08-23 02:39:47 +02:00
|
|
|
unsigned len = end - start;
|
2009-07-29 01:20:09 +02:00
|
|
|
char old = line[end];
|
|
|
|
line[end] = '\0';
|
2010-08-23 02:39:47 +02:00
|
|
|
/* Empty match is not printed: try "echo test | grep -o ''" */
|
|
|
|
if (len != 0)
|
|
|
|
print_line(line + start, len, linenum, ':');
|
2009-12-04 02:48:14 +01:00
|
|
|
if (old == '\0')
|
|
|
|
break;
|
2009-07-29 01:20:09 +02:00
|
|
|
line[end] = old;
|
2010-08-23 02:39:47 +02:00
|
|
|
if (len == 0)
|
|
|
|
end++;
|
2008-09-30 22:37:29 +00:00
|
|
|
#if !ENABLE_EXTRA_COMPAT
|
2009-07-29 01:20:09 +02:00
|
|
|
if (regexec(&gl->compiled_regex, line + end,
|
|
|
|
1, &gl->matched_range, REG_NOTBOL) != 0)
|
|
|
|
break;
|
|
|
|
gl->matched_range.rm_so += end;
|
|
|
|
gl->matched_range.rm_eo += end;
|
2008-09-30 22:37:29 +00:00
|
|
|
#else
|
|
|
|
if (re_search(&gl->compiled_regex, line, line_len,
|
2009-07-29 01:20:09 +02:00
|
|
|
end, line_len - end,
|
2008-09-30 22:37:29 +00:00
|
|
|
&gl->matched_range) < 0)
|
|
|
|
break;
|
|
|
|
#endif
|
2008-11-24 13:25:20 +00:00
|
|
|
}
|
2007-02-25 02:37:49 +00:00
|
|
|
} else {
|
2008-08-09 16:15:14 +00:00
|
|
|
print_line(line, line_len, linenum, ':');
|
2007-02-25 02:37:49 +00:00
|
|
|
}
|
2001-02-09 00:41:10 +00:00
|
|
|
}
|
2007-02-25 02:37:49 +00:00
|
|
|
}
|
2005-09-23 15:38:49 +00:00
|
|
|
#if ENABLE_FEATURE_GREP_CONTEXT
|
2007-02-25 02:37:49 +00:00
|
|
|
else { /* no match */
|
2019-01-28 19:41:12 +02:00
|
|
|
//do_not_found:
|
2007-07-15 12:38:18 +00:00
|
|
|
/* if we need to print some context lines after the last match, do so */
|
2007-07-15 12:39:08 +00:00
|
|
|
if (print_n_lines_after) {
|
2008-08-09 16:15:14 +00:00
|
|
|
print_line(line, strlen(line), linenum, '-');
|
2007-07-15 12:38:18 +00:00
|
|
|
print_n_lines_after--;
|
|
|
|
} else if (lines_before) {
|
|
|
|
/* Add the line to the circular 'before' buffer */
|
2007-02-25 02:37:49 +00:00
|
|
|
free(before_buf[curpos]);
|
2007-07-15 12:38:18 +00:00
|
|
|
before_buf[curpos] = line;
|
2009-04-21 11:09:40 +00:00
|
|
|
IF_EXTRA_COMPAT(before_buf_size[curpos] = line_len;)
|
2007-02-25 02:37:49 +00:00
|
|
|
curpos = (curpos + 1) % lines_before;
|
2008-03-17 09:09:09 +00:00
|
|
|
/* avoid free(line) - we took the line */
|
2007-07-15 12:39:08 +00:00
|
|
|
line = NULL;
|
2001-01-04 15:11:52 +00:00
|
|
|
}
|
2007-02-25 02:37:49 +00:00
|
|
|
}
|
2001-02-09 00:41:10 +00:00
|
|
|
|
2005-09-23 15:38:49 +00:00
|
|
|
#endif /* ENABLE_FEATURE_GREP_CONTEXT */
|
2008-08-09 16:15:14 +00:00
|
|
|
#if !ENABLE_EXTRA_COMPAT
|
2000-06-28 22:00:26 +00:00
|
|
|
free(line);
|
2008-08-09 16:15:14 +00:00
|
|
|
#endif
|
2007-07-15 12:39:08 +00:00
|
|
|
/* Did we print all context after last requested match? */
|
|
|
|
if ((option_mask32 & OPT_m)
|
2009-03-20 22:17:13 +00:00
|
|
|
&& !print_n_lines_after
|
|
|
|
&& nmatches == max_matches
|
|
|
|
) {
|
2007-07-15 12:39:08 +00:00
|
|
|
break;
|
2009-03-20 22:17:13 +00:00
|
|
|
}
|
2008-08-09 16:15:14 +00:00
|
|
|
} /* while (read line) */
|
2000-07-18 18:37:01 +00:00
|
|
|
|
2001-05-14 19:40:32 +00:00
|
|
|
/* special-case file post-processing for options where we don't print line
|
2001-05-21 21:13:00 +00:00
|
|
|
* matches, just filenames and possibly match counts */
|
2001-05-14 19:40:32 +00:00
|
|
|
|
2001-05-21 21:13:00 +00:00
|
|
|
/* grep -c: print [filename:]count, even if count is zero */
|
2005-09-23 15:38:49 +00:00
|
|
|
if (PRINT_MATCH_COUNTS) {
|
2006-10-14 14:24:30 +00:00
|
|
|
if (print_filename)
|
2001-05-21 21:13:00 +00:00
|
|
|
printf("%s:", cur_file);
|
2006-10-03 19:56:34 +00:00
|
|
|
printf("%d\n", nmatches);
|
2001-05-14 19:40:32 +00:00
|
|
|
}
|
2001-05-21 21:13:00 +00:00
|
|
|
|
2007-07-15 12:38:18 +00:00
|
|
|
/* grep -L: print just the filename */
|
|
|
|
if (PRINT_FILES_WITHOUT_MATCHES) {
|
|
|
|
/* nmatches is zero, no need to check it:
|
|
|
|
* we return 1 early if we detected a match
|
|
|
|
* and PRINT_FILES_WITHOUT_MATCHES is set */
|
2004-05-26 11:47:55 +00:00
|
|
|
puts(cur_file);
|
|
|
|
}
|
|
|
|
|
2003-06-20 09:01:58 +00:00
|
|
|
return nmatches;
|
2001-05-24 18:36:18 +00:00
|
|
|
}
|
|
|
|
|
2006-02-28 10:10:19 +00:00
|
|
|
#if ENABLE_FEATURE_CLEAN_UP
|
|
|
|
#define new_grep_list_data(p, m) add_grep_list_data(p, m)
|
2007-09-10 12:18:32 +00:00
|
|
|
static char *add_grep_list_data(char *pattern, int flg_used_mem)
|
2006-02-28 10:10:19 +00:00
|
|
|
#else
|
|
|
|
#define new_grep_list_data(p, m) add_grep_list_data(p)
|
2007-09-10 12:18:32 +00:00
|
|
|
static char *add_grep_list_data(char *pattern)
|
2006-02-28 10:10:19 +00:00
|
|
|
#endif
|
|
|
|
{
|
2007-09-10 12:18:32 +00:00
|
|
|
grep_list_data_t *gl = xzalloc(sizeof(*gl));
|
2006-02-28 10:10:19 +00:00
|
|
|
gl->pattern = pattern;
|
|
|
|
#if ENABLE_FEATURE_CLEAN_UP
|
2016-09-17 20:58:22 +02:00
|
|
|
gl->flg_mem_allocated_compiled = flg_used_mem;
|
2006-02-28 10:10:19 +00:00
|
|
|
#else
|
2016-09-17 20:58:22 +02:00
|
|
|
/*gl->flg_mem_allocated_compiled = 0;*/
|
2006-02-28 10:10:19 +00:00
|
|
|
#endif
|
|
|
|
return (char *)gl;
|
|
|
|
}
|
|
|
|
|
2003-06-20 09:01:58 +00:00
|
|
|
/*
 * Read patterns, one per line, from every file named in the fopt list
 * and add each of them to pattern_head (marked ALLOCATED).
 * The fopt list nodes are freed as they are consumed; the file name
 * strings they point to are not.
 */
static void load_regexes_from_file(llist_t *fopt)
{
	while (fopt) {
		char *line;
		FILE *fp;
		llist_t *cur = fopt;
		char *ffile = cur->data;

		/* unlink and free the node before using its data */
		fopt = cur->link;
		free(cur);
		fp = xfopen_stdin(ffile);
		while ((line = xmalloc_fgetline(fp)) != NULL) {
			/* the list entry takes ownership of line */
			llist_add_to(&pattern_head,
				new_grep_list_data(line, ALLOCATED));
		}
		fclose_if_not_stdin(fp);
	}
}
|
|
|
|
|
2008-06-27 02:52:20 +00:00
|
|
|
/*
 * Per-file callback handed to recursive_action() by grep_dir().
 *
 * filename - path of the entry being visited.
 * statbuf  - stat data supplied by the walker; only st_mode is examined,
 *            to detect symlinks.
 * matched  - points to an int accumulator; the result of grep_file() for
 *            this file is added to it.
 * depth    - unused.
 *
 * Returns 1 when the entry was handled (grepped, or deliberately skipped
 * because it is a symlink to a directory), 0 when it could not be
 * examined. In the latter case open_errors is set so that grep_main()
 * reports exit status 2.
 */
static int FAST_FUNC file_action_grep(const char *filename,
		struct stat *statbuf,
		void* matched,
		int depth UNUSED_PARAM)
{
	FILE *file;

	/* If we are given a link to a directory, we should bail out now, rather
	 * than trying to open the "file" and hoping getline gives us nothing,
	 * since that is not portable across operating systems (FreeBSD for
	 * example will return the raw directory contents). */
	if (S_ISLNK(statbuf->st_mode)) {
		struct stat sb;

		if (stat(filename, &sb) != 0) {
			if (!SUPPRESS_ERR_MSGS)
				bb_simple_perror_msg(filename);
			/* A link whose target cannot be examined is an error
			 * just like a failed open below: remember it so the
			 * exit status matches the message we printed. */
			open_errors = 1;
			return 0;
		}
		if (S_ISDIR(sb.st_mode))
			return 1;
	}

	file = fopen_for_read(filename);
	if (file == NULL) {
		if (!SUPPRESS_ERR_MSGS)
			bb_simple_perror_msg(filename);
		open_errors = 1;
		return 0;
	}
	cur_file = filename;
	*(int*)matched += grep_file(file);
	fclose(file);
	return 1;
}
|
|
|
|
|
|
|
|
static int grep_dir(const char *dir)
|
|
|
|
{
|
|
|
|
int matched = 0;
|
|
|
|
recursive_action(dir,
|
2007-04-08 10:52:28 +00:00
|
|
|
/* recurse=yes */ ACTION_RECURSE |
|
2014-08-28 15:50:09 +02:00
|
|
|
/* followLinks=command line only */ ACTION_FOLLOWLINKS_L0 |
|
2007-04-08 10:52:28 +00:00
|
|
|
/* depthFirst=yes */ ACTION_DEPTHFIRST,
|
2006-10-14 14:24:30 +00:00
|
|
|
/* fileAction= */ file_action_grep,
|
|
|
|
/* dirAction= */ NULL,
|
2006-10-27 23:42:25 +00:00
|
|
|
/* userData= */ &matched,
|
|
|
|
/* depth= */ 0);
|
2006-10-14 14:24:30 +00:00
|
|
|
return matched;
|
|
|
|
}
|
|
|
|
|
2007-10-11 10:05:36 +00:00
|
|
|
int grep_main(int argc, char **argv) MAIN_EXTERNALLY_VISIBLE;
|
2010-01-04 14:15:38 +01:00
|
|
|
int grep_main(int argc UNUSED_PARAM, char **argv)
|
1999-10-05 16:24:54 +00:00
|
|
|
{
|
2003-06-20 09:01:58 +00:00
|
|
|
FILE *file;
|
|
|
|
int matched;
|
2004-10-08 08:10:57 +00:00
|
|
|
llist_t *fopt = NULL;
|
2005-09-23 15:38:49 +00:00
|
|
|
#if ENABLE_FEATURE_GREP_CONTEXT
|
2010-10-02 12:42:28 +02:00
|
|
|
int Copt, opts;
|
2016-03-28 22:12:09 +02:00
|
|
|
#endif
|
2016-06-20 00:36:21 +02:00
|
|
|
INIT_G();
|
2003-06-20 09:01:58 +00:00
|
|
|
|
2016-03-28 22:12:09 +02:00
|
|
|
/* For grep, exitcode of 1 is "not found". Other errors are 2: */
|
|
|
|
xfunc_error_retval = 2;
|
|
|
|
|
|
|
|
/* do normal option parsing */
|
|
|
|
#if ENABLE_FEATURE_GREP_CONTEXT
|
2017-08-08 21:55:02 +02:00
|
|
|
/* -H unsets -h; -C unsets -A,-B */
|
2018-07-13 20:40:40 +02:00
|
|
|
opts = getopt32long(argv, "^"
|
|
|
|
OPTSTR_GREP
|
|
|
|
"\0"
|
|
|
|
"H-h:C-AB",
|
|
|
|
"color\0" Optional_argument "\xff",
|
2008-03-17 09:09:09 +00:00
|
|
|
&pattern_head, &fopt, &max_matches,
|
2018-07-13 20:40:40 +02:00
|
|
|
&lines_after, &lines_before, &Copt
|
|
|
|
, NULL
|
|
|
|
);
|
2003-06-20 09:01:58 +00:00
|
|
|
|
2010-10-02 12:42:28 +02:00
|
|
|
if (opts & OPT_C) {
|
2006-10-22 11:42:51 +00:00
|
|
|
/* -C unsets prev -A and -B, but following -A or -B
|
2013-01-14 15:57:44 +01:00
|
|
|
* may override it */
|
2010-10-02 12:42:28 +02:00
|
|
|
if (!(opts & OPT_A)) /* not overridden */
|
2008-03-17 09:09:09 +00:00
|
|
|
lines_after = Copt;
|
2010-10-02 12:42:28 +02:00
|
|
|
if (!(opts & OPT_B)) /* not overridden */
|
2008-03-17 09:09:09 +00:00
|
|
|
lines_before = Copt;
|
2005-09-23 15:38:49 +00:00
|
|
|
}
|
2006-10-22 11:42:51 +00:00
|
|
|
/* sanity checks */
|
2010-10-02 12:42:28 +02:00
|
|
|
if (opts & (OPT_c|OPT_q|OPT_l|OPT_L)) {
|
2007-02-25 02:38:20 +00:00
|
|
|
option_mask32 &= ~OPT_n;
|
2003-06-20 09:01:58 +00:00
|
|
|
lines_before = 0;
|
|
|
|
lines_after = 0;
|
2008-08-09 16:15:14 +00:00
|
|
|
} else if (lines_before > 0) {
|
2010-10-02 12:42:28 +02:00
|
|
|
if (lines_before > INT_MAX / sizeof(long long))
|
|
|
|
lines_before = INT_MAX / sizeof(long long);
|
|
|
|
/* overflow in (lines_before * sizeof(x)) is prevented (above) */
|
2008-08-09 16:15:14 +00:00
|
|
|
before_buf = xzalloc(lines_before * sizeof(before_buf[0]));
|
2009-04-21 11:09:40 +00:00
|
|
|
IF_EXTRA_COMPAT(before_buf_size = xzalloc(lines_before * sizeof(before_buf_size[0]));)
|
2008-08-09 16:15:14 +00:00
|
|
|
}
|
2003-06-20 09:01:58 +00:00
|
|
|
#else
|
|
|
|
/* with auto sanity checks */
|
2017-08-08 21:55:02 +02:00
|
|
|
getopt32(argv, "^" OPTSTR_GREP "\0" "H-h:c-n:q-n:l-n:", // why trailing ":"?
|
2008-03-17 09:09:09 +00:00
|
|
|
&pattern_head, &fopt, &max_matches);
|
2003-06-20 09:01:58 +00:00
|
|
|
#endif
|
2007-02-25 02:38:20 +00:00
|
|
|
invert_search = ((option_mask32 & OPT_v) != 0); /* 0 | 1 */
|
2005-09-23 15:38:49 +00:00
|
|
|
|
2011-08-28 12:39:04 +02:00
|
|
|
{ /* convert char **argv to grep_list_data_t */
|
2006-02-28 10:10:19 +00:00
|
|
|
llist_t *cur;
|
2006-09-29 21:04:12 +00:00
|
|
|
for (cur = pattern_head; cur; cur = cur->link)
|
2006-02-28 10:10:19 +00:00
|
|
|
cur->data = new_grep_list_data(cur->data, 0);
|
|
|
|
}
|
2011-08-28 12:39:04 +02:00
|
|
|
if (option_mask32 & OPT_f) {
|
2003-06-20 09:01:58 +00:00
|
|
|
load_regexes_from_file(fopt);
|
2011-08-28 12:39:04 +02:00
|
|
|
if (!pattern_head) { /* -f EMPTY_FILE? */
|
|
|
|
/* GNU grep treats it as "nothing matches" */
|
|
|
|
llist_add_to(&pattern_head, new_grep_list_data((char*) "", 0));
|
|
|
|
invert_search ^= 1;
|
|
|
|
}
|
|
|
|
}
|
2003-06-20 09:01:58 +00:00
|
|
|
|
2016-11-14 05:09:48 +01:00
|
|
|
if (ENABLE_FGREP && applet_name[0] == 'f')
|
2007-02-25 02:38:20 +00:00
|
|
|
option_mask32 |= OPT_F;
|
2005-07-31 22:41:05 +00:00
|
|
|
|
2008-09-19 21:29:21 +00:00
|
|
|
#if !ENABLE_EXTRA_COMPAT
|
2013-05-07 12:32:21 +01:00
|
|
|
if (!(option_mask32 & (OPT_o | OPT_w | OPT_x)))
|
2006-09-29 20:58:53 +00:00
|
|
|
reflags = REG_NOSUB;
|
2008-09-19 21:29:21 +00:00
|
|
|
#endif
|
2006-09-29 20:58:53 +00:00
|
|
|
|
2016-11-14 05:09:48 +01:00
|
|
|
if ((ENABLE_EGREP && applet_name[0] == 'e')
|
|
|
|
|| (option_mask32 & OPT_E)
|
2007-09-10 12:18:32 +00:00
|
|
|
) {
|
2006-09-29 20:58:53 +00:00
|
|
|
reflags |= REG_EXTENDED;
|
2007-09-10 12:18:32 +00:00
|
|
|
}
|
2008-09-19 21:32:51 +00:00
|
|
|
#if ENABLE_EXTRA_COMPAT
|
|
|
|
else {
|
|
|
|
reflags = RE_SYNTAX_GREP;
|
|
|
|
}
|
|
|
|
#endif
|
2003-06-20 09:01:58 +00:00
|
|
|
|
2008-09-19 21:29:21 +00:00
|
|
|
if (option_mask32 & OPT_i) {
|
|
|
|
#if !ENABLE_EXTRA_COMPAT
|
2003-06-20 09:01:58 +00:00
|
|
|
reflags |= REG_ICASE;
|
2008-09-19 21:29:21 +00:00
|
|
|
#else
|
|
|
|
int i;
|
|
|
|
case_fold = xmalloc(256);
|
|
|
|
for (i = 0; i < 256; i++)
|
|
|
|
case_fold[i] = (unsigned char)i;
|
|
|
|
for (i = 'a'; i <= 'z'; i++)
|
|
|
|
case_fold[i] = (unsigned char)(i - ('a' - 'A'));
|
|
|
|
#endif
|
|
|
|
}
|
2003-06-20 09:01:58 +00:00
|
|
|
|
|
|
|
argv += optind;
|
2000-06-13 06:24:53 +00:00
|
|
|
|
2008-03-17 09:09:09 +00:00
|
|
|
/* if we didn't get a pattern from -e and no command file was specified,
|
|
|
|
* first parameter should be the pattern. no pattern, no worky */
|
2003-04-27 01:50:57 +00:00
|
|
|
if (pattern_head == NULL) {
|
2007-02-25 02:38:20 +00:00
|
|
|
char *pattern;
|
2003-06-20 09:01:58 +00:00
|
|
|
if (*argv == NULL)
|
2003-03-19 09:13:01 +00:00
|
|
|
bb_show_usage();
|
2007-02-25 02:38:20 +00:00
|
|
|
pattern = new_grep_list_data(*argv++, 0);
|
|
|
|
llist_add_to(&pattern_head, pattern);
|
2001-05-24 18:36:18 +00:00
|
|
|
}
|
2000-06-28 22:00:26 +00:00
|
|
|
|
2008-06-07 05:19:31 +00:00
|
|
|
/* argv[0..(argc-1)] should be names of file to grep through. If
|
2006-10-14 14:24:30 +00:00
|
|
|
* there is more than one file to grep, we will print the filenames. */
|
2010-01-04 14:15:38 +01:00
|
|
|
if (argv[0] && argv[1])
|
2006-10-14 14:24:30 +00:00
|
|
|
print_filename = 1;
|
2006-10-22 11:42:51 +00:00
|
|
|
/* -H / -h of course override */
|
2007-02-25 02:38:20 +00:00
|
|
|
if (option_mask32 & OPT_H)
|
2006-10-22 11:42:51 +00:00
|
|
|
print_filename = 1;
|
2007-02-25 02:38:20 +00:00
|
|
|
if (option_mask32 & OPT_h)
|
2006-10-22 11:42:51 +00:00
|
|
|
print_filename = 0;
|
1999-10-05 16:24:54 +00:00
|
|
|
|
2000-06-28 22:59:30 +00:00
|
|
|
/* If no files were specified, or '-' was specified, take input from
|
|
|
|
* stdin. Otherwise, we grep through all the files specified. */
|
2003-06-20 09:01:58 +00:00
|
|
|
matched = 0;
|
2007-09-10 12:18:32 +00:00
|
|
|
do {
|
2010-01-04 14:15:38 +01:00
|
|
|
cur_file = *argv;
|
2006-10-14 14:24:30 +00:00
|
|
|
file = stdin;
|
2008-03-17 09:09:09 +00:00
|
|
|
if (!cur_file || LONE_DASH(cur_file)) {
|
2005-09-23 15:38:49 +00:00
|
|
|
cur_file = "(standard input)";
|
2003-06-20 09:01:58 +00:00
|
|
|
} else {
|
2007-02-25 02:38:20 +00:00
|
|
|
if (option_mask32 & OPT_r) {
|
2006-10-14 14:24:30 +00:00
|
|
|
struct stat st;
|
|
|
|
if (stat(cur_file, &st) == 0 && S_ISDIR(st.st_mode)) {
|
2007-02-25 02:38:20 +00:00
|
|
|
if (!(option_mask32 & OPT_h))
|
2006-10-14 14:51:59 +00:00
|
|
|
print_filename = 1;
|
2006-10-14 14:24:30 +00:00
|
|
|
matched += grep_dir(cur_file);
|
|
|
|
goto grep_done;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
/* else: fopen(dir) will succeed, but reading won't */
|
2008-07-21 23:05:26 +00:00
|
|
|
file = fopen_for_read(cur_file);
|
2006-10-14 14:24:30 +00:00
|
|
|
if (file == NULL) {
|
|
|
|
if (!SUPPRESS_ERR_MSGS)
|
2007-10-01 11:58:38 +00:00
|
|
|
bb_simple_perror_msg(cur_file);
|
2006-10-14 14:24:30 +00:00
|
|
|
open_errors = 1;
|
|
|
|
continue;
|
2000-07-18 21:02:06 +00:00
|
|
|
}
|
2000-02-08 19:58:47 +00:00
|
|
|
}
|
2006-10-14 14:24:30 +00:00
|
|
|
matched += grep_file(file);
|
2006-10-26 23:25:17 +00:00
|
|
|
fclose_if_not_stdin(file);
|
2007-07-15 12:39:08 +00:00
|
|
|
grep_done: ;
|
2010-01-04 14:15:38 +01:00
|
|
|
} while (*argv && *++argv);
|
2003-06-20 09:01:58 +00:00
|
|
|
|
2017-04-17 16:13:32 +02:00
|
|
|
/* destroy all the elements in the pattern list */
|
2006-02-28 10:10:19 +00:00
|
|
|
if (ENABLE_FEATURE_CLEAN_UP) {
|
|
|
|
while (pattern_head) {
|
|
|
|
llist_t *pattern_head_ptr = pattern_head;
|
2007-09-10 12:18:32 +00:00
|
|
|
grep_list_data_t *gl = (grep_list_data_t *)pattern_head_ptr->data;
|
2006-02-28 10:10:19 +00:00
|
|
|
|
|
|
|
pattern_head = pattern_head->link;
|
2016-09-17 20:58:22 +02:00
|
|
|
if (gl->flg_mem_allocated_compiled & ALLOCATED)
|
2006-02-28 10:10:19 +00:00
|
|
|
free(gl->pattern);
|
2016-09-17 20:58:22 +02:00
|
|
|
if (gl->flg_mem_allocated_compiled & COMPILED)
|
2008-08-09 16:15:14 +00:00
|
|
|
regfree(&gl->compiled_regex);
|
2007-04-12 18:29:27 +00:00
|
|
|
free(gl);
|
2006-02-28 10:10:19 +00:00
|
|
|
free(pattern_head_ptr);
|
|
|
|
}
|
2000-02-08 19:58:47 +00:00
|
|
|
}
|
2005-09-23 15:38:49 +00:00
|
|
|
/* 0 = success, 1 = failed, 2 = error */
|
2006-10-14 14:24:30 +00:00
|
|
|
if (open_errors)
|
2005-09-23 13:50:24 +00:00
|
|
|
return 2;
|
2007-09-10 12:18:32 +00:00
|
|
|
return !matched; /* invert return value: 0 = success, 1 = failed */
|
2000-06-28 22:00:26 +00:00
|
|
|
}
|