blob: aca469e2f21acc0925be4fb96d567a0250e9dd57 [file] [log] [blame]
/*
 * Mini grep implementation for busybox using libc regex.
 *
 * Copyright (C) 1999,2000 by Lineo, inc.
 * Written by Mark Whitley <markw@lineo.com>, <markw@enol.com>
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
 * General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
 *
 */
22
Eric Andersencc8ed391999-10-05 16:24:54 +000023#include <stdio.h>
Mark Whitleyd3721892000-06-28 22:00:26 +000024#include <stdlib.h>
25#include <unistd.h> /* for getopt() */
26#include <regex.h>
27#include <string.h> /* for strerror() */
Eric Andersencc8ed391999-10-05 16:24:54 +000028#include <errno.h>
Mark Whitleyd3721892000-06-28 22:00:26 +000029#include "internal.h"
30
extern int optind; /* index of the next argv element, maintained by getopt() */
/* errno comes from <errno.h>.  ISO C leaves the behaviour undefined when a
 * program declares the identifier itself (it is usually a macro expanding to
 * a per-thread lvalue), so it is deliberately not re-declared here. */
Eric Andersencc8ed391999-10-05 16:24:54 +000033
/* Help text passed to usage().  The first line is always present; the
 * description and option list are compiled out when BB_FEATURE_TRIVIAL_HELP
 * is defined. */
static const char grep_usage[] =
	"grep [-ihHnqvs] pattern [files...]\n"
#if !defined(BB_FEATURE_TRIVIAL_HELP)
	"\nSearch for PATTERN in each FILE or standard input.\n\n"
	"OPTIONS:\n"
	"\t-H\tprefix output lines with filename where match was found\n"
	"\t-h\tsuppress the prefixing filename on output\n"
	"\t-i\tignore case distinctions\n"
	"\t-n\tprint line number with output lines\n"
	"\t-q\tbe quiet. Returns 0 if result was found, 1 otherwise\n"
	"\t-v\tselect non-matching lines\n"
	"\t-s\tsuppress file open/read error messages\n\n"
#endif /* !BB_FEATURE_TRIVIAL_HELP */
	;
Eric Andersencc8ed391999-10-05 16:24:54 +000048
/* Number of bytes the line buffer is enlarged by each time it fills up. */
static const int GROWBY = 80;

/*
 * Option state, filled in by grep_main() while parsing the command line.
 * All of these have static storage and therefore start out as zero.
 */
static int ignore_case;       /* -i */
static int print_filename;    /* raised by -H and when several files are named, lowered by -h */
static int print_line_num;    /* -n */
static int be_quiet;          /* -q */
static int invert_search;     /* -v */
static int suppress_err_msgs; /* -s */

/*
 * Shared working state (also zero / NULL until assigned).
 */
static regex_t regex;         /* compiled form of the search pattern */
static int nmatches;          /* running count of matches */
static char *cur_file;        /* name of the file currently being read */
63
64
65/* This returns a malloc'ed char * which must be stored and free'ed */
66/* XXX: This function should probably go in a 'common'/'util'/'misc' file
67 * somewhere so it can be used by other folks. */
68static char *get_line_from_file(FILE *file)
Eric Andersenfbb39c81999-11-08 17:00:52 +000069{
Mark Whitleyd3721892000-06-28 22:00:26 +000070 int ch;
71 int idx = 0;
72 char *linebuf = NULL;
73 int linebufsz = 0;
Eric Andersenfbb39c81999-11-08 17:00:52 +000074
Mark Whitleyd3721892000-06-28 22:00:26 +000075 while (1) {
76 ch = fgetc(file);
77 if (ch == EOF)
78 break;
79 /* grow the line buffer as necessary */
80 if (idx > linebufsz-1)
81 linebuf = realloc(linebuf, linebufsz += GROWBY);
82 linebuf[idx++] = (char)ch;
83 if ((char)ch == '\n')
84 break;
Eric Andersenfbb39c81999-11-08 17:00:52 +000085 }
Mark Whitleyd3721892000-06-28 22:00:26 +000086
87 if (idx == 0)
88 return NULL;
89
90 linebuf[idx] = 0;
91 return linebuf;
Eric Andersenfbb39c81999-11-08 17:00:52 +000092}
93
Mark Whitleyd3721892000-06-28 22:00:26 +000094static void print_matched_line(char *line, int linenum)
95{
96 if (print_filename)
97 printf("%s:", cur_file);
98 if (print_line_num)
99 printf("%i:", linenum);
100
101 printf("%s", line);
102}
103
104static void grep_file(FILE *file)
105{
106 char *line = NULL;
107 int ret;
108 int linenum = 0;
109
110 while ((line = get_line_from_file(file)) != NULL) {
111 linenum++;
112 ret = regexec(&regex, line, 0, NULL, 0);
113 if (ret == 0 && !invert_search) { /* match */
114
115 /* if we found a match but were told to be quiet, stop here and
116 * return success */
117 if (be_quiet) {
118 regfree(&regex);
119 exit(0);
120 }
121
122 nmatches++;
123
124 print_matched_line(line, linenum);
125
126 } else if (ret == REG_NOMATCH && invert_search) {
127 print_matched_line(line, linenum);
128 }
129
130 free(line);
131 }
132}
Eric Andersencc8ed391999-10-05 16:24:54 +0000133
Erik Andersene49d5ec2000-02-08 19:58:47 +0000134extern int grep_main(int argc, char **argv)
Eric Andersencc8ed391999-10-05 16:24:54 +0000135{
Mark Whitleyd3721892000-06-28 22:00:26 +0000136 int opt;
137 int reflags;
138 int ret;
Eric Andersencc8ed391999-10-05 16:24:54 +0000139
Mark Whitleyd3721892000-06-28 22:00:26 +0000140 /* do special-case option parsing */
141 if (argv[1] && (strcmp(argv[1], "--help") == 0))
Eric Andersen3e0fbae1999-10-19 06:02:44 +0000142 usage(grep_usage);
Erik Andersene49d5ec2000-02-08 19:58:47 +0000143
Mark Whitleyd3721892000-06-28 22:00:26 +0000144 /* do normal option parsing */
145 while ((opt = getopt(argc, argv, "iHhnqvs")) > 0) {
146 switch (opt) {
Erik Andersene49d5ec2000-02-08 19:58:47 +0000147 case 'i':
Mark Whitleyd3721892000-06-28 22:00:26 +0000148 ignore_case++;
Erik Andersene49d5ec2000-02-08 19:58:47 +0000149 break;
Mark Whitleyd3721892000-06-28 22:00:26 +0000150 case 'H':
151 print_filename++;
152 break;
Erik Andersene49d5ec2000-02-08 19:58:47 +0000153 case 'h':
Mark Whitleyd3721892000-06-28 22:00:26 +0000154 print_filename--;
Erik Andersene49d5ec2000-02-08 19:58:47 +0000155 break;
Erik Andersene49d5ec2000-02-08 19:58:47 +0000156 case 'n':
Mark Whitleyd3721892000-06-28 22:00:26 +0000157 print_line_num++;
Erik Andersene49d5ec2000-02-08 19:58:47 +0000158 break;
Erik Andersene49d5ec2000-02-08 19:58:47 +0000159 case 'q':
Mark Whitleyd3721892000-06-28 22:00:26 +0000160 be_quiet++;
Erik Andersene49d5ec2000-02-08 19:58:47 +0000161 break;
John Beppuf93a95d2000-04-24 18:07:30 +0000162 case 'v':
Mark Whitleyd3721892000-06-28 22:00:26 +0000163 invert_search++;
John Beppuf93a95d2000-04-24 18:07:30 +0000164 break;
Mark Whitleyd3721892000-06-28 22:00:26 +0000165 case 's':
166 suppress_err_msgs++;
167 break;
Eric Andersen053b1462000-06-13 06:24:53 +0000168 }
Eric Andersen053b1462000-06-13 06:24:53 +0000169 }
170
Mark Whitleyd3721892000-06-28 22:00:26 +0000171 /* argv[optind] should be the regex pattern; no pattern, no worky */
172 if (argv[optind] == NULL)
173 usage(grep_usage);
174
175 /* compile the regular expression */
176 reflags = REG_NOSUB; /* we're not going to mess with sub-expressions */
177 if (ignore_case)
178 reflags |= REG_ICASE;
179 if ((ret = regcomp(&regex, argv[optind], reflags)) != 0) {
180 int errmsgsz = regerror(ret, &regex, NULL, 0);
181 char *errmsg = malloc(errmsgsz);
182 if (errmsg == NULL) {
183 fprintf(stderr, "grep: memory error\n");
184 regfree(&regex);
185 exit(1);
186 }
187 regerror(ret, &regex, errmsg, errmsgsz);
188 fprintf(stderr, "grep: %s\n", errmsg);
189 free(errmsg);
190 regfree(&regex);
191 exit(1);
Erik Andersene49d5ec2000-02-08 19:58:47 +0000192 }
193
Mark Whitleyd3721892000-06-28 22:00:26 +0000194 /* argv[(optind+1)..(argc-1)] should be names of file to grep through. If
195 * there is more than one file to grep, we will print the filenames */
196 if ((argc-1) - (optind+1) > 0)
197 print_filename++;
Erik Andersene49d5ec2000-02-08 19:58:47 +0000198
Mark Whitleyd3721892000-06-28 22:00:26 +0000199 /* If no files were specified, take input from stdin. Otherwise, we grep
200 * through all the files specified. */
201 if (argv[optind+1] == NULL) {
202 grep_file(stdin);
Erik Andersene49d5ec2000-02-08 19:58:47 +0000203 } else {
Mark Whitleyd3721892000-06-28 22:00:26 +0000204 int i;
205 FILE *file;
206 for (i = optind + 1; i < argc; i++) {
207 cur_file = argv[i];
208 file = fopen(cur_file, "r");
209 if (file == NULL) {
210 if (!suppress_err_msgs)
211 fprintf(stderr, "grep: %s: %s\n", cur_file, strerror(errno));
212 } else {
213 grep_file(file);
214 fclose(file);
Erik Andersene49d5ec2000-02-08 19:58:47 +0000215 }
Erik Andersene49d5ec2000-02-08 19:58:47 +0000216 }
217 }
Mark Whitleyd3721892000-06-28 22:00:26 +0000218
219 regfree(&regex);
220
221 if (nmatches == 0)
222 return 1;
223
224 return 0;
Eric Andersencc8ed391999-10-05 16:24:54 +0000225}