Denis Vlasenko | e559e0a | 2008-07-15 21:09:30 +0000 | [diff] [blame] | 1 | /* vi: set sw=4 ts=4: */ |
| 2 | /* |
| 3 | * config file parser helper |
| 4 | * |
| 5 | * Copyright (C) 2008 by Vladimir Dronnikov <dronnikov@gmail.com> |
| 6 | * |
Denys Vlasenko | 0ef64bd | 2010-08-16 20:14:46 +0200 | [diff] [blame^] | 7 | * Licensed under GPLv2 or later, see file LICENSE in this source tree. |
Bernhard Reutner-Fischer | f3b39a2 | 2009-02-23 16:21:53 +0000 | [diff] [blame] | 8 | * Also for use in uClibc (http://uclibc.org/) licensed under LGPLv2.1 or later. |
Denis Vlasenko | e559e0a | 2008-07-15 21:09:30 +0000 | [diff] [blame] | 9 | */ |
| 10 | |
| 11 | #include "libbb.h" |
| 12 | |
Denis Vlasenko | 2d5bd80 | 2008-10-24 10:49:49 +0000 | [diff] [blame] | 13 | #if defined ENABLE_PARSE && ENABLE_PARSE |
Denis Vlasenko | 2e157dd | 2008-07-19 09:27:19 +0000 | [diff] [blame] | 14 | int parse_main(int argc, char **argv) MAIN_EXTERNALLY_VISIBLE; |
| 15 | int parse_main(int argc UNUSED_PARAM, char **argv) |
| 16 | { |
| 17 | const char *delims = "# \t"; |
Denis Vlasenko | 084266e | 2008-07-26 23:08:31 +0000 | [diff] [blame] | 18 | unsigned flags = PARSE_NORMAL; |
Denis Vlasenko | 2e157dd | 2008-07-19 09:27:19 +0000 | [diff] [blame] | 19 | int mintokens = 0, ntokens = 128; |
Denis Vlasenko | 084266e | 2008-07-26 23:08:31 +0000 | [diff] [blame] | 20 | |
Denis Vlasenko | 2e157dd | 2008-07-19 09:27:19 +0000 | [diff] [blame] | 21 | opt_complementary = "-1:n+:m+:f+"; |
| 22 | getopt32(argv, "n:m:d:f:", &ntokens, &mintokens, &delims, &flags); |
| 23 | //argc -= optind; |
| 24 | argv += optind; |
| 25 | while (*argv) { |
| 26 | parser_t *p = config_open(*argv); |
| 27 | if (p) { |
| 28 | int n; |
| 29 | char **t = xmalloc(sizeof(char *) * ntokens); |
Denis Vlasenko | 4a717e0 | 2008-07-20 13:01:56 +0000 | [diff] [blame] | 30 | while ((n = config_read(p, t, ntokens, mintokens, delims, flags)) != 0) { |
Denis Vlasenko | 2e157dd | 2008-07-19 09:27:19 +0000 | [diff] [blame] | 31 | for (int i = 0; i < n; ++i) |
| 32 | printf("[%s]", t[i]); |
| 33 | puts(""); |
| 34 | } |
| 35 | config_close(p); |
| 36 | } |
| 37 | argv++; |
| 38 | } |
| 39 | return EXIT_SUCCESS; |
| 40 | } |
| 41 | #endif |
| 42 | |
Denis Vlasenko | e559e0a | 2008-07-15 21:09:30 +0000 | [diff] [blame] | 43 | /* |
| 44 | |
| 45 | Typical usage: |
| 46 | |
| 47 | ----- CUT ----- |
| 48 | char *t[3]; // tokens placeholder |
Denis Vlasenko | 2e157dd | 2008-07-19 09:27:19 +0000 | [diff] [blame] | 49 | parser_t *p = config_open(filename); |
| 50 | if (p) { |
Denis Vlasenko | e559e0a | 2008-07-15 21:09:30 +0000 | [diff] [blame] | 51 | // parse line-by-line |
Denis Vlasenko | 2e157dd | 2008-07-19 09:27:19 +0000 | [diff] [blame] | 52 | while (config_read(p, t, 3, 0, delimiters, flags)) { // 1..3 tokens |
Denis Vlasenko | e559e0a | 2008-07-15 21:09:30 +0000 | [diff] [blame] | 53 | // use tokens |
| 54 | bb_error_msg("TOKENS: [%s][%s][%s]", t[0], t[1], t[2]); |
| 55 | } |
| 56 | ... |
| 57 | // free parser |
Denis Vlasenko | 2e157dd | 2008-07-19 09:27:19 +0000 | [diff] [blame] | 58 | config_close(p); |
Denis Vlasenko | e559e0a | 2008-07-15 21:09:30 +0000 | [diff] [blame] | 59 | } |
| 60 | ----- CUT ----- |
| 61 | |
| 62 | */ |
| 63 | |
Denis Vlasenko | 5415c85 | 2008-07-21 23:05:26 +0000 | [diff] [blame] | 64 | parser_t* FAST_FUNC config_open2(const char *filename, FILE* FAST_FUNC (*fopen_func)(const char *path)) |
Denis Vlasenko | e559e0a | 2008-07-15 21:09:30 +0000 | [diff] [blame] | 65 | { |
Denis Vlasenko | 084266e | 2008-07-26 23:08:31 +0000 | [diff] [blame] | 66 | FILE* fp; |
| 67 | parser_t *parser; |
| 68 | |
| 69 | fp = fopen_func(filename); |
| 70 | if (!fp) |
| 71 | return NULL; |
| 72 | parser = xzalloc(sizeof(*parser)); |
| 73 | parser->fp = fp; |
| 74 | return parser; |
Denis Vlasenko | e559e0a | 2008-07-15 21:09:30 +0000 | [diff] [blame] | 75 | } |
| 76 | |
Denis Vlasenko | 5415c85 | 2008-07-21 23:05:26 +0000 | [diff] [blame] | 77 | parser_t* FAST_FUNC config_open(const char *filename) |
| 78 | { |
| 79 | return config_open2(filename, fopen_or_warn_stdin); |
| 80 | } |
| 81 | |
Denis Vlasenko | c7cc5a9 | 2009-04-19 01:27:20 +0000 | [diff] [blame] | 82 | static void config_free_data(parser_t *parser) |
Denis Vlasenko | e559e0a | 2008-07-15 21:09:30 +0000 | [diff] [blame] | 83 | { |
Denis Vlasenko | c01340f | 2008-07-16 22:12:18 +0000 | [diff] [blame] | 84 | free(parser->line); |
Denis Vlasenko | 2e157dd | 2008-07-19 09:27:19 +0000 | [diff] [blame] | 85 | parser->line = NULL; |
Denis Vlasenko | dcb3fcb | 2008-07-19 22:57:00 +0000 | [diff] [blame] | 86 | if (PARSE_KEEP_COPY) { /* compile-time constant */ |
Denis Vlasenko | 2e157dd | 2008-07-19 09:27:19 +0000 | [diff] [blame] | 87 | free(parser->data); |
| 88 | parser->data = NULL; |
Denis Vlasenko | dcb3fcb | 2008-07-19 22:57:00 +0000 | [diff] [blame] | 89 | } |
Bernhard Reutner-Fischer | 6792128 | 2008-07-17 11:59:13 +0000 | [diff] [blame] | 90 | } |
Denis Vlasenko | 2e157dd | 2008-07-19 09:27:19 +0000 | [diff] [blame] | 91 | |
Bernhard Reutner-Fischer | 6792128 | 2008-07-17 11:59:13 +0000 | [diff] [blame] | 92 | void FAST_FUNC config_close(parser_t *parser) |
| 93 | { |
Denis Vlasenko | 084266e | 2008-07-26 23:08:31 +0000 | [diff] [blame] | 94 | if (parser) { |
| 95 | config_free_data(parser); |
| 96 | fclose(parser->fp); |
| 97 | free(parser); |
| 98 | } |
Denis Vlasenko | e559e0a | 2008-07-15 21:09:30 +0000 | [diff] [blame] | 99 | } |
| 100 | |
Denis Vlasenko | 2e157dd | 2008-07-19 09:27:19 +0000 | [diff] [blame] | 101 | /* |
Denis Vlasenko | 084266e | 2008-07-26 23:08:31 +0000 | [diff] [blame] | 102 | 0. If parser is NULL return 0. |
| 103 | 1. Read a line from config file. If nothing to read then return 0. |
| 104 | Handle continuation character. Advance lineno for each physical line. |
Denys Vlasenko | 5370bfb | 2009-09-06 02:58:59 +0200 | [diff] [blame] | 105 | Discard everything past comment character. |
Denis Vlasenko | 084266e | 2008-07-26 23:08:31 +0000 | [diff] [blame] | 106 | 2. if PARSE_TRIM is set (default), remove leading and trailing delimiters. |
Denis Vlasenko | 2e157dd | 2008-07-19 09:27:19 +0000 | [diff] [blame] | 107 | 3. If resulting line is empty goto 1. |
Denis Vlasenko | 084266e | 2008-07-26 23:08:31 +0000 | [diff] [blame] | 108 | 4. Look for first delimiter. If !PARSE_COLLAPSE or !PARSE_TRIM is set then |
| 109 | remember the token as empty. |
| 110 | 5. Else (default) if number of seen tokens is equal to max number of tokens |
| 111 | (token is the last one) and PARSE_GREEDY is set then the remainder |
| 112 | of the line is the last token. |
| 113 | Else (token is not last or PARSE_GREEDY is not set) just replace |
| 114 | first delimiter with '\0' thus delimiting the token. |
| 115 | 6. Advance line pointer past the end of token. If number of seen tokens |
| 116 | is less than required number of tokens then goto 4. |
7. Check the number of seen tokens is not less than the min number of tokens.
| 118 | Complain or die otherwise depending on PARSE_MIN_DIE. |
Denis Vlasenko | 2e157dd | 2008-07-19 09:27:19 +0000 | [diff] [blame] | 119 | 8. Return the number of seen tokens. |
| 120 | |
mintokens > 0 makes config_read() print an error message if fewer than mintokens
(but more than 0) tokens are found. Empty lines are always skipped (not warned about).
| 123 | */ |
| 124 | #undef config_read |
| 125 | int FAST_FUNC config_read(parser_t *parser, char **tokens, unsigned flags, const char *delims) |
Denis Vlasenko | e559e0a | 2008-07-15 21:09:30 +0000 | [diff] [blame] | 126 | { |
Denis Vlasenko | 69f4f9a | 2008-08-09 17:16:40 +0000 | [diff] [blame] | 127 | char *line; |
| 128 | int ntokens, mintokens; |
| 129 | int t, len; |
Denis Vlasenko | 084266e | 2008-07-26 23:08:31 +0000 | [diff] [blame] | 130 | |
Denys Vlasenko | 63144be | 2010-06-26 04:00:52 +0200 | [diff] [blame] | 131 | ntokens = (uint8_t)flags; |
| 132 | mintokens = (uint8_t)(flags >> 8); |
Denis Vlasenko | e559e0a | 2008-07-15 21:09:30 +0000 | [diff] [blame] | 133 | |
Denis Vlasenko | 69f4f9a | 2008-08-09 17:16:40 +0000 | [diff] [blame] | 134 | if (parser == NULL) |
Denis Vlasenko | 084266e | 2008-07-26 23:08:31 +0000 | [diff] [blame] | 135 | return 0; |
Denis Vlasenko | 69f4f9a | 2008-08-09 17:16:40 +0000 | [diff] [blame] | 136 | |
| 137 | again: |
| 138 | memset(tokens, 0, sizeof(tokens[0]) * ntokens); |
Bernhard Reutner-Fischer | 6792128 | 2008-07-17 11:59:13 +0000 | [diff] [blame] | 139 | config_free_data(parser); |
Denis Vlasenko | e559e0a | 2008-07-15 21:09:30 +0000 | [diff] [blame] | 140 | |
Denis Vlasenko | 69f4f9a | 2008-08-09 17:16:40 +0000 | [diff] [blame] | 141 | /* Read one line (handling continuations with backslash) */ |
| 142 | line = bb_get_chunk_with_continuation(parser->fp, &len, &parser->lineno); |
| 143 | if (line == NULL) |
| 144 | return 0; |
| 145 | parser->line = line; |
Denis Vlasenko | e559e0a | 2008-07-15 21:09:30 +0000 | [diff] [blame] | 146 | |
Denis Vlasenko | 69f4f9a | 2008-08-09 17:16:40 +0000 | [diff] [blame] | 147 | /* Strip trailing line-feed if any */ |
| 148 | if (len && line[len-1] == '\n') |
| 149 | line[len-1] = '\0'; |
Bernhard Reutner-Fischer | 6792128 | 2008-07-17 11:59:13 +0000 | [diff] [blame] | 150 | |
Denis Vlasenko | 69f4f9a | 2008-08-09 17:16:40 +0000 | [diff] [blame] | 151 | /* Skip token in the start of line? */ |
| 152 | if (flags & PARSE_TRIM) |
| 153 | line += strspn(line, delims + 1); |
Denis Vlasenko | e559e0a | 2008-07-15 21:09:30 +0000 | [diff] [blame] | 154 | |
Denis Vlasenko | 69f4f9a | 2008-08-09 17:16:40 +0000 | [diff] [blame] | 155 | if (line[0] == '\0' || line[0] == delims[0]) |
| 156 | goto again; |
| 157 | |
| 158 | if (flags & PARSE_KEEP_COPY) |
Denis Vlasenko | 2e157dd | 2008-07-19 09:27:19 +0000 | [diff] [blame] | 159 | parser->data = xstrdup(line); |
Denis Vlasenko | e559e0a | 2008-07-15 21:09:30 +0000 | [diff] [blame] | 160 | |
Denis Vlasenko | 69f4f9a | 2008-08-09 17:16:40 +0000 | [diff] [blame] | 161 | /* Tokenize the line */ |
Denys Vlasenko | 63144be | 2010-06-26 04:00:52 +0200 | [diff] [blame] | 162 | t = 0; |
| 163 | do { |
Denis Vlasenko | 69f4f9a | 2008-08-09 17:16:40 +0000 | [diff] [blame] | 164 | /* Pin token */ |
| 165 | tokens[t] = line; |
| 166 | |
| 167 | /* Combine remaining arguments? */ |
| 168 | if ((t != (ntokens-1)) || !(flags & PARSE_GREEDY)) { |
| 169 | /* Vanilla token, find next delimiter */ |
| 170 | line += strcspn(line, delims[0] ? delims : delims + 1); |
Denis Vlasenko | 2e157dd | 2008-07-19 09:27:19 +0000 | [diff] [blame] | 171 | } else { |
Denis Vlasenko | 69f4f9a | 2008-08-09 17:16:40 +0000 | [diff] [blame] | 172 | /* Combining, find comment char if any */ |
| 173 | line = strchrnul(line, delims[0]); |
| 174 | |
| 175 | /* Trim any extra delimiters from the end */ |
| 176 | if (flags & PARSE_TRIM) { |
| 177 | while (strchr(delims + 1, line[-1]) != NULL) |
| 178 | line--; |
Denis Vlasenko | 0f99d49 | 2008-07-24 23:38:04 +0000 | [diff] [blame] | 179 | } |
Denis Vlasenko | e559e0a | 2008-07-15 21:09:30 +0000 | [diff] [blame] | 180 | } |
Denis Vlasenko | 69f4f9a | 2008-08-09 17:16:40 +0000 | [diff] [blame] | 181 | |
| 182 | /* Token not terminated? */ |
Denys Vlasenko | 63144be | 2010-06-26 04:00:52 +0200 | [diff] [blame] | 183 | if (*line == delims[0]) |
Denis Vlasenko | 69f4f9a | 2008-08-09 17:16:40 +0000 | [diff] [blame] | 184 | *line = '\0'; |
Denys Vlasenko | 63144be | 2010-06-26 04:00:52 +0200 | [diff] [blame] | 185 | else if (*line != '\0') |
| 186 | *line++ = '\0'; |
Denis Vlasenko | 69f4f9a | 2008-08-09 17:16:40 +0000 | [diff] [blame] | 187 | |
| 188 | #if 0 /* unused so far */ |
| 189 | if (flags & PARSE_ESCAPE) { |
| 190 | const char *from; |
| 191 | char *to; |
| 192 | |
| 193 | from = to = tokens[t]; |
| 194 | while (*from) { |
| 195 | if (*from == '\\') { |
| 196 | from++; |
| 197 | *to++ = bb_process_escape_sequence(&from); |
| 198 | } else { |
| 199 | *to++ = *from++; |
| 200 | } |
| 201 | } |
| 202 | *to = '\0'; |
| 203 | } |
| 204 | #endif |
Denis Vlasenko | 69f4f9a | 2008-08-09 17:16:40 +0000 | [diff] [blame] | 205 | /* Skip possible delimiters */ |
| 206 | if (flags & PARSE_COLLAPSE) |
| 207 | line += strspn(line, delims + 1); |
Denys Vlasenko | 63144be | 2010-06-26 04:00:52 +0200 | [diff] [blame] | 208 | |
| 209 | t++; |
| 210 | } while (*line && *line != delims[0] && t < ntokens); |
Denis Vlasenko | e559e0a | 2008-07-15 21:09:30 +0000 | [diff] [blame] | 211 | |
Denis Vlasenko | 69f4f9a | 2008-08-09 17:16:40 +0000 | [diff] [blame] | 212 | if (t < mintokens) { |
Denis Vlasenko | 5415c85 | 2008-07-21 23:05:26 +0000 | [diff] [blame] | 213 | bb_error_msg("bad line %u: %d tokens found, %d needed", |
Denis Vlasenko | 69f4f9a | 2008-08-09 17:16:40 +0000 | [diff] [blame] | 214 | parser->lineno, t, mintokens); |
Denis Vlasenko | 5415c85 | 2008-07-21 23:05:26 +0000 | [diff] [blame] | 215 | if (flags & PARSE_MIN_DIE) |
| 216 | xfunc_die(); |
Denys Vlasenko | 63144be | 2010-06-26 04:00:52 +0200 | [diff] [blame] | 217 | if (flags & PARSE_KEEP_COPY) |
| 218 | free(parser->data); |
Denis Vlasenko | 5415c85 | 2008-07-21 23:05:26 +0000 | [diff] [blame] | 219 | goto again; |
| 220 | } |
Denis Vlasenko | e559e0a | 2008-07-15 21:09:30 +0000 | [diff] [blame] | 221 | |
Denis Vlasenko | 69f4f9a | 2008-08-09 17:16:40 +0000 | [diff] [blame] | 222 | return t; |
Denis Vlasenko | e559e0a | 2008-07-15 21:09:30 +0000 | [diff] [blame] | 223 | } |