Denis Vlasenko | e559e0a | 2008-07-15 21:09:30 +0000 | [diff] [blame] | 1 | /* vi: set sw=4 ts=4: */ |
| 2 | /* |
| 3 | * config file parser helper |
| 4 | * |
| 5 | * Copyright (C) 2008 by Vladimir Dronnikov <dronnikov@gmail.com> |
| 6 | * |
Denys Vlasenko | 0ef64bd | 2010-08-16 20:14:46 +0200 | [diff] [blame] | 7 | * Licensed under GPLv2 or later, see file LICENSE in this source tree. |
Bernhard Reutner-Fischer | f3b39a2 | 2009-02-23 16:21:53 +0000 | [diff] [blame] | 8 | * Also for use in uClibc (http://uclibc.org/) licensed under LGPLv2.1 or later. |
Denis Vlasenko | e559e0a | 2008-07-15 21:09:30 +0000 | [diff] [blame] | 9 | */ |
| 10 | |
Denys Vlasenko | 3a64936 | 2011-06-18 09:23:09 +0200 | [diff] [blame] | 11 | /* Uncomment to enable test applet */ |
| 12 | ////config:config PARSE |
| 13 | ////config: bool "Uniform config file parser debugging applet: parse" |
| 14 | ////config: default n |
| 15 | ////config: help |
| 16 | ////config: Typical usage of parse API: |
| 17 | ////config: char *t[3]; |
| 18 | ////config: parser_t *p = config_open(filename); |
| 19 | ////config: while (config_read(p, t, 3, 0, delimiters, flags)) { // 1..3 tokens |
| 20 | ////config: bb_error_msg("TOKENS: '%s''%s''%s'", t[0], t[1], t[2]); |
| 21 | ////config: } |
| 22 | ////config: config_close(p); |
| 23 | |
| 24 | ////applet:IF_PARSE(APPLET(parse, BB_DIR_USR_BIN, BB_SUID_DROP)) |
| 25 | |
| 26 | //kbuild:lib-y += parse_config.o |
| 27 | |
Pere Orga | 5bc8c00 | 2011-04-11 03:29:49 +0200 | [diff] [blame] | 28 | //usage:#define parse_trivial_usage |
Denys Vlasenko | 3a64936 | 2011-06-18 09:23:09 +0200 | [diff] [blame] | 29 | //usage: "[-x] [-n MAXTOKENS] [-m MINTOKENS] [-d DELIMS] [-f FLAGS] FILE..." |
| 30 | //usage:#define parse_full_usage "\n\n" |
| 31 | //usage: " -x Suppress output (for benchmarking)" |
Pere Orga | 5bc8c00 | 2011-04-11 03:29:49 +0200 | [diff] [blame] | 32 | |
Denis Vlasenko | e559e0a | 2008-07-15 21:09:30 +0000 | [diff] [blame] | 33 | #include "libbb.h" |
| 34 | |
Denis Vlasenko | 2d5bd80 | 2008-10-24 10:49:49 +0000 | [diff] [blame] | 35 | #if defined ENABLE_PARSE && ENABLE_PARSE |
Denis Vlasenko | 2e157dd | 2008-07-19 09:27:19 +0000 | [diff] [blame] | 36 | int parse_main(int argc, char **argv) MAIN_EXTERNALLY_VISIBLE; |
| 37 | int parse_main(int argc UNUSED_PARAM, char **argv) |
| 38 | { |
| 39 | const char *delims = "# \t"; |
Denys Vlasenko | 3a64936 | 2011-06-18 09:23:09 +0200 | [diff] [blame] | 40 | char **t; |
Denis Vlasenko | 084266e | 2008-07-26 23:08:31 +0000 | [diff] [blame] | 41 | unsigned flags = PARSE_NORMAL; |
Denis Vlasenko | 2e157dd | 2008-07-19 09:27:19 +0000 | [diff] [blame] | 42 | int mintokens = 0, ntokens = 128; |
Denys Vlasenko | 3a64936 | 2011-06-18 09:23:09 +0200 | [diff] [blame] | 43 | unsigned noout; |
Denis Vlasenko | 084266e | 2008-07-26 23:08:31 +0000 | [diff] [blame] | 44 | |
Denis Vlasenko | 2e157dd | 2008-07-19 09:27:19 +0000 | [diff] [blame] | 45 | opt_complementary = "-1:n+:m+:f+"; |
Denys Vlasenko | 3a64936 | 2011-06-18 09:23:09 +0200 | [diff] [blame] | 46 | noout = 1 & getopt32(argv, "xn:m:d:f:", &ntokens, &mintokens, &delims, &flags); |
Denis Vlasenko | 2e157dd | 2008-07-19 09:27:19 +0000 | [diff] [blame] | 47 | //argc -= optind; |
| 48 | argv += optind; |
Denys Vlasenko | 3a64936 | 2011-06-18 09:23:09 +0200 | [diff] [blame] | 49 | |
| 50 | t = xmalloc(sizeof(t[0]) * ntokens); |
Denis Vlasenko | 2e157dd | 2008-07-19 09:27:19 +0000 | [diff] [blame] | 51 | while (*argv) { |
Denys Vlasenko | 3a64936 | 2011-06-18 09:23:09 +0200 | [diff] [blame] | 52 | int n; |
Denis Vlasenko | 2e157dd | 2008-07-19 09:27:19 +0000 | [diff] [blame] | 53 | parser_t *p = config_open(*argv); |
Denys Vlasenko | 3a64936 | 2011-06-18 09:23:09 +0200 | [diff] [blame] | 54 | while ((n = config_read(p, t, ntokens, mintokens, delims, flags)) != 0) { |
| 55 | if (!noout) { |
Denis Vlasenko | 2e157dd | 2008-07-19 09:27:19 +0000 | [diff] [blame] | 56 | for (int i = 0; i < n; ++i) |
| 57 | printf("[%s]", t[i]); |
| 58 | puts(""); |
| 59 | } |
Denis Vlasenko | 2e157dd | 2008-07-19 09:27:19 +0000 | [diff] [blame] | 60 | } |
Denys Vlasenko | 3a64936 | 2011-06-18 09:23:09 +0200 | [diff] [blame] | 61 | config_close(p); |
Denis Vlasenko | 2e157dd | 2008-07-19 09:27:19 +0000 | [diff] [blame] | 62 | argv++; |
| 63 | } |
| 64 | return EXIT_SUCCESS; |
| 65 | } |
| 66 | #endif |
| 67 | |
Denis Vlasenko | 5415c85 | 2008-07-21 23:05:26 +0000 | [diff] [blame] | 68 | parser_t* FAST_FUNC config_open2(const char *filename, FILE* FAST_FUNC (*fopen_func)(const char *path)) |
Denis Vlasenko | e559e0a | 2008-07-15 21:09:30 +0000 | [diff] [blame] | 69 | { |
Denis Vlasenko | 084266e | 2008-07-26 23:08:31 +0000 | [diff] [blame] | 70 | FILE* fp; |
| 71 | parser_t *parser; |
| 72 | |
| 73 | fp = fopen_func(filename); |
| 74 | if (!fp) |
| 75 | return NULL; |
| 76 | parser = xzalloc(sizeof(*parser)); |
| 77 | parser->fp = fp; |
| 78 | return parser; |
Denis Vlasenko | e559e0a | 2008-07-15 21:09:30 +0000 | [diff] [blame] | 79 | } |
| 80 | |
Denis Vlasenko | 5415c85 | 2008-07-21 23:05:26 +0000 | [diff] [blame] | 81 | parser_t* FAST_FUNC config_open(const char *filename) |
| 82 | { |
| 83 | return config_open2(filename, fopen_or_warn_stdin); |
| 84 | } |
| 85 | |
Bernhard Reutner-Fischer | 6792128 | 2008-07-17 11:59:13 +0000 | [diff] [blame] | 86 | void FAST_FUNC config_close(parser_t *parser) |
| 87 | { |
Denis Vlasenko | 084266e | 2008-07-26 23:08:31 +0000 | [diff] [blame] | 88 | if (parser) { |
Timo Teras | adcabf3 | 2011-06-20 09:49:56 +0200 | [diff] [blame] | 89 | if (PARSE_KEEP_COPY) /* compile-time constant */ |
| 90 | free(parser->data); |
Denis Vlasenko | 084266e | 2008-07-26 23:08:31 +0000 | [diff] [blame] | 91 | fclose(parser->fp); |
Timo Teras | adcabf3 | 2011-06-20 09:49:56 +0200 | [diff] [blame] | 92 | free(parser->line); |
| 93 | free(parser->nline); |
Denis Vlasenko | 084266e | 2008-07-26 23:08:31 +0000 | [diff] [blame] | 94 | free(parser); |
| 95 | } |
Denis Vlasenko | e559e0a | 2008-07-15 21:09:30 +0000 | [diff] [blame] | 96 | } |
| 97 | |
Timo Teras | adcabf3 | 2011-06-20 09:49:56 +0200 | [diff] [blame] | 98 | /* This function reads an entire line from a text file, |
| 99 | * up to a newline, exclusive. |
Denys Vlasenko | a1a4483 | 2011-06-17 03:37:43 +0200 | [diff] [blame] | 100 | * Trailing '\' is recognized as line continuation. |
Timo Teras | adcabf3 | 2011-06-20 09:49:56 +0200 | [diff] [blame] | 101 | * Returns -1 if EOF/error. |
Denys Vlasenko | a1a4483 | 2011-06-17 03:37:43 +0200 | [diff] [blame] | 102 | */ |
Timo Teras | adcabf3 | 2011-06-20 09:49:56 +0200 | [diff] [blame] | 103 | static int get_line_with_continuation(parser_t *parser) |
Denys Vlasenko | a1a4483 | 2011-06-17 03:37:43 +0200 | [diff] [blame] | 104 | { |
Timo Teras | adcabf3 | 2011-06-20 09:49:56 +0200 | [diff] [blame] | 105 | ssize_t len, nlen; |
| 106 | char *line; |
Denys Vlasenko | a1a4483 | 2011-06-17 03:37:43 +0200 | [diff] [blame] | 107 | |
Timo Teras | adcabf3 | 2011-06-20 09:49:56 +0200 | [diff] [blame] | 108 | len = getline(&parser->line, &parser->line_alloc, parser->fp); |
| 109 | if (len <= 0) |
| 110 | return len; |
| 111 | |
| 112 | line = parser->line; |
| 113 | for (;;) { |
| 114 | parser->lineno++; |
| 115 | if (line[len - 1] == '\n') |
| 116 | len--; |
| 117 | if (len == 0 || line[len - 1] != '\\') |
| 118 | break; |
| 119 | len--; |
| 120 | |
| 121 | nlen = getline(&parser->nline, &parser->nline_alloc, parser->fp); |
| 122 | if (nlen <= 0) |
| 123 | break; |
| 124 | |
Tanguy Pruvot | 6fef6a3 | 2012-05-05 15:26:43 +0200 | [diff] [blame] | 125 | if ((ssize_t)parser->line_alloc < len + nlen + 1) { |
Timo Teras | adcabf3 | 2011-06-20 09:49:56 +0200 | [diff] [blame] | 126 | parser->line_alloc = len + nlen + 1; |
| 127 | line = parser->line = xrealloc(line, parser->line_alloc); |
Denys Vlasenko | a1a4483 | 2011-06-17 03:37:43 +0200 | [diff] [blame] | 128 | } |
Timo Teras | adcabf3 | 2011-06-20 09:49:56 +0200 | [diff] [blame] | 129 | memcpy(&line[len], parser->nline, nlen); |
| 130 | len += nlen; |
Denys Vlasenko | a1a4483 | 2011-06-17 03:37:43 +0200 | [diff] [blame] | 131 | } |
Timo Teras | adcabf3 | 2011-06-20 09:49:56 +0200 | [diff] [blame] | 132 | |
| 133 | line[len] = '\0'; |
| 134 | return len; |
Denys Vlasenko | a1a4483 | 2011-06-17 03:37:43 +0200 | [diff] [blame] | 135 | } |
| 136 | |
| 137 | |
Denis Vlasenko | 2e157dd | 2008-07-19 09:27:19 +0000 | [diff] [blame] | 138 | /* |
Denis Vlasenko | 084266e | 2008-07-26 23:08:31 +0000 | [diff] [blame] | 139 | 0. If parser is NULL return 0. |
| 140 | 1. Read a line from config file. If nothing to read then return 0. |
| 141 | Handle continuation character. Advance lineno for each physical line. |
Denys Vlasenko | 5370bfb | 2009-09-06 02:58:59 +0200 | [diff] [blame] | 142 | Discard everything past comment character. |
Denis Vlasenko | 084266e | 2008-07-26 23:08:31 +0000 | [diff] [blame] | 143 | 2. if PARSE_TRIM is set (default), remove leading and trailing delimiters. |
Denis Vlasenko | 2e157dd | 2008-07-19 09:27:19 +0000 | [diff] [blame] | 144 | 3. If resulting line is empty goto 1. |
Denis Vlasenko | 084266e | 2008-07-26 23:08:31 +0000 | [diff] [blame] | 145 | 4. Look for first delimiter. If !PARSE_COLLAPSE or !PARSE_TRIM is set then |
| 146 | remember the token as empty. |
| 147 | 5. Else (default) if number of seen tokens is equal to max number of tokens |
| 148 | (token is the last one) and PARSE_GREEDY is set then the remainder |
| 149 | of the line is the last token. |
| 150 | Else (token is not last or PARSE_GREEDY is not set) just replace |
| 151 | first delimiter with '\0' thus delimiting the token. |
| 152 | 6. Advance line pointer past the end of token. If number of seen tokens |
| 153 | is less than required number of tokens then goto 4. |
| 154 | 7. Check the number of seen tokens is not less the min number of tokens. |
| 155 | Complain or die otherwise depending on PARSE_MIN_DIE. |
Denis Vlasenko | 2e157dd | 2008-07-19 09:27:19 +0000 | [diff] [blame] | 156 | 8. Return the number of seen tokens. |
| 157 | |
Denis Vlasenko | 084266e | 2008-07-26 23:08:31 +0000 | [diff] [blame] | 158 | mintokens > 0 make config_read() print error message if less than mintokens |
Denis Vlasenko | 2e157dd | 2008-07-19 09:27:19 +0000 | [diff] [blame] | 159 | (but more than 0) are found. Empty lines are always skipped (not warned about). |
| 160 | */ |
| 161 | #undef config_read |
| 162 | int FAST_FUNC config_read(parser_t *parser, char **tokens, unsigned flags, const char *delims) |
Denis Vlasenko | e559e0a | 2008-07-15 21:09:30 +0000 | [diff] [blame] | 163 | { |
Denis Vlasenko | 69f4f9a | 2008-08-09 17:16:40 +0000 | [diff] [blame] | 164 | char *line; |
| 165 | int ntokens, mintokens; |
Denys Vlasenko | a1a4483 | 2011-06-17 03:37:43 +0200 | [diff] [blame] | 166 | int t; |
| 167 | |
| 168 | if (!parser) |
| 169 | return 0; |
Denis Vlasenko | 084266e | 2008-07-26 23:08:31 +0000 | [diff] [blame] | 170 | |
Denys Vlasenko | 63144be | 2010-06-26 04:00:52 +0200 | [diff] [blame] | 171 | ntokens = (uint8_t)flags; |
| 172 | mintokens = (uint8_t)(flags >> 8); |
Denis Vlasenko | e559e0a | 2008-07-15 21:09:30 +0000 | [diff] [blame] | 173 | |
Timo Teras | adcabf3 | 2011-06-20 09:49:56 +0200 | [diff] [blame] | 174 | again: |
Denis Vlasenko | 69f4f9a | 2008-08-09 17:16:40 +0000 | [diff] [blame] | 175 | memset(tokens, 0, sizeof(tokens[0]) * ntokens); |
Denis Vlasenko | e559e0a | 2008-07-15 21:09:30 +0000 | [diff] [blame] | 176 | |
Denis Vlasenko | 69f4f9a | 2008-08-09 17:16:40 +0000 | [diff] [blame] | 177 | /* Read one line (handling continuations with backslash) */ |
Timo Teras | adcabf3 | 2011-06-20 09:49:56 +0200 | [diff] [blame] | 178 | if (get_line_with_continuation(parser) < 0) |
Denis Vlasenko | 69f4f9a | 2008-08-09 17:16:40 +0000 | [diff] [blame] | 179 | return 0; |
Timo Teras | adcabf3 | 2011-06-20 09:49:56 +0200 | [diff] [blame] | 180 | |
| 181 | line = parser->line; |
Denis Vlasenko | e559e0a | 2008-07-15 21:09:30 +0000 | [diff] [blame] | 182 | |
Denis Vlasenko | 69f4f9a | 2008-08-09 17:16:40 +0000 | [diff] [blame] | 183 | /* Skip token in the start of line? */ |
| 184 | if (flags & PARSE_TRIM) |
| 185 | line += strspn(line, delims + 1); |
Denis Vlasenko | e559e0a | 2008-07-15 21:09:30 +0000 | [diff] [blame] | 186 | |
Denis Vlasenko | 69f4f9a | 2008-08-09 17:16:40 +0000 | [diff] [blame] | 187 | if (line[0] == '\0' || line[0] == delims[0]) |
| 188 | goto again; |
| 189 | |
Timo Teras | adcabf3 | 2011-06-20 09:49:56 +0200 | [diff] [blame] | 190 | if (flags & PARSE_KEEP_COPY) { |
| 191 | free(parser->data); |
Denis Vlasenko | 2e157dd | 2008-07-19 09:27:19 +0000 | [diff] [blame] | 192 | parser->data = xstrdup(line); |
Timo Teras | adcabf3 | 2011-06-20 09:49:56 +0200 | [diff] [blame] | 193 | } |
Denis Vlasenko | e559e0a | 2008-07-15 21:09:30 +0000 | [diff] [blame] | 194 | |
Denis Vlasenko | 69f4f9a | 2008-08-09 17:16:40 +0000 | [diff] [blame] | 195 | /* Tokenize the line */ |
Denys Vlasenko | 63144be | 2010-06-26 04:00:52 +0200 | [diff] [blame] | 196 | t = 0; |
| 197 | do { |
Denis Vlasenko | 69f4f9a | 2008-08-09 17:16:40 +0000 | [diff] [blame] | 198 | /* Pin token */ |
| 199 | tokens[t] = line; |
| 200 | |
| 201 | /* Combine remaining arguments? */ |
| 202 | if ((t != (ntokens-1)) || !(flags & PARSE_GREEDY)) { |
| 203 | /* Vanilla token, find next delimiter */ |
| 204 | line += strcspn(line, delims[0] ? delims : delims + 1); |
Denis Vlasenko | 2e157dd | 2008-07-19 09:27:19 +0000 | [diff] [blame] | 205 | } else { |
Denis Vlasenko | 69f4f9a | 2008-08-09 17:16:40 +0000 | [diff] [blame] | 206 | /* Combining, find comment char if any */ |
Tanguy Pruvot | 8a6c2c2 | 2012-04-28 00:24:09 +0200 | [diff] [blame] | 207 | line = strchrnul(line, PARSE_EOL_COMMENTS ? delims[0] : '\0'); |
Denis Vlasenko | 69f4f9a | 2008-08-09 17:16:40 +0000 | [diff] [blame] | 208 | |
| 209 | /* Trim any extra delimiters from the end */ |
| 210 | if (flags & PARSE_TRIM) { |
| 211 | while (strchr(delims + 1, line[-1]) != NULL) |
| 212 | line--; |
Denis Vlasenko | 0f99d49 | 2008-07-24 23:38:04 +0000 | [diff] [blame] | 213 | } |
Denis Vlasenko | e559e0a | 2008-07-15 21:09:30 +0000 | [diff] [blame] | 214 | } |
Denis Vlasenko | 69f4f9a | 2008-08-09 17:16:40 +0000 | [diff] [blame] | 215 | |
| 216 | /* Token not terminated? */ |
Denys Vlasenko | 63144be | 2010-06-26 04:00:52 +0200 | [diff] [blame] | 217 | if (*line == delims[0]) |
Denis Vlasenko | 69f4f9a | 2008-08-09 17:16:40 +0000 | [diff] [blame] | 218 | *line = '\0'; |
Denys Vlasenko | 63144be | 2010-06-26 04:00:52 +0200 | [diff] [blame] | 219 | else if (*line != '\0') |
| 220 | *line++ = '\0'; |
Denis Vlasenko | 69f4f9a | 2008-08-09 17:16:40 +0000 | [diff] [blame] | 221 | |
| 222 | #if 0 /* unused so far */ |
| 223 | if (flags & PARSE_ESCAPE) { |
Denys Vlasenko | 5360059 | 2010-10-23 21:06:06 +0200 | [diff] [blame] | 224 | strcpy_and_process_escape_sequences(tokens[t], tokens[t]); |
Denis Vlasenko | 69f4f9a | 2008-08-09 17:16:40 +0000 | [diff] [blame] | 225 | } |
| 226 | #endif |
Denis Vlasenko | 69f4f9a | 2008-08-09 17:16:40 +0000 | [diff] [blame] | 227 | /* Skip possible delimiters */ |
| 228 | if (flags & PARSE_COLLAPSE) |
| 229 | line += strspn(line, delims + 1); |
Denys Vlasenko | 63144be | 2010-06-26 04:00:52 +0200 | [diff] [blame] | 230 | |
| 231 | t++; |
| 232 | } while (*line && *line != delims[0] && t < ntokens); |
Denis Vlasenko | e559e0a | 2008-07-15 21:09:30 +0000 | [diff] [blame] | 233 | |
Denis Vlasenko | 69f4f9a | 2008-08-09 17:16:40 +0000 | [diff] [blame] | 234 | if (t < mintokens) { |
Denis Vlasenko | 5415c85 | 2008-07-21 23:05:26 +0000 | [diff] [blame] | 235 | bb_error_msg("bad line %u: %d tokens found, %d needed", |
Denis Vlasenko | 69f4f9a | 2008-08-09 17:16:40 +0000 | [diff] [blame] | 236 | parser->lineno, t, mintokens); |
Denis Vlasenko | 5415c85 | 2008-07-21 23:05:26 +0000 | [diff] [blame] | 237 | if (flags & PARSE_MIN_DIE) |
| 238 | xfunc_die(); |
| 239 | goto again; |
| 240 | } |
Denis Vlasenko | e559e0a | 2008-07-15 21:09:30 +0000 | [diff] [blame] | 241 | |
Denis Vlasenko | 69f4f9a | 2008-08-09 17:16:40 +0000 | [diff] [blame] | 242 | return t; |
Denis Vlasenko | e559e0a | 2008-07-15 21:09:30 +0000 | [diff] [blame] | 243 | } |