/* argcv.c - simple functions for parsing input based on whitespace Copyright (C) 1999, 2000, 2001, 2007, 2009, 2010 Free Software Foundation, Inc. This library is free software; you can redistribute it and/or modify it under the terms of the GNU Lesser General Public License as published by the Free Software Foundation; either version 3 of the License, or (at your option) any later version. This library is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU Lesser General Public License for more details. You should have received a copy of the GNU Lesser General Public License along with this library; if not, write to the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA */ #ifdef HAVE_CONFIG_H # include #endif #include #include /* * takes a string and splits it into several strings, breaking at ' ' * command is the string to split * the number of strings is placed into argc * the split strings are put into argv * returns 0 on success, nonzero on failure */ #define isws(c) ((c)==' '||(c)=='\t'||(c)=='\n') #define isdelim(c,delim) ((c)=='"'||strchr(delim,(c))!=NULL) static int argcv_scan (int len, const char *command, const char *delim, const char* cmnt, int *start, int *end, int *save) { int i = 0; for (;;) { i = *save; if (i >= len) return i + 1; /* Skip initial whitespace */ while (i < len && isws (command[i])) i++; *start = i; switch (command[i]) { case '"': case '\'': while (++i < len && (command[i] != command[*start] || command[i-1] == '\\')) ; if (i < len) /* found matching quote */ break; /*FALLTHRU*/ default: if (isdelim (command[i], delim)) break; /* Skip until next whitespace character or end of line. Honor escaped whitespace. */ while (++i < len && !((isws (command[i]) && command[i-1] != '\\') || isdelim (command[i], delim))); i--; break; } *end = i; *save = i + 1; /* If we have a token, and it starts with a comment character, skip to the newline and restart the token search. */ if (*save <= len) { if (cmnt && strchr (cmnt, command[*start]) != NULL) { i = *save; while (i < len && command[i] != '\n') i++; *save = i; continue; } } break; } return *save; } static char escape_transtab[] = "\\\\a\ab\bf\fn\nr\rt\t"; int argcv_unescape_char (int c) { char *p; for (p = escape_transtab; *p; p += 2) { if (*p == c) return p[1]; } return c; } int argcv_escape_char (int c) { char *p; for (p = escape_transtab + sizeof(escape_transtab) - 2; p > escape_transtab; p -= 2) { if (*p == c) return p[-1]; } return -1; } static int xtonum (const char *src, int base, size_t cnt) { int val; char *p; char tmp[4]; /* At most three characters + zero */ /* Notice: No use to check `cnt'. It should be either 2 or 3 */ memcpy (tmp, src, cnt); tmp[cnt] = 0; val = strtoul (tmp, &p, base); return (*p == 0) ? val : -1; } static size_t escaped_length (const char *str, int *quote) { size_t len = 0; for (; *str; str++) { if (*str == ' ') { len++; *quote = 1; } else if (*str == '"') { len += 2; *quote = 1; } else if (isprint ((unsigned char) *str)) len++; else if (argcv_escape_char (*str) != -1) len += 2; else len += 4; } return len; } static void unescape_copy (char *dst, const char *src, size_t n) { int c; while (n > 0) { n--; if (*src == '\\') { switch (*++src) { case 'x': case 'X': ++src; --n; if (n == 0) { *dst++ = '\\'; *dst++ = src[-1]; } else { c = xtonum(src, 16, 2); if (c == -1) { *dst++ = '\\'; *dst++ = src[-1]; } else { *dst++ = c; src += 2; n -= 2; } } break; case '0': ++src; --n; if (n == 0) { *dst++ = '\\'; *dst++ = src[-1]; } else { c = xtonum(src, 8, 3); if (c == -1) { *dst++ = '\\'; *dst++ = src[-1]; } else { *dst++ = c; src += 3; n -= 3; } } break; default: *dst++ = argcv_unescape_char (*src++); n--; } } else { *dst++ = *src++; } } *dst = 0; } static void escape_copy (char *dst, const char *src) { for (; *src; src++) { if (*src == '"') { *dst++ = '\\'; *dst++ = '"'; } else if (*src != '\t' && isprint ((unsigned char) *src)) *dst++ = *src; else { int c = argcv_escape_char (*src); *dst++ = '\\'; if (c != -1) *dst++ = c; else { char tmp[4]; snprintf (tmp, sizeof tmp, "%03o", *(unsigned char*)src); memcpy (dst, tmp, 3); dst += 3; } } } } int argcv_get (const char *command, const char *delim, const char* cmnt, int *argc, char ***argv) { int len = strlen (command); int i = 0; int start, end, save; *argv = NULL; /* Count number of arguments */ *argc = 0; save = 0; while (argcv_scan (len, command, delim, cmnt, &start, &end, &save) <= len) (*argc)++; *argv = calloc ((*argc + 1), sizeof (char *)); i = 0; save = 0; for (i = 0; i < *argc; i++) { int n; argcv_scan (len, command, delim, cmnt, &start, &end, &save); if ((command[start] == '"' || command[end] == '\'') && command[end] == command[start]) { start++; end--; } n = end - start + 1; (*argv)[i] = calloc (n+1, sizeof (char)); if ((*argv)[i] == NULL) return 1; unescape_copy ((*argv)[i], &command[start], n); (*argv)[i][n] = 0; } (*argv)[i] = NULL; return 0; } /* * frees all elements of an argv array * argc is the number of elements * argv is the array */ int argcv_free (int argc, char **argv) { while (--argc >= 0) if (argv[argc]) free (argv[argc]); free (argv); return 1; } /* Take a argv an make string separated by ' '. */ int argcv_string (int argc, char **argv, char **pstring) { size_t i, j, len; char *buffer; /* No need. */ if (pstring == NULL) return 1; buffer = malloc (1); if (buffer == NULL) return 1; *buffer = '\0'; for (len = i = j = 0; i < argc; i++) { int quote = 0; int toklen; toklen = escaped_length (argv[i], "e); len += toklen + 2; if (quote) len += 2; buffer = realloc (buffer, len); if (buffer == NULL) return 1; if (i != 0) buffer[j++] = ' '; if (quote) buffer[j++] = '"'; escape_copy (buffer + j, argv[i]); j += toklen; if (quote) buffer[j++] = '"'; } for (; j > 0 && isspace ((unsigned char) buffer[j - 1]); j--) ; buffer[j] = 0; if (pstring) *pstring = buffer; return 0; } #if 0 char *command = "set prompt=\"& \a\\\"\" \\x25\\0145\\098\\ta"; main(int xargc, char **xargv) { int i, argc; char **argv; char *s; argcv_get (xargv[1] ? xargv[1]:command, "=", "#", &argc, &argv); printf ("%d args:\n", argc); for (i = 0; i < argc; i++) printf ("%s\n", argv[i]); printf ("===\n"); argcv_string (argc, argv, &s); printf ("%s\n", s); } #endif