/*
* argv_parse.c --- utility function for parsing a string into an
* argc, argv array.
*
* This file defines a function argv_parse() which parses a
* passed-in string, handling double quotes and backslashes, and
* creates an allocated argv vector which can be freed using the
* argv_free() function.
*
* See argv_parse.h for the formal definition of the functions.
*
* Copyright 1999 by Theodore Ts'o.
*
* Permission to use, copy, modify, and distribute this software for
* any purpose with or without fee is hereby granted, provided that
* the above copyright notice and this permission notice appear in all
* copies. THE SOFTWARE IS PROVIDED "AS IS" AND THEODORE TS'O (THE
* AUTHOR) DISCLAIMS ALL WARRANTIES WITH REGARD TO THIS SOFTWARE,
* INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS.
* IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY SPECIAL, DIRECT,
* INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES WHATSOEVER
* RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN ACTION
* OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF OR
* IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. (Isn't
* it sick that the U.S. culture of lawsuit-happy lawyers requires
* this kind of disclaimer?)
*
* Version 1.1, modified 2/27/1999
*/
#ifdef HAVE_STDLIB_H
#include <stdlib.h>
#endif
#include <ctype.h>
#include <string.h>
#include "argv_parse.h"
/* Scanner states used by argv_parse(). */
#define STATE_WHITESPACE	1	/* between words */
#define STATE_TOKEN		2	/* inside an unquoted part of a word */
#define STATE_QUOTED		3	/* inside a double-quoted part of a word */

/*
 * Split in_buf into words and build a NULL-terminated argv vector.
 *
 * Words are separated by whitespace.  A double quote toggles quoted
 * mode, in which whitespace and backslashes are copied literally; the
 * quote characters themselves are dropped.  Outside quotes a backslash
 * escapes the next character: \n, \t and \b become newline, tab and
 * backspace, any other character is taken literally, and a backslash at
 * the very end of the input stands for itself.  in_buf is not modified.
 *
 * in_buf   - NUL-terminated string to parse; NULL is rejected.
 * ret_argc - if non-NULL, receives the number of words found.
 * ret_argv - if non-NULL, receives the allocated vector.  All words live
 *            in one allocation whose start is argv[0]; when no words
 *            were found the vector holds only the terminating NULL.
 *            If ret_argv is NULL the vector is released before
 *            returning, so the call can be used just to count words.
 *
 * Returns 0 on success, -1 on failure (NULL input or out of memory).
 * On failure nothing is stored through ret_argc or ret_argv.
 */
int argv_parse(char *in_buf, int *ret_argc, char ***ret_argv)
{
	int	argc = 0, max_argc = 0;
	char	**argv = NULL, **new_argv;
	char	*buf, *cp, *outcp, ch;
	int	state = STATE_WHITESPACE;

	if (!in_buf)
		return -1;

	/*
	 * Every input character produces at most one output character,
	 * plus one final terminator, so strlen()+1 bytes always suffice.
	 */
	buf = malloc(strlen(in_buf) + 1);
	if (!buf)
		return -1;
	outcp = buf;

	for (cp = in_buf; (ch = *cp); cp++) {
		if (state == STATE_WHITESPACE) {
			/* The cast keeps isspace() defined for bytes >= 0x80 */
			if (isspace((unsigned char) ch))
				continue;
			/* Not whitespace, so start a new token */
			state = STATE_TOKEN;
			if (argc >= max_argc) {
				/* +1 leaves room for the terminating NULL */
				max_argc += 3;
				new_argv = realloc(argv,
						   (max_argc + 1) * sizeof(char *));
				if (!new_argv)
					goto fail;
				argv = new_argv;
			}
			argv[argc++] = outcp;
			/* fall through and process ch as part of the token */
		}
		if (state == STATE_QUOTED) {
			if (ch == '"')
				state = STATE_TOKEN;
			else
				*outcp++ = ch;
			continue;
		}
		/* Must be processing characters in a word */
		if (isspace((unsigned char) ch)) {
			/*
			 * Terminate the current word and start
			 * looking for the beginning of the next word.
			 */
			*outcp++ = '\0';
			state = STATE_WHITESPACE;
			continue;
		}
		if (ch == '"') {
			state = STATE_QUOTED;
			continue;
		}
		if (ch == '\\') {
			ch = *++cp;
			switch (ch) {
			case '\0':
				/*
				 * Trailing backslash: keep it, and step back
				 * so the loop sees the terminator next.
				 */
				ch = '\\';
				cp--;
				break;
			case 'n':
				ch = '\n';
				break;
			case 't':
				ch = '\t';
				break;
			case 'b':
				ch = '\b';
				break;
			default:
				/* any other escaped character is literal */
				break;
			}
		}
		*outcp++ = ch;
	}
	if (state != STATE_WHITESPACE)
		*outcp++ = '\0';

	if (!argv) {
		/* No words: the string buffer is not needed at all. */
		free(buf);
		buf = NULL;
		argv = malloc(sizeof(char *));
		if (!argv)
			return -1;
	}
	argv[argc] = NULL;

	if (ret_argc)
		*ret_argc = argc;
	if (ret_argv) {
		*ret_argv = argv;
	} else {
		/* Nobody can free the vector later, so do it here. */
		free(buf);
		free(argv);
	}
	return 0;

fail:
	free(argv);
	free(buf);
	return -1;
}
/*
 * Release a vector returned by argv_parse().
 *
 * argv_parse() stores every word in one allocation whose start is
 * argv[0], so freeing argv[0] and then the vector itself releases
 * everything.  For an empty vector argv[0] is NULL, and free(NULL) is a
 * no-op.  A NULL argv is accepted and ignored.
 */
void argv_free(char **argv)
{
	if (!argv)
		return;
	free(argv[0]);
	free(argv);
}
#ifdef DEBUG
/*
* For debugging
*/
#include <stdio.h>
/*
 * Debug driver: read lines from stdin, run each through argv_parse()
 * and print the resulting words as a quoted, comma-separated list.
 * Stops at end of file or on a read error.
 */
int main(int argc, char **argv)
{
	char	line[256];
	char	**vec, **word;
	int	count, rc;

	for (;;) {
		if (feof(stdin))
			break;
		if (!fgets(line, sizeof(line), stdin))
			break;

		rc = argv_parse(line, &count, &vec);
		if (rc != 0) {
			printf("Argv_parse returned %d!\n", rc);
			continue;
		}

		printf("Argv_parse returned %d arguments...\n", count);
		word = vec;
		while (*word) {
			/* separator goes before every word except the first */
			if (word != vec)
				printf(", ");
			printf("'%s'", *word);
			word++;
		}
		printf("\n");
		argv_free(vec);
	}
	return 0;
}
#endif /* DEBUG */