mirror of
https://github.com/bkaradzic/bx.git
synced 2026-02-17 20:52:37 +01:00
Added command line tokenizer.
This commit is contained in:
146
include/bx/tokenizecmd.h
Normal file
146
include/bx/tokenizecmd.h
Normal file
@@ -0,0 +1,146 @@
|
||||
/*
|
||||
* Copyright 2012-2014 Branimir Karadzic. All rights reserved.
|
||||
* License: http://www.opensource.org/licenses/BSD-2-Clause
|
||||
*/
|
||||
|
||||
#ifndef BX_TOKENIZE_CMD_H_HEADER_GUARD
|
||||
#define BX_TOKENIZE_CMD_H_HEADER_GUARD
|
||||
|
||||
#include <stdint.h>
|
||||
#include <stdio.h>
|
||||
#include <ctype.h>
|
||||
|
||||
namespace bx
|
||||
{
|
||||
// Reference:
|
||||
// http://msdn.microsoft.com/en-us/library/a1y7w461.aspx
|
||||
static inline const char* tokenizeCommandLine(const char* _commandLine, char* _buffer, uint32_t& _bufferSize, int& _argc, char* _argv[], int _maxArgvs, char _term = '\0')
|
||||
{
|
||||
int argc = 0;
|
||||
const char* curr = _commandLine;
|
||||
char* currOut = _buffer;
|
||||
char term = ' ';
|
||||
bool sub = false;
|
||||
|
||||
enum ParserState
|
||||
{
|
||||
SkipWhitespace,
|
||||
SetTerm,
|
||||
Copy,
|
||||
Escape,
|
||||
End,
|
||||
};
|
||||
|
||||
ParserState state = SkipWhitespace;
|
||||
|
||||
while ('\0' != *curr
|
||||
&& _term != *curr
|
||||
&& argc < _maxArgvs)
|
||||
{
|
||||
switch (state)
|
||||
{
|
||||
case SkipWhitespace:
|
||||
for (; isspace(*curr); ++curr) {}; // skip whitespace
|
||||
state = SetTerm;
|
||||
break;
|
||||
|
||||
case SetTerm:
|
||||
if ('"' == *curr)
|
||||
{
|
||||
term = '"';
|
||||
++curr; // skip begining quote
|
||||
}
|
||||
else
|
||||
{
|
||||
term = ' ';
|
||||
}
|
||||
|
||||
_argv[argc] = currOut;
|
||||
++argc;
|
||||
|
||||
state = Copy;
|
||||
break;
|
||||
|
||||
case Copy:
|
||||
if ('\\' == *curr)
|
||||
{
|
||||
state = Escape;
|
||||
}
|
||||
else if ('"' == *curr
|
||||
&& '"' != term)
|
||||
{
|
||||
sub = !sub;
|
||||
}
|
||||
else if (isspace(*curr) && !sub)
|
||||
{
|
||||
state = End;
|
||||
}
|
||||
else if (term != *curr || sub)
|
||||
{
|
||||
*currOut = *curr;
|
||||
++currOut;
|
||||
}
|
||||
else
|
||||
{
|
||||
state = End;
|
||||
}
|
||||
++curr;
|
||||
break;
|
||||
|
||||
case Escape:
|
||||
{
|
||||
const char* start = --curr;
|
||||
for (; '\\' == *curr; ++curr) {};
|
||||
|
||||
if ('"' != *curr)
|
||||
{
|
||||
int count = (int)(curr-start);
|
||||
|
||||
curr = start;
|
||||
for (int ii = 0; ii < count; ++ii)
|
||||
{
|
||||
*currOut = *curr;
|
||||
++currOut;
|
||||
++curr;
|
||||
}
|
||||
}
|
||||
else
|
||||
{
|
||||
curr = start+1;
|
||||
*currOut = *curr;
|
||||
++currOut;
|
||||
++curr;
|
||||
}
|
||||
}
|
||||
state = Copy;
|
||||
break;
|
||||
|
||||
case End:
|
||||
*currOut = '\0';
|
||||
++currOut;
|
||||
state = SkipWhitespace;
|
||||
break;
|
||||
}
|
||||
}
|
||||
|
||||
*currOut = '\0';
|
||||
if (0 < argc
|
||||
&& '\0' == _argv[argc-1][0])
|
||||
{
|
||||
--argc;
|
||||
}
|
||||
|
||||
_bufferSize = (uint32_t)(currOut - _buffer);
|
||||
_argc = argc;
|
||||
|
||||
if ('\0' != *curr)
|
||||
{
|
||||
++curr;
|
||||
}
|
||||
|
||||
return curr;
|
||||
}
|
||||
|
||||
} // namespace bx
|
||||
|
||||
#endif // TOKENIZE_CMD_H_HEADER_GUARD
|
||||
72
tests/tokenizecmd.cpp
Normal file
72
tests/tokenizecmd.cpp
Normal file
@@ -0,0 +1,72 @@
|
||||
/*
|
||||
* Copyright 2012-2014 Branimir Karadzic. All rights reserved.
|
||||
* License: http://www.opensource.org/licenses/BSD-2-Clause
|
||||
*/
|
||||
|
||||
#include "test.h"
|
||||
#include <bx/tokenizecmd.h>
|
||||
#include <string.h>
|
||||
|
||||
TEST(tokenizeCommandLine)
|
||||
{
|
||||
const char* input[] =
|
||||
{
|
||||
" ",
|
||||
"\\",
|
||||
// "\"a b c\" d e",
|
||||
"\"ab\\\"c\" \"\\\\\" d",
|
||||
"a\\\\\\b d\"e f\"g h",
|
||||
"a\\\\\\\"b c d",
|
||||
"a\\\\\\\\\"b c\" d e",
|
||||
};
|
||||
|
||||
const int expected_argc[] =
|
||||
{
|
||||
0,
|
||||
0,
|
||||
// 3,
|
||||
3,
|
||||
3,
|
||||
3,
|
||||
3
|
||||
};
|
||||
|
||||
const char* expected_results[] =
|
||||
{
|
||||
"a b c", "d", "e",
|
||||
"ab\"c", "\\", "d",
|
||||
"a\\\\\\b", "de fg", "h",
|
||||
"a\\\"b", "c", "d",
|
||||
"a\\\\b c", "d", "e",
|
||||
};
|
||||
|
||||
const char** expected_argv[] =
|
||||
{
|
||||
NULL,
|
||||
NULL,
|
||||
// &expected_results[0],
|
||||
&expected_results[3],
|
||||
&expected_results[6],
|
||||
&expected_results[9],
|
||||
&expected_results[12],
|
||||
};
|
||||
|
||||
for (uint32_t ii = 0; ii < BX_COUNTOF(exptected_argv); ++ii)
|
||||
{
|
||||
printf("x\n");
|
||||
char commandLine[1024];
|
||||
uint32_t size = BX_COUNTOF(commandLine);
|
||||
char* argv[50];
|
||||
int32_t argc;
|
||||
bx::tokenizeCommandLine(input[ii], commandLine, size, argc, argv, BX_COUNTOF(argv) );
|
||||
printf("\n%d (%d): %s %s\n", ii, argc, input[ii], expected_argc[ii] == argc ? "" : "FAILED!");
|
||||
for (uint32_t jj = 0; jj < argc; ++jj)
|
||||
{
|
||||
printf("\t%d: {%s} %s\n"
|
||||
, jj
|
||||
, argv[jj]
|
||||
, jj < argc ? (0==strcmp(argv[jj], expected_argv[ii][jj]) ? "" : "FAILED!") : "FAILED!"
|
||||
);
|
||||
}
|
||||
}
|
||||
}
|
||||
Reference in New Issue
Block a user