blob: d49ba98b94da6ea71aae090aa6eeef67eb2a9283 [file] [log] [blame]
/*
*------------------------------------------------------------------
* Copyright (c) 2006-2016 Cisco and/or its affiliates.
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at:
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
/* Break up a delimited string into a vector of substrings */
#include <stdio.h>
#include <vppinfra/clib.h>
#include <vppinfra/vec.h>
#include <vppinfra/hash.h>
#include <stdarg.h>
/*
* #define UNIT_TESTS 1
* #define MATCH_TRACE 1
*/
/*
* delsvec
* break up an input string into a vector of [null-terminated] u8 *'s
*
* Each supplied delimiter character results in a string in the output
* vector, unless the delimiters occur back-to-back. When matched,
* a whitespace character in the delimiter consumes an arbitrary
* run of whitespace. See the unit tests at the end of this file
* for a set of examples.
*
* Returns a u8 **, or NULL if the input fails to match. It is assumed
* that both input and fmt are C strings, not necessarily vectors.
*
* Output strings are both vectors and proper C strings.
*/
static u8 **string_cache;
static u8 **svec_cache;
void
delsvec_recycle_this_string (u8 *s)
{
if (s)
{
vec_set_len (s, 0);
vec_add1 (string_cache, s);
}
}
void
delsvec_recycle_this_svec (u8 **svec)
{
if (svec)
{
if (svec_cache)
{
vec_free (svec_cache);
}
vec_set_len (svec, 0);
svec_cache = svec;
}
}
int
pvl (char *a)
{
return vec_len (a);
}
u8 **
delsvec (void *input_arg, char *fmt)
{
u8 **rv = 0;
int input_index = 0;
u8 *this;
int dirflag = 0;
int i;
u8 *input = input_arg;
if (svec_cache)
{
rv = svec_cache;
svec_cache = 0;
}
while (fmt)
{
dirflag = 0;
if (vec_len (string_cache) > 0)
{
this = string_cache[vec_len (string_cache) - 1];
vec_set_len (string_cache, vec_len (string_cache) - 1);
}
else
this = 0;
/*
* '*' means one of two things: match the rest of the input,
* or match as many characters as possible
*/
if (fmt[0] == '*')
{
fmt++;
dirflag = 1;
/*
* no more format: eat rest of string...
*/
if (!fmt[0])
{
for (; input[input_index]; input_index++)
vec_add1 (this, input[input_index]);
if (vec_len (this))
{
vec_add1 (this, 0);
#ifdef MATCH_TRACE
printf ("final star-match adds: '%s'\n", this);
#endif
vec_add1 (rv, this);
}
else
{
vec_add1 (string_cache, this);
}
return (rv);
}
}
/*
* Left-to-right scan, adding chars until next delimiter char
* appears.
*/
if (!dirflag)
{
while (input[input_index])
{
if (input[input_index] == fmt[0])
{
/* If we just (exact) matched a whitespace delimiter */
if (fmt[0] == ' ')
{
/* scan forward eating whitespace */
while (input[input_index] == ' ' ||
input[input_index] == '\t' ||
input[input_index] == '\n')
input_index++;
input_index--;
}
goto found;
}
/* If we're looking for whitespace */
if (fmt[0] == ' ')
{
/* and we have whitespace */
if (input[input_index] == ' ' ||
input[input_index] == '\t' || input[input_index] == '\n')
{
/* scan forward eating whitespace */
while (input[input_index] == ' ' ||
input[input_index] == '\t' ||
input[input_index] == '\n')
{
input_index++;
}
input_index--;
goto found;
}
}
/* Not a delimiter, save it */
vec_add1 (this, input[input_index]);
input_index++;
}
/*
* Fell off the wagon, clean up and bail out
*/
bail:
#ifdef MATCH_TRACE
printf ("failed, fmt[0] = '%c', input[%d]='%s'\n", fmt[0],
input_index, &input[input_index]);
#endif
delsvec_recycle_this_string (this);
for (i = 0; i < vec_len (rv); i++)
delsvec_recycle_this_string (rv[i]);
delsvec_recycle_this_svec (rv);
return (0);
found:
/*
* Delimiter matched
*/
input_index++;
fmt++;
/*
* If we actually accumulated non-delimiter characters,
* add them to the result vector
*/
if (vec_len (this))
{
vec_add1 (this, 0);
#ifdef MATCH_TRACE
printf ("match: add '%s'\n", this);
#endif
vec_add1 (rv, this);
}
else
{
vec_add1 (string_cache, this);
}
}
else
{
/*
* right-to-left scan, '*' not at
* the end of the delimiter string
*/
i = input_index;
while (input[++i])
; /* scan forward */
i--;
while (i > input_index)
{
if (input[i] == fmt[0])
goto found2;
if (fmt[0] == ' ' || fmt[0] == '\t' || fmt[0] == '\n')
{
if (input[i] == ' ' || input[i] == '\t' || input[i] == '\n')
goto found2;
}
i--;
}
goto bail;
found2:
for (; input_index < i; input_index++)
{
vec_add1 (this, input[input_index]);
}
input_index++;
fmt++;
vec_add1 (this, 0);
#ifdef MATCH_TRACE
printf ("inner '*' match: add '%s'\n", this);
#endif
vec_add1 (rv, this);
}
}
return (rv);
}
#ifdef UNIT_TESTS
typedef struct utest_
{
char *string;
char *fmt;
} utest_t;
utest_t tests[] = {
#ifdef NOTDEF
{ "Dec 7 08:56", " :*" },
{ "Dec 17 08:56", " :*" },
{ "Dec 7 08:56:41.239 install/inst_repl 0/9/CPU0 t1 [40989] File "
"List:Successfully blobbified file list. Took 1 milliseconds",
" ::. / // [] *" },
{ "RP/0/9/CPU0:Dec 7 08:55:28.550 : sam_server[291]: SAM backs up digest "
"list to memory file",
"///: ::. : []: *" },
/* Expected to fail */
{ "Dec 7 08:56:41.239 install/inst_repl 0/9/CPU0 t1 [40989] File "
"List:Successfully blobbified file list. Took 1 milliseconds",
"///: ::. : : *" },
/* Expected to fail */
{ "RP/0/9/CPU0:Dec 7 08:55:28.550 : sam_server[291]: SAM backs up digest "
"list to memory file",
" ::. / // [] *" },
{ "THIS that and + theother", "*+ *" },
{ "Dec 12 15:33:07.103 ifmgr/errors 0/RP0/CPU0 3# t2 Failed to open IM "
"connection: No such file or directory",
" ::. / // *" },
{ "Dec 16 21:43:47.328 ifmgr/bulk 0/3/CPU0 t8 Bulk DPC async download "
"complete. Partitions 1, node_count 1, total_out 0, out_offset 0, "
"out_expected 0: No error",
" ::. / // *" },
{ "t:0x53034bd6 CPU:00 PROCESS :PROCCREATE_NAME", ": : :*" },
{ " pid:1", " *" },
{ "t:0x53034cbb CPU:00 THREAD :THCREATE pid:1 tid:1",
": : : pid: tid:*" },
{ "t:0x5303f950 CPU:00 COMM :REC_PULSE scoid:0x40000003 pid:364659",
": : : *" },
{ "/hfr-base-3.3.85/lib/libttyconnection.dll 0xfc000000 0x0000306c "
"0xfc027000 0x000001c8 1",
" *" },
{ "Feb 28 02:38:26.123 seqtrace 0/1/CPU0 t8 "
":msg_receive:ifmgr/t8:IMC_MSG_MTU_UPDATE:ppp_ma/t1",
" ::. // ::::*" },
{ "Feb 28 02:38:26.123 seqtrace 0/1/CPU0 t8 "
":msg_send_event:call:ifmgr/t8:124/0:cdp/t1",
" ::. // :msg_send_event::::*" },
{ "Feb 28 02:38:26.125 seqtrace 0/1/CPU0 t1 "
":msg_receive_event:cdp/t1:124/0",
" ::. // :msg_receive_event::*" } {
"t:0x645dd86d CPU:00 USREVENT:EVENT:100, d0:0x00000002 d1:0x00000000",
": : USREVENT:EVENT:, d0: *" } {
"t:0x5303f950 CPU:00 COMM :REC_PULSE scoid:0x40000003 pid:364659",
": : : *" },
{ "t:0x2ccf9f5a CPU:00 INT_ENTR:0x80000000 (-2147483648) "
"IP:0x002d8b18",
": : INT_ENTR: IP:*" } {
"t:0xd473951c CPU:00 KER_EXIT:SCHED_GET/88 ret_val:2 sched_priority:10",
": : KER_EXIT:SCHED_GET : sched_priority:*" } {
"t:0x00000123 CPU:01 SYSTEM :FUNC_ENTER thisfn:0x40e62048 "
"call_site:0x00000000",
": : SYSTEM :FUNC_ thisfn: *" },
{ "t:0x5af8de95 CPU:00 INT_HANDLER_ENTR:0x0000004d (77) PID:8200 "
"IP:0x00000000 AREA:0x0bf9b290",
": : INT_HANDLER_*" },
#endif
{ "t:0x6d1ff92f CPU:00 CONTROL: BUFFER sequence = 1053, num_events = 714",
": : CONTROL*" },
{ "t:0x6d1ff92f CPU:00 CONTROL :TIME msb:0x0000003c lsb(offset):0x6d1ff921",
": : CONTROL*" },
};
int
main (int argc, char **argv)
{
int i, j;
u8 **svec;
for (j = 0; j < ARRAY_LEN (tests); j++)
{
printf ("input string: '%s'\n", tests[j].string);
printf ("delimiter arg: '%s'\n", tests[j].fmt);
printf ("parse trace:\n");
svec = delsvec (tests[j].string, tests[j].fmt);
if (!svec)
{
printf ("index %d failed\n", j);
continue;
}
printf ("%d substring vectors\n", vec_len (svec));
for (i = 0; i < vec_len (svec); i++)
{
printf ("[%d]: '%s'\n", i, svec[i]);
}
printf ("-------------------\n");
}
exit (0);
}
#endif