ossp-pkg/var/var.c
1.36
/*
** VAR - OSSP variable expression library.
** Copyright (c) 2001 The OSSP Project (http://www.ossp.org/)
** Copyright (c) 2001 Cable & Wireless Deutschland (http://www.cw.com/de/)
**
** This file is part of OSSP VAR, an extensible data serialization
** library which can be found at http://www.ossp.org/pkg/var/.
**
** Permission to use, copy, modify, and distribute this software for
** any purpose with or without fee is hereby granted, provided that
** the above copyright notice and this permission notice appear in all
** copies.
**
** THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESSED OR IMPLIED
** WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
** MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
** IN NO EVENT SHALL THE AUTHORS AND COPYRIGHT HOLDERS AND THEIR
** CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
** SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
** LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF
** USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
** ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
** OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
** OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
** SUCH DAMAGE.
**
** var.c: VAR library implementation.
*/
#include <ctype.h>
#include <errno.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <sys/types.h>
#if defined(HAVE_PCREPOSIX)
# include <pcreposix.h>
#else
# include <regex.h>
#endif
#include "var.h"
/* The default configuration for the parser. var_expand() falls back to
   this table when it is called with a NULL configuration pointer. The
   members are listed in the order: variable introducer, opening and
   closing delimiter of a complex expression, escape character, and the
   character-class description of the characters allowed in variable
   names (expanded by expand_character_class()). */
const var_config_t var_config_default = {
'$', /* varinit */
'{', /* startdelim */
'}', /* enddelim */
'\\', /* escape */
"a-zA-Z0-9_" /* namechars */
};
/* The var_strerror() routine will map a var_rc_t into a text message.
   The message table is indexed by the negated return code, so entry N
   must describe the code -N. Codes outside of the table yield the
   string "unknown error". The returned pointer refers to static
   storage and must not be modified or freed by the caller. */
const char *var_strerror(var_rc_t rc)
{
    static const char *const var_errors[] = {
        "OK",                                                                     /* VAR_OK = 0 */
        "incomplete named character",                                             /* VAR_ERR_INCOMPLETE_NAMED_CHARACTER = -1 */
        "incomplete hex",                                                         /* VAR_ERR_INCOMPLETE_HEX = -2 */
        "invalid hex",                                                            /* VAR_ERR_INVALID_HEX = -3 */
        "octal too large",                                                        /* VAR_ERR_OCTAL_TOO_LARGE = -4 */
        "invalid octal",                                                          /* VAR_ERR_INVALID_OCTAL = -5 */
        "incomplete octal",                                                       /* VAR_ERR_INCOMPLETE_OCTAL = -6 */
        "incomplete grouped hex",                                                 /* VAR_ERR_INCOMPLETE_GROUPED_HEX = -7 */
        "incorrect character class specification",                                /* VAR_ERR_INCORRECT_CLASS_SPEC = -8 */
        "var_expand() configuration is inconsistent",                             /* VAR_ERR_INVALID_CONFIGURATION = -9 */
        "out of memory",                                                          /* VAR_ERR_OUT_OF_MEMORY = -10 */
        "incomplete variable",                                                    /* VAR_ERR_INCOMPLETE_VARIABLE_SPEC = -11 */
        "undefined variable",                                                     /* VAR_ERR_UNDEFINED_VARIABLE = -12 */
        "input is neither text nor variable",                                     /* VAR_ERR_INPUT_ISNT_TEXT_NOR_VARIABLE = -13 */
        "unknown command in variable",                                            /* VAR_ERR_UNKNOWN_COMMAND_CHAR = -14 */
        /* Placeholder: the code numbering below skips -15, so this slot
           keeps every following message aligned with its code.
           NOTE(review): confirm against the enum in var.h. */
        "unknown error",                                                          /* (no code listed for -15) */
        "malformated search and replace operation",                               /* VAR_ERR_MALFORMATTED_REPLACE = -16 */
        "unknown flag specified in search and replace operation",                 /* VAR_ERR_UNKNOWN_REPLACE_FLAG = -17 */
        "invalid regular expression in search and replace operation",             /* VAR_ERR_INVALID_REGEX_IN_REPLACE = -18 */
        "missing parameter in command",                                           /* VAR_ERR_MISSING_PARAMETER_IN_COMMAND = -19 */
        "empty search string in search and replace operation",                    /* VAR_ERR_EMPTY_SEARCH_STRING = -20 */
        "start offset missing in cut operation",                                  /* VAR_ERR_MISSING_START_OFFSET = -21 */
        "offsets in cut operation delimited by unknown character",                /* VAR_ERR_INVALID_OFFSET_DELIMITER = -22 */
        "range in cut operation is out of bounds",                                /* VAR_ERR_RANGE_OUT_OF_BOUNDS = -23 */
        "offset in cut operation is out of bounds",                               /* VAR_ERR_OFFSET_OUT_OF_BOUNDS = -24 */
        "logic error in cut operation",                                           /* VAR_ERR_OFFSET_LOGIC = -25 */
        "malformatted transpose operation",                                       /* VAR_ERR_MALFORMATTED_TRANSPOSE = -26 */
        "source class does not match destination class in transpose operation",   /* VAR_ERR_TRANSPOSE_CLASSES_MISMATCH = -27 */
        "empty character class in transpose operation",                           /* VAR_ERR_EMPTY_TRANSPOSE_CLASS = -28 */
        "incorrect character class in transpose operation",                       /* VAR_ERR_INCORRECT_TRANSPOSE_CLASS_SPEC = -29 */
        "malformatted padding operation",                                         /* VAR_ERR_MALFORMATTED_PADDING = -30 */
        "width parameter missing in padding operation",                           /* VAR_ERR_MISSING_PADDING_WIDTH = -31 */
        "fill string missing in padding operation",                               /* VAR_ERR_EMPTY_PADDING_FILL_STRING = -32 */
        "unknown quoted pair in search and replace operation",                    /* VAR_ERR_UNKNOWN_QUOTED_PAIR_IN_REPLACE = -33 */
        "submatch referred to in replace string does not exist in search string", /* VAR_ERR_SUBMATCH_OUT_OF_RANGE = -34 */
        "invalid argument",                                                       /* VAR_ERR_INVALID_ARGUMENT = -35 */
        "incomplete quoted pair"                                                  /* VAR_ERR_INCOMPLETE_QUOTED_PAIR = -36 */
    };
    /* Work on a plain int: the negated code is not a value of var_rc_t. */
    int idx = -(int)rc;

    if (idx < 0 || (size_t)idx >= sizeof(var_errors) / sizeof(var_errors[0]))
        return "unknown error";
    return var_errors[idx];
}
/* Routines for manipulation of token buffers. */

/* Size in bytes of the first allocation made by tokenbuf_append() for
   a token buffer that has no text yet. */
#define TOKENBUF_INITIAL_BUFSIZE 64

/* A token buffer describes the text in the range [begin, end).
   buffer_size is the number of bytes allocated at "begin"; a value of
   zero means the text is not held in a buffer of its own (it may point
   into the input or at a constant), in which case tokenbuf_free() does
   not release it and tokenbuf_append() copies it before growing it. */
typedef struct {
const char *begin;
const char *end;
size_t buffer_size;
} tokenbuf_t;
/* Put a token buffer into the empty state: no text and no allocation.
   Nothing is released; whatever the buffer referred to before is simply
   forgotten. */
static void tokenbuf_init(tokenbuf_t *buf)
{
    buf->buffer_size = 0;
    buf->begin = buf->end = NULL;
}
/* Transfer the contents of "src" into "dst" and reset "src" to the
   empty state. The previous contents of "dst" are overwritten without
   being released. */
static void tokenbuf_move(tokenbuf_t *src, tokenbuf_t *dst)
{
    *dst = *src;
    tokenbuf_init(src);
}
/* Make "buf" hold a freshly allocated, NUL-terminated copy of the
   "len" bytes at "data". The previous contents of "buf" are overwritten
   without being released. Returns 1 on success and 0 if the allocation
   failed (in which case "buf" is left untouched). */
static int tokenbuf_assign(tokenbuf_t *buf, const char *data, size_t len)
{
    char *copy = malloc(len + 1);

    if (copy == NULL)
        return 0;
    memcpy(copy, data, len);
    copy[len] = '\0';

    buf->begin = copy;
    buf->end = copy + len;
    buf->buffer_size = len + 1;
    return 1;
}
/* Append the "len" bytes at "data" to the token buffer "output",
   allocating or growing its storage as needed. Whenever bytes are
   copied the text is terminated with a NUL byte. Returns 1 on success
   and 0 if memory could not be obtained. */
static int tokenbuf_append(tokenbuf_t *output, const char *data, size_t len)
{
    size_t used;

    /* A token buffer without any text gets a standard-sized buffer
       to begin with. */
    if (output->begin == NULL) {
        char *fresh = malloc(TOKENBUF_INITIAL_BUFSIZE);

        output->begin = output->end = fresh;
        if (fresh == NULL)
            return 0;
        output->buffer_size = TOKENBUF_INITIAL_BUFSIZE;
    }

    /* The token has text but does not own a buffer. */
    if (output->buffer_size == 0) {
        char *copy;

        /* If the new data directly follows the existing text, moving
           the end pointer is all it takes. */
        if (output->end == data) {
            output->end += len;
            return 1;
        }

        /* Otherwise move the text into a buffer of our own that is
           large enough for the text, the new data and the NUL byte. */
        used = output->end - output->begin;
        copy = malloc(used + len + 1);
        if (copy == NULL)
            return 0;
        memcpy(copy, output->begin, used);
        output->begin = copy;
        output->end = copy + used;
        output->buffer_size = used + len + 1;
    }

    /* Keep doubling the buffer until the data plus the NUL byte fit. */
    used = output->end - output->begin;
    if (output->buffer_size - used <= len) {
        size_t grown = output->buffer_size;
        char *moved;

        do {
            grown *= 2;
        } while (grown - used <= len);
        moved = realloc((char *)output->begin, grown);
        if (moved == NULL)
            return 0;
        output->begin = moved;
        output->end = moved + used;
        output->buffer_size = grown;
    }

    /* Copy the data behind the existing text and terminate it. */
    memcpy((char *)output->end, data, len);
    output->end += len;
    *((char *)output->end) = '\0';
    return 1;
}
/* Release the storage of a token buffer, if it owns any (that is, if
   buffer_size is non-zero), and reset it to the empty state. Calling
   this on an already empty buffer is harmless. */
static void tokenbuf_free(tokenbuf_t *buf)
{
    if (buf->buffer_size > 0 && buf->begin != NULL)
        free((char *)buf->begin);
    buf->buffer_size = 0;
    buf->begin = NULL;
    buf->end = NULL;
}
/* Interpret the text of a token buffer as a decimal number and return
   its value. Every character is treated as a digit without validation
   and no overflow check is made; an empty buffer yields 0. */
static size_t tokenbuf_toint(tokenbuf_t *number)
{
    size_t value = 0;
    const char *digit = number->begin;

    while (digit != number->end) {
        value = value * 10 + (*digit - '0');
        ++digit;
    }
    return value;
}
/* Routines for the expansion of quoted-pair expressions. */

/* A character class: one flag per possible unsigned char value. */
typedef char char_class_t[256]; /* 256 == 2 ^ sizeof(unsigned char)*8 */

/* Mark every character from "a" up to and including "b" as a member
   of "class". Both bounds are interpreted as unsigned char values so
   that characters with the high bit set index the table correctly.
   The counter is wider than a char so that the loop also terminates
   when "b" is the largest character value. If "a" is greater than "b"
   only "a" itself is marked. */
static void expand_range(char a, char b, char_class_t class)
{
    unsigned int lo = (unsigned char)a;
    unsigned int hi = (unsigned char)b;

    do {
        class[lo] = 1;
    } while (lo++ < hi);
}
/* Expand a class description such as "a-zA-Z0-9_" into the lookup
   table "class": on return class[c] is 1 for every character c that is
   a member and 0 otherwise. A sequence "x-y" denotes the range from x
   to y; a '-' that is not followed by another character is taken
   literally. Characters are compared and used as table index by their
   unsigned char value. Returns VAR_OK, or VAR_ERR_INCORRECT_CLASS_SPEC
   if a range has its bounds in descending order. */
static var_rc_t expand_character_class(const char *desc, char_class_t class)
{
    /* Clear the class array. */
    memset(class, 0, sizeof(char_class_t));

    /* Walk through the class description and set the appropriate
       entries in the array. */
    while (*desc != '\0') {
        if (desc[1] == '-' && desc[2] != '\0') {
            if ((unsigned char)desc[0] > (unsigned char)desc[2])
                return VAR_ERR_INCORRECT_CLASS_SPEC;
            expand_range(desc[0], desc[2], class);
            desc += 3;
        } else {
            class[(unsigned char)*desc] = 1;
            ++desc;
        }
    }
    return VAR_OK;
}
/* Return 1 if "c" is an octal digit ('0' to '7'), 0 otherwise. */
static int isoct(char c)
{
    return (c >= '0' && c <= '7') ? 1 : 0;
}
/* Decode the three octal digits at *src into a single character that
   is stored at **dst. On success *dst is advanced past the character
   written and *src is left on the last of the three digits. On error
   neither pointer is moved. Returns VAR_ERR_INCOMPLETE_OCTAL if fewer
   than three characters remain before "end", VAR_ERR_INVALID_OCTAL if
   one of them is not an octal digit and VAR_ERR_OCTAL_TOO_LARGE if the
   first digit is greater than 3 (the value would not fit a byte). */
static var_rc_t expand_octal(const char **src, char **dst, const char *end)
{
    const char *digits = *src;
    unsigned char value;

    if (end - digits < 3)
        return VAR_ERR_INCOMPLETE_OCTAL;
    if (!(isoct(digits[0]) && isoct(digits[1]) && isoct(digits[2])))
        return VAR_ERR_INVALID_OCTAL;
    if (digits[0] - '0' > 3)
        return VAR_ERR_OCTAL_TOO_LARGE;

    value = (unsigned char)((digits[0] - '0') * 64
                            + (digits[1] - '0') * 8
                            + (digits[2] - '0'));
    *src = digits + 2;
    *(*dst)++ = (char)value;
    return VAR_OK;
}
/* Return 1 if "c" is a hexadecimal digit (0-9, a-f or A-F), 0
   otherwise. */
static int ishex(char c)
{
    if (c >= '0' && c <= '9')
        return 1;
    if (c >= 'a' && c <= 'f')
        return 1;
    if (c >= 'A' && c <= 'F')
        return 1;
    return 0;
}
/* Return the numeric value of the hexadecimal digit "c". The caller
   must have verified with ishex() that "c" is a hexadecimal digit. */
static unsigned char hex_digit_value(char c)
{
    if (c >= '0' && c <= '9')
        return (unsigned char)(c - '0');
    if (c >= 'a' && c <= 'f')
        return (unsigned char)(c - 'a' + 10);
    return (unsigned char)(c - 'A' + 10);
}

/* Decode the two hexadecimal digits at *src into a single character
   that is stored at **dst. On success *dst is advanced past the
   character written and *src is left on the second digit. Returns
   VAR_ERR_INCOMPLETE_HEX if fewer than two characters remain before
   "end" and VAR_ERR_INVALID_HEX if one of them is not a hexadecimal
   digit; in both cases neither pointer is moved. */
static var_rc_t expand_simple_hex(const char **src, char **dst,
                                  const char *end)
{
    unsigned char c;

    if (end - *src < 2)
        return VAR_ERR_INCOMPLETE_HEX;
    if (!ishex(**src) || !ishex((*src)[1]))
        return VAR_ERR_INVALID_HEX;

    /* High nibble first, then step to the second digit for the low one. */
    c = (unsigned char)(hex_digit_value(**src) << 4);
    ++(*src);
    c = (unsigned char)(c + hex_digit_value(**src));

    **dst = (char)c;
    ++(*dst);
    return VAR_OK;
}
/* Decode a sequence of hexadecimal digit pairs up to a closing '}'.
   *src must point behind the opening brace. Every pair is decoded with
   expand_simple_hex() and stored through *dst. On success *src is left
   on the closing '}'. Returns VAR_ERR_INCOMPLETE_GROUPED_HEX if "end"
   is reached before the closing brace, or the error reported by
   expand_simple_hex(). */
static var_rc_t expand_grouped_hex(const char **src, char **dst,
                                   const char *end)
{
    for (;;) {
        var_rc_t rc;

        if (*src >= end || **src == '}')
            break;
        rc = expand_simple_hex(src, dst, end);
        if (rc != VAR_OK)
            return rc;
        /* expand_simple_hex() stops on the second digit; skip it. */
        ++(*src);
    }
    return (*src == end) ? VAR_ERR_INCOMPLETE_GROUPED_HEX : VAR_OK;
}
/* Decode a hexadecimal escape whose payload starts at *src: either a
   brace-enclosed group of digit pairs or a single pair of digits.
   Returns VAR_ERR_INCOMPLETE_HEX if nothing is left before "end",
   otherwise the result of the respective decoder. */
static var_rc_t expand_hex(const char **src, char **dst, const char *end)
{
    if (*src == end)
        return VAR_ERR_INCOMPLETE_HEX;
    if (**src != '{')
        return expand_simple_hex(src, dst, end);
    ++(*src);
    return expand_grouped_hex(src, dst, end);
}
/* Expand the backslash escapes in the "len" bytes at "src" and store
   the NUL-terminated result at "dst". Recognized are \n, \t, \r, \\,
   \xHH, \x{HH...} and three-digit octal escapes. For "\\" and for any
   unrecognized escape the backslash is dropped only if "unescape_all"
   is non-zero; otherwise the pair is copied unchanged. The output is
   never longer than the input, so "dst" needs room for len + 1 bytes.
   Returns VAR_OK or the error code describing the malformed escape. */
var_rc_t var_unescape(const char *src, size_t len, char *dst,
                      int unescape_all)
{
    const char *end = src + len;
    var_rc_t rc;

    while (src < end) {
        if (*src != '\\') {
            *dst++ = *src++;
            continue;
        }
        if (++src == end)
            return VAR_ERR_INCOMPLETE_NAMED_CHARACTER;
        switch (*src) {
        case '\\':
            if (!unescape_all)
                *dst++ = '\\';
            *dst++ = '\\';
            break;
        case 'n':
            *dst++ = '\n';
            break;
        case 't':
            *dst++ = '\t';
            break;
        case 'r':
            *dst++ = '\r';
            break;
        case 'x':
            ++src;
            if ((rc = expand_hex(&src, &dst, end)) != VAR_OK)
                return rc;
            break;
        case '0':
        case '1':
        case '2':
        case '3':
        case '4':
        case '5':
        case '6':
        case '7':
        case '8':
        case '9':
            /* <ctype.h> functions require an unsigned char value. */
            if (end - src >= 3
                && isdigit((unsigned char)src[1])
                && isdigit((unsigned char)src[2])) {
                if ((rc = expand_octal(&src, &dst, end)) != VAR_OK)
                    return rc;
                break;
            }
            /* Not a three-digit sequence: treat it like any other
               unrecognized escape. */
            /* FALLTHROUGH */
        default:
            if (!unescape_all)
                *dst++ = '\\';
            *dst++ = *src;
            break;
        }
        /* Step over the last character of the escape sequence. */
        ++src;
    }
    *dst = '\0';
    return VAR_OK;
}
/* The recursive-descent parser for variable expressions. */

/* Forward declarations: expression() calls both variable() and
   command() before their definitions appear, and they in turn lead
   back to expression(). */
static int variable(const char *, const char *, const var_config_t *,
const char_class_t, var_cb_t, void *, int, tokenbuf_t *);
static int command(const char *, const char *, const var_config_t *,
const char_class_t, var_cb_t, void *, int, tokenbuf_t *);
/* Measure the run of plain text at "begin": everything up to "end" or
   up to the first unescaped "varinit" character. An "escape" character
   protects the character that follows it. Returns the length of the
   run, or VAR_ERR_INCOMPLETE_QUOTED_PAIR if the input ends directly
   after an escape character. */
static int text(const char *begin, const char *end, char varinit,
                char escape)
{
    const char *cur = begin;

    while (cur != end && *cur != varinit) {
        if (*cur == escape) {
            if (cur + 1 == end)
                return VAR_ERR_INCOMPLETE_QUOTED_PAIR;
            ++cur;              /* step onto the escaped character */
        }
        ++cur;
    }
    return cur - begin;
}
/* Return the length of the run of characters at "begin" that are
   members of "nameclass"; 0 if the first character is not a member or
   if begin equals end. The table is indexed with the unsigned char
   value so that characters with the high bit set cannot produce a
   negative index. */
static int varname(const char *begin, const char *end,
                   const char_class_t nameclass)
{
    const char *p = begin;

    while (p != end && nameclass[(unsigned char)*p])
        ++p;
    return p - begin;
}
/* Return the length of the run of decimal digits at "begin"; 0 if the
   first character is not a digit or if begin equals end. */
static int number(const char *begin, const char *end)
{
    const char *p = begin;

    /* <ctype.h> functions require an unsigned char value. */
    while (p != end && isdigit((unsigned char)*p))
        ++p;
    return p - begin;
}
/* Measure the run of literal text inside a slash-delimited command
   parameter: everything up to "end", the first unescaped variable
   introducer or the first unescaped '/'. Returns the length of the
   run, or VAR_ERR_INCOMPLETE_QUOTED_PAIR if the input ends directly
   after the escape character. */
static int substext(const char *begin, const char *end,
                    const var_config_t *config)
{
    const char *cur = begin;

    while (cur != end && *cur != config->varinit && *cur != '/') {
        if (*cur == config->escape) {
            if (cur + 1 == end)
                return VAR_ERR_INCOMPLETE_QUOTED_PAIR;
            ++cur;              /* step onto the escaped character */
        }
        ++cur;
    }
    return cur - begin;
}
/* Measure the run of literal text inside an expression: everything up
   to "end", the first unescaped variable introducer, the first
   unescaped closing delimiter or the first unescaped ':'. Returns the
   length of the run, or VAR_ERR_INCOMPLETE_QUOTED_PAIR if the input
   ends directly after the escape character. */
static int exptext(const char *begin, const char *end,
                   const var_config_t *config)
{
    const char *cur = begin;

    for (;;) {
        if (cur == end)
            break;
        if (*cur == config->varinit || *cur == config->enddelim
            || *cur == ':')
            break;
        if (*cur == config->escape) {
            if (cur + 1 == end)
                return VAR_ERR_INCOMPLETE_QUOTED_PAIR;
            ++cur;              /* step onto the escaped character */
        }
        ++cur;
    }
    return cur - begin;
}
/* Parse and expand a complex expression, i.e. the part of a variable
   reference that starts with STARTDELIM: a name (which may itself be
   built from nested variables), optionally followed by ':'-separated
   commands, and the closing ENDDELIM.

   Returns the number of input characters consumed, 0 if the input
   does not start with STARTDELIM, or a negative error code. On success
   "result" holds the expanded text. If the variable is undefined and
   "force_expand" is zero, "result" instead refers to the unexpanded
   source text, starting one character before "begin" (variable()
   calls this function with "begin" pointing just behind VARINIT). On
   error "result" is released. */
static int expression(const char *begin, const char *end,
                      const var_config_t *config,
                      const char_class_t nameclass, var_cb_t lookup,
                      void *lookup_context, int force_expand,
                      tokenbuf_t *result)
{
    const char *p = begin;
    const char *data;
    size_t len, buffer_size;
    int failed = 0;
    int rc;
    tokenbuf_t name;
    tokenbuf_t tmp;

    /* Clear the tokenbufs to make sure we have a defined state. */
    tokenbuf_init(&name);
    tokenbuf_init(&tmp);
    tokenbuf_init(result);

    /* Expect STARTDELIM. */
    if (p == end || *p != config->startdelim)
        return 0;
    if (++p == end)
        return VAR_ERR_INCOMPLETE_VARIABLE_SPEC;

    /* Get the name of the variable to expand. The name may consist of
       an arbitrary number of VARNAMEs and VARIABLEs. */
    do {
        rc = varname(p, end, nameclass);
        if (rc < 0)
            goto error_return;
        if (rc > 0) {
            if (!tokenbuf_append(&name, p, rc)) {
                rc = VAR_ERR_OUT_OF_MEMORY;
                goto error_return;
            }
            p += rc;
        }

        rc = variable(p, end, config, nameclass, lookup, lookup_context,
                      force_expand, &tmp);
        if (rc < 0)
            goto error_return;
        if (rc > 0) {
            if (!tokenbuf_append(&name, tmp.begin, tmp.end - tmp.begin)) {
                rc = VAR_ERR_OUT_OF_MEMORY;
                goto error_return;
            }
            p += rc;
            /* variable() re-initializes its result without releasing
               it, so drop the expanded part before the next round. */
            tokenbuf_free(&tmp);
        }
    } while (rc > 0);

    /* We must have the complete variable name now, so make sure we
       do. */
    if (name.begin == name.end) {
        rc = VAR_ERR_INCOMPLETE_VARIABLE_SPEC;
        goto error_return;
    }

    /* Now we have the name of the variable stored in "name". We
       expect an ENDDELIM or the ':' that introduces commands here. */
    if (p == end || (*p != config->enddelim && *p != ':')) {
        rc = VAR_ERR_INCOMPLETE_VARIABLE_SPEC;
        goto error_return;
    }
    ++p;

    /* Use the lookup callback to get the variable's contents. */
    rc = (*lookup) (lookup_context, name.begin, name.end - name.begin,
                    &data, &len, &buffer_size);
    if (rc < 0)
        goto error_return;
    if (rc == 0) {
        /* The variable is undefined. What we'll do now depends on the
           force_expand flag. */
        if (force_expand) {
            rc = VAR_ERR_UNDEFINED_VARIABLE;
            goto error_return;
        }
        /* Initialize result to point back to the original text in
           the buffer. */
        result->begin = begin - 1;
        result->end = p;
        result->buffer_size = 0;
        failed = 1;
    } else {
        /* The preliminary result is the contents of the variable.
           This may be modified by the commands that may follow. */
        result->begin = data;
        result->end = data + len;
        result->buffer_size = buffer_size;
    }

    if (p[-1] == ':') {
        /* Parse and execute commands. For an undefined variable the
           commands are parsed against the empty "tmp" buffer, which
           only validates and skips them. */
        tokenbuf_free(&tmp);
        --p;
        while (p != end && *p == ':') {
            ++p;
            if (!failed)
                rc = command(p, end, config, nameclass, lookup,
                             lookup_context, force_expand, result);
            else
                rc = command(p, end, config, nameclass, lookup,
                             lookup_context, force_expand, &tmp);
            if (rc < 0)
                goto error_return;
            p += rc;
        }
        if (p == end || *p != config->enddelim) {
            rc = VAR_ERR_INCOMPLETE_VARIABLE_SPEC;
            goto error_return;
        }
        ++p;
        /* The unexpanded text covers everything parsed, including
           every ':' separator and the closing delimiter. */
        if (failed)
            result->end = p;
    }

    /* Exit gracefully. */
    tokenbuf_free(&name);
    tokenbuf_free(&tmp);
    return p - begin;

    /* Exit in case of an error. */
  error_return:
    tokenbuf_free(&name);
    tokenbuf_free(&tmp);
    tokenbuf_free(result);
    return rc;
}
/* Parse and expand a variable reference starting at "begin": VARINIT
   followed either by a plain name or by a complex expression.

   Returns the number of input characters consumed, 0 if the input
   does not start with VARINIT, or a negative error code. "result" is
   reset on entry without releasing its previous contents. On success
   it holds the value delivered by the lookup callback or, for an
   undefined plain name when "force_expand" is zero, it refers to the
   unexpanded source text. */
static int variable(const char *begin, const char *end,
                    const var_config_t *config, const char_class_t nameclass,
                    var_cb_t lookup, void *lookup_context,
                    int force_expand, tokenbuf_t *result)
{
    const char *p = begin;
    const char *data;
    size_t len, buffer_size;
    int namelen;
    int found;

    /* Start from a defined state. */
    tokenbuf_init(result);

    /* The reference has to open with VARINIT and must not end there. */
    if (p == end || *p != config->varinit)
        return 0;
    if (++p == end)
        return VAR_ERR_INCOMPLETE_VARIABLE_SPEC;

    namelen = varname(p, end, nameclass);
    if (namelen < 0)
        return namelen;

    if (namelen == 0) {
        /* No plain name follows, so this has to be a complex
           expression. Account for the VARINIT we consumed. */
        int consumed = expression(p, end, config, nameclass, lookup,
                                  lookup_context, force_expand, result);
        return (consumed > 0) ? consumed + 1 : consumed;
    }

    /* A plain name: ask the callback for its value. */
    found = (*lookup) (lookup_context, p, namelen, &data, &len,
                       &buffer_size);
    if (found < 0)
        return found;
    if (found == 0) {
        if (force_expand)
            return VAR_ERR_UNDEFINED_VARIABLE;
        /* Leave the reference as it is written in the input. */
        result->begin = begin;
        result->end = begin + 1 + namelen;
        result->buffer_size = 0;
    } else {
        result->begin = data;
        result->end = data + len;
        result->buffer_size = buffer_size;
    }
    return 1 + namelen;
}
/* Parse a command parameter that is an arbitrary mix of literal text
   (as recognized by exptext()) and variable references, and collect
   the expanded text in "result".

   Returns the number of input characters consumed (0 if there is
   nothing to parse) or a negative error code, in which case "result"
   is released. */
static int exptext_or_variable(const char *begin, const char *end,
                               const var_config_t *config,
                               const char_class_t nameclass, var_cb_t lookup,
                               void *lookup_context, int force_expand,
                               tokenbuf_t *result)
{
    const char *p = begin;
    tokenbuf_t tmp;
    int rc;

    tokenbuf_init(result);
    tokenbuf_init(&tmp);

    if (begin == end)
        return 0;

    do {
        rc = exptext(p, end, config);
        if (rc < 0)
            goto error_return;
        if (rc > 0) {
            if (!tokenbuf_append(result, p, rc)) {
                rc = VAR_ERR_OUT_OF_MEMORY;
                goto error_return;
            }
            p += rc;
        }

        rc = variable(p, end, config, nameclass, lookup, lookup_context,
                      force_expand, &tmp);
        if (rc < 0)
            goto error_return;
        if (rc > 0) {
            p += rc;
            if (!tokenbuf_append(result, tmp.begin, tmp.end - tmp.begin)) {
                rc = VAR_ERR_OUT_OF_MEMORY;
                goto error_return;
            }
            /* variable() re-initializes its result without releasing
               it, so drop the value before the next round. */
            tokenbuf_free(&tmp);
        }
    } while (rc > 0);

    tokenbuf_free(&tmp);
    return p - begin;

  error_return:
    tokenbuf_free(&tmp);
    tokenbuf_free(result);
    return rc;
}
/* Parse a slash-delimited command parameter that is an arbitrary mix
   of literal text (as recognized by substext()) and variable
   references, and collect the expanded text in "result".

   Returns the number of input characters consumed (0 if there is
   nothing to parse) or a negative error code, in which case "result"
   is released. */
static int substext_or_variable(const char *begin, const char *end,
                                const var_config_t *config,
                                const char_class_t nameclass, var_cb_t lookup,
                                void *lookup_context, int force_expand,
                                tokenbuf_t *result)
{
    const char *p = begin;
    tokenbuf_t tmp;
    int rc;

    tokenbuf_init(result);
    tokenbuf_init(&tmp);

    if (begin == end)
        return 0;

    do {
        rc = substext(p, end, config);
        if (rc < 0)
            goto error_return;
        if (rc > 0) {
            if (!tokenbuf_append(result, p, rc)) {
                rc = VAR_ERR_OUT_OF_MEMORY;
                goto error_return;
            }
            p += rc;
        }

        rc = variable(p, end, config, nameclass, lookup, lookup_context,
                      force_expand, &tmp);
        if (rc < 0)
            goto error_return;
        if (rc > 0) {
            p += rc;
            if (!tokenbuf_append(result, tmp.begin, tmp.end - tmp.begin)) {
                rc = VAR_ERR_OUT_OF_MEMORY;
                goto error_return;
            }
            /* variable() re-initializes its result without releasing
               it, so drop the value before the next round. */
            tokenbuf_free(&tmp);
        }
    } while (rc > 0);

    tokenbuf_free(&tmp);
    return p - begin;

  error_return:
    tokenbuf_free(&tmp);
    tokenbuf_free(result);
    return rc;
}
/* Expand the class description in "src" (single characters and
   ranges written as "x-y") into the explicit list of member
   characters, which is appended to "dst". Range bounds are compared by
   their unsigned char value. Returns VAR_OK,
   VAR_ERR_INCORRECT_TRANSPOSE_CLASS_SPEC if a range has its bounds in
   descending order, or VAR_ERR_OUT_OF_MEMORY. On error "dst" keeps
   whatever was appended so far; releasing it is left to the caller. */
static int expand_class_description(tokenbuf_t *src, tokenbuf_t *dst)
{
    const char *p = src->begin;

    while (p != src->end) {
        if ((src->end - p) >= 3 && p[1] == '-') {
            unsigned int lo = (unsigned char)p[0];
            unsigned int hi = (unsigned char)p[2];
            unsigned int code;

            if (lo > hi)
                return VAR_ERR_INCORRECT_TRANSPOSE_CLASS_SPEC;
            /* The counter is wider than a char so that the loop also
               terminates when the upper bound is 255. */
            for (code = lo; code <= hi; ++code) {
                char ch = (char)code;

                if (!tokenbuf_append(dst, &ch, 1))
                    return VAR_ERR_OUT_OF_MEMORY;
            }
            p += 3;
        } else {
            if (!tokenbuf_append(dst, p, 1))
                return VAR_ERR_OUT_OF_MEMORY;
            ++p;
        }
    }
    return VAR_OK;
}
/* Replace every character of "data" that is a member of the class
   described by "search" with the character at the same position of the
   class described by "replace". If "data" does not own its text it is
   copied first so that the original is never modified.

   Returns VAR_OK or a negative error code: the classes must expand to
   the same number of characters and must not be empty. On error the
   "search" and "replace" buffers are released as well. */
static int transpose(tokenbuf_t *data, tokenbuf_t *search,
                     tokenbuf_t *replace)
{
    tokenbuf_t srcclass, dstclass;
    const char *p;
    size_t classlen;
    size_t i;
    int rc;

    tokenbuf_init(&srcclass);
    tokenbuf_init(&dstclass);

    if ((rc = expand_class_description(search, &srcclass)) != VAR_OK)
        goto error_return;
    if ((rc = expand_class_description(replace, &dstclass)) != VAR_OK)
        goto error_return;

    if (srcclass.begin == srcclass.end) {
        rc = VAR_ERR_EMPTY_TRANSPOSE_CLASS;
        goto error_return;
    }
    if ((srcclass.end - srcclass.begin) != (dstclass.end - dstclass.begin)) {
        rc = VAR_ERR_TRANSPOSE_CLASSES_MISMATCH;
        goto error_return;
    }
    classlen = srcclass.end - srcclass.begin;

    /* Work on a private copy if the text is not ours to modify. */
    if (data->buffer_size == 0) {
        tokenbuf_t tmp;

        tokenbuf_init(&tmp);
        if (!tokenbuf_assign(&tmp, data->begin, data->end - data->begin)) {
            rc = VAR_ERR_OUT_OF_MEMORY;
            goto error_return;
        }
        tokenbuf_move(&tmp, data);
    }

    for (p = data->begin; p != data->end; ++p) {
        /* Only the classlen members are candidates; the element behind
           them is the terminator, not part of the class. */
        for (i = 0; i < classlen; ++i) {
            if (*p == srcclass.begin[i]) {
                *((char *)p) = dstclass.begin[i];
                break;
            }
        }
    }

    tokenbuf_free(&srcclass);
    tokenbuf_free(&dstclass);
    return VAR_OK;

  error_return:
    tokenbuf_free(search);
    tokenbuf_free(replace);
    tokenbuf_free(&srcclass);
    tokenbuf_free(&dstclass);
    return rc;
}
/* Replace "data" by a substring of itself. "number1" is the zero-based
   start offset. If "number2" is zero the rest of the string is taken.
   Otherwise, with "isrange" set, "number2" is the number of characters
   to take; without it, "number2" is the offset of the last character
   to take (inclusive).

   Returns VAR_OK or a negative error code; on error "data" is left
   unchanged. All bounds are checked on lengths rather than on
   pointers so that large numbers cannot overflow the arithmetic. */
static int cut_out_offset(tokenbuf_t *data, tokenbuf_t *number1,
                          tokenbuf_t *number2, int isrange)
{
    tokenbuf_t res;
    const char *p;
    size_t num1 = tokenbuf_toint(number1);
    size_t num2 = tokenbuf_toint(number2);
    size_t datalen = data->end - data->begin;

    tokenbuf_init(&res);

    /* Determine begin of result string. */
    if (num1 > datalen)
        return VAR_ERR_OFFSET_OUT_OF_BOUNDS;
    p = data->begin + num1;

    if (num2 == 0) {
        /* If num2 is zero, we copy the rest from there. */
        if (!tokenbuf_assign(&res, p, datalen - num1))
            return VAR_ERR_OUT_OF_MEMORY;
    } else if (isrange) {
        /* num2 is a count of characters. */
        if (num2 > datalen - num1)
            return VAR_ERR_RANGE_OUT_OF_BOUNDS;
        if (!tokenbuf_assign(&res, p, num2))
            return VAR_ERR_OUT_OF_MEMORY;
    } else {
        /* num2 is the inclusive end offset, so it has to address an
           existing character. */
        if (num2 < num1)
            return VAR_ERR_OFFSET_LOGIC;
        if (num2 >= datalen)
            return VAR_ERR_RANGE_OUT_OF_BOUNDS;
        if (!tokenbuf_assign(&res, p, num2 - num1 + 1))
            return VAR_ERR_OUT_OF_MEMORY;
    }

    tokenbuf_free(data);
    tokenbuf_move(&res, data);
    return VAR_OK;
}
/* Build the replacement text for one regular expression match.
   "orig" is the replacement template: "\\" stands for a backslash and
   "\N" (N being a single digit) for the text of submatch N, which is
   taken from "data" at the offsets recorded in pmatch[N]. "pmatch"
   must therefore provide at least ten entries. The result is stored in
   "expanded", which is initialized here.

   Returns VAR_OK or a negative error code, in which case "expanded"
   is released. */
static int expand_regex_replace(const char *data, tokenbuf_t *orig,
                                regmatch_t *pmatch, tokenbuf_t *expanded)
{
    const char *p = orig->begin;
    size_t i;
    int rc;

    tokenbuf_init(expanded);

    while (p != orig->end) {
        if (*p != '\\') {
            /* Ordinary character: copy it. */
            if (!tokenbuf_append(expanded, p, 1)) {
                rc = VAR_ERR_OUT_OF_MEMORY;
                goto error_return;
            }
            ++p;
            continue;
        }

        if (orig->end - p <= 1) {
            rc = VAR_ERR_INCOMPLETE_QUOTED_PAIR;
            goto error_return;
        }
        ++p;

        if (*p == '\\') {
            if (!tokenbuf_append(expanded, p, 1)) {
                rc = VAR_ERR_OUT_OF_MEMORY;
                goto error_return;
            }
            ++p;
            continue;
        }

        /* <ctype.h> functions require an unsigned char value. */
        if (!isdigit((unsigned char)*p)) {
            rc = VAR_ERR_UNKNOWN_QUOTED_PAIR_IN_REPLACE;
            goto error_return;
        }
        i = *p - '0';
        ++p;

        /* An offset of -1 marks a submatch that did not take part in
           the match. */
        if (pmatch[i].rm_so == -1) {
            rc = VAR_ERR_SUBMATCH_OUT_OF_RANGE;
            goto error_return;
        }
        if (!tokenbuf_append(expanded, data + pmatch[i].rm_so,
                             pmatch[i].rm_eo - pmatch[i].rm_so)) {
            rc = VAR_ERR_OUT_OF_MEMORY;
            goto error_return;
        }
    }
    return VAR_OK;

  error_return:
    tokenbuf_free(expanded);
    return rc;
}
/* Replace occurrences of "search" in "data" by "replace".

   "flags" is a sequence of flag characters (case is ignored):
     i - match case-insensitively
     g - replace every occurrence instead of only the first one
     t - treat "search" as plain text instead of as an extended
         regular expression
   In regular expression mode the replacement may refer to submatches
   (see expand_regex_replace()).

   Returns VAR_OK or a negative error code. On success "data" owns the
   newly built text. */
static int search_and_replace(tokenbuf_t *data, tokenbuf_t *search,
                              tokenbuf_t *replace, tokenbuf_t *flags)
{
    const char *p;
    size_t search_len;
    int case_insensitive = 0;
    int global = 0;
    int no_regex = 0;
    int rc;

    if (search->begin == search->end)
        return VAR_ERR_EMPTY_SEARCH_STRING;
    search_len = search->end - search->begin;

    for (p = flags->begin; p != flags->end; ++p) {
        switch (tolower((unsigned char)*p)) {
        case 'i':
            case_insensitive = 1;
            break;
        case 'g':
            global = 1;
            break;
        case 't':
            no_regex = 1;
            break;
        default:
            return VAR_ERR_UNKNOWN_REPLACE_FLAG;
        }
    }

    if (no_regex) {
        tokenbuf_t tmp;
        /* An empty replacement has no text pointer at all; substitute
           an empty string so that nothing is copied from NULL. */
        const char *repl = (replace->begin != NULL) ? replace->begin : "";
        size_t repl_len = replace->end - replace->begin;

        tokenbuf_init(&tmp);
        for (p = data->begin; p != data->end;) {
            /* Never compare beyond the end of the data: it is not
               guaranteed to be NUL-terminated. */
            if ((size_t)(data->end - p) < search_len)
                rc = 1;
            else if (case_insensitive)
                rc = strncasecmp(p, search->begin, search_len);
            else
                rc = strncmp(p, search->begin, search_len);

            if (rc != 0) {
                /* no match, copy character */
                if (!tokenbuf_append(&tmp, p, 1)) {
                    tokenbuf_free(&tmp);
                    return VAR_ERR_OUT_OF_MEMORY;
                }
                ++p;
            } else {
                if (!tokenbuf_append(&tmp, repl, repl_len)) {
                    tokenbuf_free(&tmp);
                    return VAR_ERR_OUT_OF_MEMORY;
                }
                p += search_len;
                if (!global) {
                    if (!tokenbuf_append(&tmp, p, data->end - p)) {
                        tokenbuf_free(&tmp);
                        return VAR_ERR_OUT_OF_MEMORY;
                    }
                    break;
                }
            }
        }

        tokenbuf_free(data);
        tokenbuf_move(&tmp, data);
    } else {
        tokenbuf_t tmp;
        tokenbuf_t mydata;
        tokenbuf_t myreplace;
        regex_t preg;
        regmatch_t pmatch[10];
        int regexec_flag;

        tokenbuf_init(&tmp);
        tokenbuf_init(&mydata);
        tokenbuf_init(&myreplace);

        /* Copy the pattern and the data to our own buffer to make
           sure they're terminated with a null byte. */
        if (!tokenbuf_assign(&tmp, search->begin, search_len))
            return VAR_ERR_OUT_OF_MEMORY;
        if (!tokenbuf_assign(&mydata, data->begin, data->end - data->begin)) {
            tokenbuf_free(&tmp);
            return VAR_ERR_OUT_OF_MEMORY;
        }

        /* Compile the pattern. */
        rc = regcomp(&preg, tmp.begin,
                     REG_EXTENDED | ((case_insensitive) ? REG_ICASE : 0));
        tokenbuf_free(&tmp);
        if (rc != 0) {
            tokenbuf_free(&mydata);
            return VAR_ERR_INVALID_REGEX_IN_REPLACE;
        }

        /* Match the pattern and create the result string in the tmp
           buffer. */
        for (p = mydata.begin; p != mydata.end;) {
            /* '^' may only match at the very start or after a newline. */
            if (p == mydata.begin || p[-1] == '\n')
                regexec_flag = 0;
            else
                regexec_flag = REG_NOTBOL;

            if (regexec(&preg, p, sizeof(pmatch) / sizeof(regmatch_t),
                        pmatch, regexec_flag) == REG_NOMATCH) {
                /* No further match: keep the remainder as it is. */
                if (!tokenbuf_append(&tmp, p, mydata.end - p)) {
                    rc = VAR_ERR_OUT_OF_MEMORY;
                    goto regex_error;
                }
                break;
            }

            rc = expand_regex_replace(p, replace, pmatch, &myreplace);
            if (rc != VAR_OK)
                goto regex_error;

            /* Text in front of the match, then the replacement. */
            if (!tokenbuf_append(&tmp, p, pmatch[0].rm_so)
                || !tokenbuf_append(&tmp,
                                    (myreplace.begin != NULL)
                                        ? myreplace.begin : "",
                                    myreplace.end - myreplace.begin)) {
                tokenbuf_free(&myreplace);
                rc = VAR_ERR_OUT_OF_MEMORY;
                goto regex_error;
            }
            tokenbuf_free(&myreplace);

            if (pmatch[0].rm_eo > 0) {
                p += pmatch[0].rm_eo;
            } else {
                /* Empty match at the current position: step over one
                   character to make progress, but keep it in the
                   output. */
                if (!tokenbuf_append(&tmp, p, 1)) {
                    rc = VAR_ERR_OUT_OF_MEMORY;
                    goto regex_error;
                }
                ++p;
            }

            if (!global) {
                if (!tokenbuf_append(&tmp, p, mydata.end - p)) {
                    rc = VAR_ERR_OUT_OF_MEMORY;
                    goto regex_error;
                }
                break;
            }
        }

        regfree(&preg);
        tokenbuf_free(data);
        tokenbuf_move(&tmp, data);
        tokenbuf_free(&mydata);
        return VAR_OK;

      regex_error:
        regfree(&preg);
        tokenbuf_free(&tmp);
        tokenbuf_free(&mydata);
        return rc;
    }

    return VAR_OK;
}
/* Append exactly "count" characters of padding to "out": the fill
   string is repeated as often as it fits completely and then cut off
   to supply the remainder. "fill" must not be empty. Returns 1 on
   success and 0 if memory could not be obtained. */
static int padding_fill(tokenbuf_t *out, tokenbuf_t *fill, size_t count)
{
    size_t fill_len = fill->end - fill->begin;

    while (count >= fill_len) {
        if (!tokenbuf_append(out, fill->begin, fill_len))
            return 0;
        count -= fill_len;
    }
    if (count > 0 && !tokenbuf_append(out, fill->begin, count))
        return 0;
    return 1;
}

/* Pad "data" with the fill string to the width given (as decimal
   text) in "widthstr". "position" selects where the data ends up:
     'l' - at the left, the padding is appended behind it
     'r' - at the right, the padding is put in front of it
     'c' - in the middle; if the padding cannot be split evenly the
           extra character goes behind the data
   Data that is already at least as wide is left unchanged, as is any
   other "position" value.

   Returns VAR_OK, VAR_ERR_EMPTY_PADDING_FILL_STRING or
   VAR_ERR_OUT_OF_MEMORY. */
static int padding(tokenbuf_t *data, tokenbuf_t *widthstr, tokenbuf_t *fill,
                   char position)
{
    tokenbuf_t result;
    size_t width = tokenbuf_toint(widthstr);
    size_t datalen = data->end - data->begin;
    size_t total, left, right;

    if (fill->begin == fill->end)
        return VAR_ERR_EMPTY_PADDING_FILL_STRING;

    /* Compare before subtracting: the sizes are unsigned. */
    if (width <= datalen)
        return VAR_OK;
    total = width - datalen;

    if (position == 'l') {
        /* The padding goes directly behind the data. */
        if (!padding_fill(data, fill, total))
            return VAR_ERR_OUT_OF_MEMORY;
        return VAR_OK;
    }

    if (position == 'r') {
        left = total;
        right = 0;
    } else if (position == 'c') {
        left = total / 2;
        right = total - left;
    } else {
        return VAR_OK;
    }

    /* Assemble prefix, data and suffix in a temporary buffer and
       move it into the data buffer afterwards. */
    tokenbuf_init(&result);
    if (!padding_fill(&result, fill, left)
        || !tokenbuf_append(&result, data->begin, datalen)
        || !padding_fill(&result, fill, right)) {
        tokenbuf_free(&result);
        return VAR_ERR_OUT_OF_MEMORY;
    }
    tokenbuf_free(data);
    tokenbuf_move(&result, data);
    return VAR_OK;
}
/* Parse one command of a complex expression (the part that follows a
   ':') and apply it to "data". The command character is recognized
   case-insensitively:
     l                       turn data to lowercase
     u                       turn data to uppercase
     o<num>,<num> o<num>-<num>  cut out a substring (see cut_out_offset())
     #                       substitute the length of data
     -<param>                substitute param if data is empty
     *<param>                param if data is empty, "" otherwise
     +<param>                substitute param if data is not empty
     s/<search>/<replace>/<flags>  search and replace
     y/<from>/<to>/          transpose characters
     p/<width>/<fill>/<l|c|r>  padding
   If "data" has no text at all (its begin pointer is NULL) the
   command is only parsed, not executed.

   Returns the number of input characters consumed (0 if begin equals
   end) or a negative error code. The input is never read at or beyond
   "end". */
static int command(const char *begin, const char *end,
                   const var_config_t *config, const char_class_t nameclass,
                   var_cb_t lookup, void *lookup_context, int force_expand,
                   tokenbuf_t *data)
{
    const char *p = begin;
    tokenbuf_t tmptokbuf;
    tokenbuf_t search, replace, flags;
    tokenbuf_t number1, number2;
    int isrange;
    int rc;

    tokenbuf_init(&tmptokbuf);
    tokenbuf_init(&search);
    tokenbuf_init(&replace);
    tokenbuf_init(&flags);
    tokenbuf_init(&number1);
    tokenbuf_init(&number2);

    if (begin == end)
        return 0;

    /* <ctype.h> functions require an unsigned char value. */
    switch (tolower((unsigned char)*p)) {
    case 'l':                  /* Turn data to lowercase. */
        if (data->begin) {
            char *ptr;

            /* If the buffer does not live in an allocated buffer,
               we have to copy it before modifying the contents. */
            if (data->buffer_size == 0) {
                if (!tokenbuf_assign(data, data->begin,
                                     data->end - data->begin)) {
                    rc = VAR_ERR_OUT_OF_MEMORY;
                    goto error_return;
                }
            }
            for (ptr = (char *)data->begin; ptr != data->end; ++ptr)
                *ptr = (char)tolower((unsigned char)*ptr);
        }
        ++p;
        break;

    case 'u':                  /* Turn data to uppercase. */
        if (data->begin) {
            char *ptr;

            if (data->buffer_size == 0) {
                if (!tokenbuf_assign(data, data->begin,
                                     data->end - data->begin)) {
                    rc = VAR_ERR_OUT_OF_MEMORY;
                    goto error_return;
                }
            }
            for (ptr = (char *)data->begin; ptr != data->end; ++ptr)
                *ptr = (char)toupper((unsigned char)*ptr);
        }
        ++p;
        break;

    case 'o':                  /* Cut out substrings. */
        ++p;
        rc = number(p, end);
        if (rc == 0) {
            rc = VAR_ERR_MISSING_START_OFFSET;
            goto error_return;
        }
        number1.begin = p;
        number1.end = p + rc;
        number1.buffer_size = 0;
        p += rc;

        if (p != end && *p == ',') {
            isrange = 0;
            ++p;
        } else if (p != end && *p == '-') {
            isrange = 1;
            ++p;
        } else {
            rc = VAR_ERR_INVALID_OFFSET_DELIMITER;
            goto error_return;
        }

        /* The second number may be empty, which counts as zero. */
        rc = number(p, end);
        number2.begin = p;
        number2.end = p + rc;
        number2.buffer_size = 0;
        p += rc;
        if (data->begin) {
            rc = cut_out_offset(data, &number1, &number2, isrange);
            if (rc < 0)
                goto error_return;
        }
        break;

    case '#':                  /* Substitute length of the string. */
        if (data->begin) {
            char buf[((sizeof(int) * 8) / 3) + 10]; /* sufficient size: <#bits> x log_10(2) + safety */

            sprintf(buf, "%d", (int)(data->end - data->begin));
            tokenbuf_free(data);
            if (!tokenbuf_assign(data, buf, strlen(buf))) {
                rc = VAR_ERR_OUT_OF_MEMORY;
                goto error_return;
            }
        }
        ++p;
        break;

    case '-':                  /* Substitute parameter if data is empty. */
        ++p;
        rc = exptext_or_variable(p, end, config, nameclass, lookup,
                                 lookup_context, force_expand, &tmptokbuf);
        if (rc < 0)
            goto error_return;
        if (rc == 0) {
            rc = VAR_ERR_MISSING_PARAMETER_IN_COMMAND;
            goto error_return;
        }
        p += rc;
        if (data->begin != NULL && data->begin == data->end) {
            tokenbuf_free(data);
            tokenbuf_move(&tmptokbuf, data);
        }
        break;

    case '*':                  /* Return "" if data is not empty, parameter otherwise. */
        ++p;
        rc = exptext_or_variable(p, end, config, nameclass, lookup,
                                 lookup_context, force_expand, &tmptokbuf);
        if (rc < 0)
            goto error_return;
        if (rc == 0) {
            rc = VAR_ERR_MISSING_PARAMETER_IN_COMMAND;
            goto error_return;
        }
        p += rc;
        if (data->begin != NULL) {
            if (data->begin == data->end) {
                tokenbuf_free(data);
                tokenbuf_move(&tmptokbuf, data);
            } else {
                tokenbuf_free(data);
                data->begin = data->end = "";
                data->buffer_size = 0;
            }
        }
        break;

    case '+':                  /* Substitute parameter if data is not empty. */
        ++p;
        rc = exptext_or_variable(p, end, config, nameclass, lookup,
                                 lookup_context, force_expand, &tmptokbuf);
        if (rc < 0)
            goto error_return;
        if (rc == 0) {
            rc = VAR_ERR_MISSING_PARAMETER_IN_COMMAND;
            goto error_return;
        }
        p += rc;
        if (data->begin != NULL && data->begin != data->end) {
            tokenbuf_free(data);
            tokenbuf_move(&tmptokbuf, data);
        }
        break;

    case 's':                  /* Search and replace. */
        ++p;
        if (p == end || *p != '/')
            return VAR_ERR_MALFORMATTED_REPLACE;
        ++p;

        rc = substext_or_variable(p, end, config, nameclass, lookup,
                                  lookup_context, force_expand, &search);
        if (rc < 0)
            goto error_return;
        p += rc;
        if (p == end || *p != '/') {
            rc = VAR_ERR_MALFORMATTED_REPLACE;
            goto error_return;
        }
        ++p;

        rc = substext_or_variable(p, end, config, nameclass, lookup,
                                  lookup_context, force_expand, &replace);
        if (rc < 0)
            goto error_return;
        p += rc;
        if (p == end || *p != '/') {
            rc = VAR_ERR_MALFORMATTED_REPLACE;
            goto error_return;
        }
        ++p;

        rc = exptext(p, end, config);
        if (rc < 0)
            goto error_return;
        flags.begin = p;
        flags.end = p + rc;
        flags.buffer_size = 0;
        p += rc;

        if (data->begin) {
            rc = search_and_replace(data, &search, &replace, &flags);
            if (rc < 0)
                goto error_return;
        }
        break;

    case 'y':                  /* Transpose characters from class A to class B. */
        ++p;
        if (p == end || *p != '/')
            return VAR_ERR_MALFORMATTED_TRANSPOSE;
        ++p;

        rc = substext_or_variable(p, end, config, nameclass, lookup,
                                  lookup_context, force_expand, &search);
        if (rc < 0)
            goto error_return;
        p += rc;
        if (p == end || *p != '/') {
            rc = VAR_ERR_MALFORMATTED_TRANSPOSE;
            goto error_return;
        }
        ++p;

        rc = substext_or_variable(p, end, config, nameclass, lookup,
                                  lookup_context, force_expand, &replace);
        if (rc < 0)
            goto error_return;
        p += rc;
        if (p == end || *p != '/') {
            rc = VAR_ERR_MALFORMATTED_TRANSPOSE;
            goto error_return;
        }
        ++p;

        if (data->begin) {
            rc = transpose(data, &search, &replace);
            if (rc < 0)
                goto error_return;
        }
        break;

    case 'p':                  /* Padding. */
        ++p;
        if (p == end || *p != '/')
            return VAR_ERR_MALFORMATTED_PADDING;
        ++p;

        rc = number(p, end);
        if (rc == 0) {
            rc = VAR_ERR_MISSING_PADDING_WIDTH;
            goto error_return;
        }
        number1.begin = p;
        number1.end = p + rc;
        number1.buffer_size = 0;
        p += rc;
        if (p == end || *p != '/') {
            rc = VAR_ERR_MALFORMATTED_PADDING;
            goto error_return;
        }
        ++p;

        rc = substext_or_variable(p, end, config, nameclass, lookup,
                                  lookup_context, force_expand, &replace);
        if (rc < 0)
            goto error_return;
        p += rc;
        if (p == end || *p != '/') {
            rc = VAR_ERR_MALFORMATTED_PADDING;
            goto error_return;
        }
        ++p;

        if (p == end || (*p != 'l' && *p != 'c' && *p != 'r')) {
            rc = VAR_ERR_MALFORMATTED_PADDING;
            goto error_return;
        }
        ++p;

        if (data->begin) {
            rc = padding(data, &number1, &replace, p[-1]);
            if (rc < 0)
                goto error_return;
        }
        break;

    default:
        return VAR_ERR_UNKNOWN_COMMAND_CHAR;
    }

    /* Exit gracefully. */
    tokenbuf_free(&tmptokbuf);
    tokenbuf_free(&search);
    tokenbuf_free(&replace);
    tokenbuf_free(&flags);
    tokenbuf_free(&number1);
    tokenbuf_free(&number2);
    return p - begin;

  error_return:
    tokenbuf_free(data);
    tokenbuf_free(&tmptokbuf);
    tokenbuf_free(&search);
    tokenbuf_free(&replace);
    tokenbuf_free(&flags);
    tokenbuf_free(&number1);
    tokenbuf_free(&number2);
    return rc;
}
/* Top-level rule of the parser: the input is an alternating sequence
   of plain text and variable references. The expanded text is
   collected in "output".

   Returns VAR_OK if the complete input could be processed. On error
   the text collected so far is released and "output" is set to refer
   to the part of the input, from its start up to the current parse
   position, that had been handled when the error occurred. */
static var_rc_t input(const char *begin, const char *end,
                      const var_config_t *config,
                      const char_class_t nameclass, var_cb_t lookup,
                      void *lookup_context, int force_expand,
                      tokenbuf_t *output)
{
    const char *p = begin;
    int rc;
    tokenbuf_t result;

    tokenbuf_init(&result);

    do {
        rc = text(begin, end, config->varinit, config->escape);
        if (rc > 0) {
            if (!tokenbuf_append(output, begin, rc)) {
                rc = VAR_ERR_OUT_OF_MEMORY;
                goto error_return;
            }
            begin += rc;
        } else if (rc < 0)
            goto error_return;

        rc = variable(begin, end, config, nameclass, lookup,
                      lookup_context, force_expand, &result);
        if (rc < 0)
            goto error_return;
        if (rc > 0) {
            if (!tokenbuf_append(output, result.begin,
                                 result.end - result.begin)) {
                rc = VAR_ERR_OUT_OF_MEMORY;
                goto error_return;
            }
            begin += rc;
            /* The value has been copied; variable() would overwrite
               the buffer without releasing it on the next round. */
            tokenbuf_free(&result);
        }
    } while (rc > 0);

    if (begin != end) {
        rc = VAR_ERR_INPUT_ISNT_TEXT_NOR_VARIABLE;
        goto error_return;
    }

    tokenbuf_free(&result);
    return VAR_OK;

  error_return:
    tokenbuf_free(output);
    tokenbuf_free(&result);
    output->begin = p;
    output->end = begin;
    output->buffer_size = 0;
    return rc;
}
/* Expand all variable references in the "input_len" bytes at
   "input_buf".

   "lookup" is called with "lookup_context" to resolve variable names.
   "config" selects the special characters and may be NULL to use
   var_config_default. With a non-zero "force_expand" an undefined
   variable is an error; otherwise the reference is left in the output
   as written.

   On success VAR_OK is returned, *result points to the expanded text
   and *result_len is its length. If parsing fails, *result and
   *result_len describe the part of the input that had been processed
   when the error was detected. For errors detected before parsing
   starts, *result (if it can be set at all) points to the input buffer
   and *result_len is 0.

   NOTE(review): on success the text is held in a buffer allocated by
   this library; it looks like the caller is expected to free() it -
   confirm against the documentation in var.h. */
var_rc_t var_expand(const char *input_buf, size_t input_len,
                    char **result, size_t *result_len,
                    var_cb_t lookup, void *lookup_context,
                    const var_config_t *config, int force_expand)
{
    char_class_t nameclass;
    var_rc_t rc;
    tokenbuf_t output;

    /* Argument sanity checks */
    if (input_buf == NULL || input_len == 0 ||
        result == NULL || result_len == NULL ||
        lookup == NULL)
        return VAR_ERR_INVALID_ARGUMENT;

    /* Optionally use default configuration */
    if (config == NULL)
        config = &var_config_default;

    /* Set the result to the beginning of the input buffer so that it
       is correctly initialized in case we fail with an error. */
    *result = (char *)input_buf;
    *result_len = 0;

    /* Expand the class description for valid variable names. */
    if ((rc = expand_character_class(config->namechars, nameclass)) != VAR_OK)
        return rc;

    /* Make sure that the specials defined in the configuration do not
       appear in the character name class. The table is indexed with
       the unsigned char value of each special character. */
    if (nameclass[(unsigned char)config->varinit] ||
        nameclass[(unsigned char)config->startdelim] ||
        nameclass[(unsigned char)config->enddelim] ||
        nameclass[(unsigned char)config->escape])
        return VAR_ERR_INVALID_CONFIGURATION;

    /* Call the parser. */
    tokenbuf_init(&output);
    rc = input(input_buf, input_buf + input_len, config, nameclass,
               lookup, lookup_context, force_expand, &output);
    *result = (char *)output.begin;
    *result_len = output.end - output.begin;
    return rc;
}