OSSP CVS Repository

ossp - ossp-pkg/var/var.c 1.17
Not logged in
[Honeypot]  [Browse]  [Directory]  [Home]  [Login
[Reports]  [Search]  [Ticket]  [Timeline
  [Raw

ossp-pkg/var/var.c 1.17
/*
**  VAR - OSSP variable expression library.
**  Copyright (c) 2001 The OSSP Project (http://www.ossp.org/)
**  Copyright (c) 2001 Cable & Wireless Deutschland (http://www.cw.com/de/)
**
**  This file is part of OSSP VAR, an extensible data serialization
**  library which can be found at http://www.ossp.org/pkg/var/.
**
**  Permission to use, copy, modify, and distribute this software for
**  any purpose with or without fee is hereby granted, provided that
**  the above copyright notice and this permission notice appear in all
**  copies.
**
**  THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESSED OR IMPLIED
**  WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
**  MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
**  IN NO EVENT SHALL THE AUTHORS AND COPYRIGHT HOLDERS AND THEIR
**  CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
**  SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
**  LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF
**  USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
**  ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
**  OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
**  OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
**  SUCH DAMAGE.
**
**  var.c: VAR library implementation.
*/

#include <ctype.h>
#include <string.h>
#include <stdio.h>
#include <errno.h>
#include <sys/types.h>
#include <regex.h>
#include "var.h"

/* The default configuration for the parser. */

const var_config_t var_config_default = {
    '$',                        /* varinit */
    '{',                        /* startdelim */
    '}',                        /* enddelim */
    '\\',                       /* escape */
    "a-zA-Z0-9_"                /* namechars */
};

/* Routines for manipulation of token buffers. */

#define TOKENBUF_INITIAL_BUFSIZE 64

typedef struct {
    const char *begin;
    const char *end;
    size_t buffer_size;
} tokenbuf_t;

static void tokenbuf_init(tokenbuf_t *buf)
{
    buf->begin = NULL;
    buf->end = NULL;
    buf->buffer_size = 0;
    return;
}

static void tokenbuf_move(tokenbuf_t *src, tokenbuf_t *dst)
{
    dst->begin = src->begin;
    dst->end = src->end;
    dst->buffer_size = src->buffer_size;
    tokenbuf_init(src);
    return;
}

static int tokenbuf_assign(tokenbuf_t *buf, const char *data, size_t len)
{
    char *p;
    
    if ((p = malloc(len + 1)) == NULL)
        return 0;
    memcpy(p, data, len);
    buf->begin = p;
    buf->end = p + len;
    buf->buffer_size = len + 1;
    *((char *)(buf->end)) = '\0';
    return 1;
}

static int tokenbuf_append(tokenbuf_t *output, const char *data, size_t len)
{
    char *new_buffer;
    size_t new_size;
    char *tmp;

    /* Is the tokenbuffer initialized at all? If not, allocate a
       standard-sized buffer to begin with. */
    if (output->begin == NULL) {
        if ((output->begin = output->end = malloc(TOKENBUF_INITIAL_BUFSIZE)) == NULL)
            return 0;
        output->buffer_size = TOKENBUF_INITIAL_BUFSIZE;
    }

    /* Does the token contain text, but no buffer has been allocated yet? */
    if (output->buffer_size == 0) {
        /* Check whether data borders to output. If, we can append
           simly by increasing the end pointer. */
        if (output->end == data) {
            output->end += len;
            return 1;
        }
        /* OK, so copy the contents of output into an allocated buffer
           so that we can append that way. */
        if ((tmp = malloc(output->end - output->begin + len + 1)) == NULL)
            return 0;
        memcpy(tmp, output->begin, output->end - output->begin);
        output->buffer_size = output->end - output->begin;
        output->begin = tmp;
        output->end = tmp + output->buffer_size;
        output->buffer_size += len + 1;
    }

    /* Does the token fit into the current buffer? If not, realloc a
       larger buffer that fits. */
    if ((output->buffer_size - (output->end - output->begin)) <= len) {
        new_size = output->buffer_size;
        do {
            new_size *= 2;
        } while ((new_size - (output->end - output->begin)) <= len);
        if ((new_buffer = realloc((char *)output->begin, new_size)) == NULL)
            return 0;
        output->end = new_buffer + (output->end - output->begin);
        output->begin = new_buffer;
        output->buffer_size = new_size;
    }

    /* Append the data at the end of the current buffer. */
    memcpy((char *)output->end, data, len);
    output->end += len;
    *((char *)output->end) = '\0';
    return 1;
}

static void tokenbuf_free(tokenbuf_t *buf)
{
    if (buf->begin != NULL && buf->buffer_size > 0)
        free((char *)buf->begin);
    buf->begin = buf->end = NULL;
    buf->buffer_size = 0;
    return;
}

static size_t tokenbuf_toint(tokenbuf_t *number)
{
    const char *p;
    size_t num;
    
    num = 0;
    for (p = number->begin; p != number->end; ++p) {
        num *= 10;
        num += *p - '0';
    }
    return num;
}

/* Routines for the expansion of quoted-pair expressions. */

static void expand_range(char a, char b, char class[256])
{
    do {
        class[(int)a] = 1;
    }
    while (++a <= b);
}

static var_rc_t expand_character_class(const char *desc, char class[256])
{
    size_t i;

    /* Clear the class array. */

    for (i = 0; i < 256; ++i)
        class[i] = 0;

    /* Walk through the class description and set the appropriate
       entries in the array. */

    while (*desc != '\0') {
        if (desc[1] == '-' && desc[2] != '\0') {
            if (desc[0] > desc[2])
                return VAR_ERR_INCORRECT_CLASS_SPEC;
            expand_range(desc[0], desc[2], class);
            desc += 3;
        } else {
            class[(int) *desc] = 1;
            ++desc;
        }
    }

    return VAR_OK;
}

static int isoct(char c)
{
    if (c >= '0' && c <= '7')
        return 1;
    else
        return 0;
}

static var_rc_t expand_octal(const char **src, char **dst, const char *end)
{
    unsigned char c;

    if (end - *src < 3)
        return VAR_ERR_INCOMPLETE_OCTAL;
    if (!isoct(**src) || !isoct((*src)[1]) || !isoct((*src)[2]))
        return VAR_ERR_INVALID_OCTAL;

    c = **src - '0';
    if (c > 3)
        return VAR_ERR_OCTAL_TOO_LARGE;
    c *= 8;
    ++(*src);

    c += **src - '0';
    c *= 8;
    ++(*src);

    c += **src - '0';

    **dst = (char) c;
    ++(*dst);
    return VAR_OK;
}

static int ishex(char c)
{
    if ((c >= '0' && c <= '9') ||
        (c >= 'a' && c <= 'f') || (c >= 'A' && c <= 'F'))
        return 1;
    else
        return 0;
}

static var_rc_t expand_simple_hex(const char **src, char **dst,
                                  const char *end)
{
    unsigned char c = 0;

    if (end - *src < 2)
        return VAR_ERR_INCOMPLETE_HEX;
    if (!ishex(**src) || !ishex((*src)[1]))
        return VAR_ERR_INVALID_HEX;

    if (**src >= '0' && **src <= '9')
        c = **src - '0';
    else if (c >= 'a' && c <= 'f')
        c = **src - 'a' + 10;
    else if (c >= 'A' && c <= 'F')
        c = **src - 'A' + 10;

    c = c << 4;
    ++(*src);

    if (**src >= '0' && **src <= '9')
        c += **src - '0';
    else if (**src >= 'a' && **src <= 'f')
        c += **src - 'a' + 10;
    else if (**src >= 'A' && **src <= 'F')
        c += **src - 'A' + 10;

    **dst = (char) c;
    ++(*dst);
    return VAR_OK;
}

static var_rc_t expand_grouped_hex(const char **src, char **dst,
                                   const char *end)
{
    var_rc_t rc;

    while (*src < end && **src != '}') {
        if ((rc = expand_simple_hex(src, dst, end)) != VAR_OK)
            return rc;
        ++(*src);
    }
    if (*src == end)
        return VAR_ERR_INCOMPLETE_GROUPED_HEX;

    return VAR_OK;
}

static var_rc_t expand_hex(const char **src, char **dst, const char *end)
{
    if (*src == end)
        return VAR_ERR_INCOMPLETE_HEX;
    if (**src == '{') {
        ++(*src);
        return expand_grouped_hex(src, dst, end);
    } else
        return expand_simple_hex(src, dst, end);
}

var_rc_t var_unescape(const char *src, size_t len, char *dst,
                      int unescape_all)
{
    const char *end = src + len;
    var_rc_t rc;

    while (src < end) {
        if (*src == '\\') {
            if (++src == end)
                return VAR_ERR_INCOMPLETE_NAMED_CHARACTER;
            switch (*src) {
            case '\\':
                if (!unescape_all) {
                    *dst++ = '\\';
                }
                *dst++ = '\\';
                break;
            case 'n':
                *dst++ = '\n';
                break;
            case 't':
                *dst++ = '\t';
                break;
            case 'r':
                *dst++ = '\r';
                break;
            case 'x':
                ++src;
                if ((rc = expand_hex(&src, &dst, end)) != VAR_OK)
                    return rc;
                break;
            case '0':
            case '1':
            case '2':
            case '3':
            case '4':
            case '5':
            case '6':
            case '7':
            case '8':
            case '9':
                if (end - src >= 3 && isdigit((int)src[1]) && isdigit((int)src[2])) {
                    if ((rc = expand_octal(&src, &dst, end)) != 0)
                        return rc;
                    break;
                }
            default:
                if (!unescape_all) {
                    *dst++ = '\\';
                }
                *dst++ = *src;
            }
            ++src;
        } else
            *dst++ = *src++;
    }
    *dst = '\0';
    return VAR_OK;
}

/* The recursive-descent parser for variable expressions. */

static int variable(const char *, const char *, const var_config_t *,
                    const char[256], var_cb_t, void *, int, tokenbuf_t *);
static int command(const char *, const char *, const var_config_t *,
                   const char[256], var_cb_t, void *, int, tokenbuf_t *);

static int text(const char *begin, const char *end, char varinit,
                char escape)
{
    const char *p;
    for (p = begin; p != end && *p != varinit; ++p) {
        if (*p == escape) {
            if (p + 1 == end)
                return VAR_ERR_INCOMPLETE_QUOTED_PAIR;
            else
                ++p;
        }
    }
    return p - begin;
}

static int varname(const char *begin, const char *end,
                   const char nameclass[256])
{
    const char *p;
    for (p = begin; p != end && nameclass[(int) *p]; ++p);
    return p - begin;
}

static int number(const char *begin, const char *end)
{
    const char *p;
    for (p = begin; p != end && isdigit((int)*p); ++p);
    return p - begin;
}

static int substext(const char *begin, const char *end,
                    const var_config_t *config)
{
    const char *p;
    for (p = begin; p != end && *p != config->varinit && *p != '/'; ++p) {
        if (*p == config->escape) {
            if (p + 1 == end)
                return VAR_ERR_INCOMPLETE_QUOTED_PAIR;
            else
                ++p;
        }
    }
    return p - begin;
}

static int exptext(const char *begin, const char *end,
                   const var_config_t *config)
{
    const char *p;
    for (p = begin;
         p != end && *p != config->varinit && *p != config->enddelim
         && *p != ':'; ++p) {
        if (*p == config->escape) {
            if (p + 1 == end)
                return VAR_ERR_INCOMPLETE_QUOTED_PAIR;
            else
                ++p;
        }
    }
    return p - begin;
}


static int expression(const char *begin, const char *end,
                      const var_config_t *config,
                      const char nameclass[256], var_cb_t lookup,
                      void *lookup_context, int force_expand,
                      tokenbuf_t *result)
{
    const char *p = begin;
    const char *data;
    size_t len, buffer_size;
    int failed = 0;
    int rc;
    tokenbuf_t name;
    tokenbuf_t tmp;

    /* Clear the tokenbufs to make sure we have a defined state. */

    tokenbuf_init(&name);
    tokenbuf_init(&tmp);
    tokenbuf_init(result);

    /* Expect STARTDELIM. */

    if (p == end || *p != config->startdelim)
        return 0;

    if (++p == end)
        return VAR_ERR_INCOMPLETE_VARIABLE_SPEC;

    /* Get the name of the variable to expand. The name may consist of
       an arbitrary number of VARNAMEs and VARIABLEs. */

    do {
        rc = varname(p, end, nameclass);
        if (rc < 0)
            goto error_return;
        else if (rc > 0) {
            if (!tokenbuf_append(&name, p, rc)) {
                rc = VAR_ERR_OUT_OF_MEMORY;
                goto error_return;
            } else
                p += rc;
        }

        rc = variable(p, end, config, nameclass, lookup, lookup_context,
                      force_expand, &tmp);
        if (rc < 0)
            goto error_return;
        else if (rc > 0) {
            if (!tokenbuf_append(&name, tmp.begin, tmp.end - tmp.begin)) {
                rc = VAR_ERR_OUT_OF_MEMORY;
                goto error_return;
            } else
                p += rc;
        }
    }
    while (rc > 0);

    /* We must have the complete variable name now, so make sure we
       do. */

    if (name.begin == name.end) {
        rc = VAR_ERR_INCOMPLETE_VARIABLE_SPEC;
        goto error_return;
    }

    /* Now we have the name of the variable stored in "name". We
       expect an ENDDELIM here. */

    if (p == end || (*p != config->enddelim && *p != ':')) {
        rc = VAR_ERR_INCOMPLETE_VARIABLE_SPEC;
        goto error_return;
    } else
        ++p;

    /* Use the lookup callback to get the variable's contents. */

    rc = (*lookup) (lookup_context, name.begin, name.end - name.begin,
                    &data, &len, &buffer_size);
    if (rc < 0)
        goto error_return;
    else if (rc == 0) {
        /* The variable is undefined. What we'll do now depends on the
           force_expand flag. */

        if (force_expand) {
            rc = VAR_ERR_UNDEFINED_VARIABLE;
            goto error_return;
        } else {
            /* Initialize result to point back to the original text in
               the buffer. */

            result->begin = begin - 1;
            result->end = p;
            result->buffer_size = 0;
            failed = 1;
        }
    } else {
        /* The preliminary result is the contents of the variable.
           This may be modified by the commands that may follow. */

        result->begin = data;
        result->end = data + len;
        result->buffer_size = buffer_size;
    }

    if (p[-1] == ':') {
        /* Parse and execute commands. */

        tokenbuf_free(&tmp);
        --p;
        while (p != end && *p == ':') {
            ++p;
            if (!failed)
                rc = command(p, end, config, nameclass, lookup,
                             lookup_context, force_expand, result);
            else
                rc = command(p, end, config, nameclass, lookup,
                             lookup_context, force_expand, &tmp);
            if (rc < 0)
                goto error_return;
            p += rc;
            if (failed)
                result->end += rc;
        }

        if (p == end || *p != config->enddelim) {
            rc = VAR_ERR_INCOMPLETE_VARIABLE_SPEC;
            goto error_return;
        }
        ++p;
        if (failed)
            ++result->end;
    }

    /* Exit gracefully. */

    tokenbuf_free(&name);
    tokenbuf_free(&tmp);
    return p - begin;

    /* Exit in case of an error. */

  error_return:
    tokenbuf_free(&name);
    tokenbuf_free(&tmp);
    tokenbuf_free(result);
    return rc;
}

static int variable(const char *begin, const char *end,
                    const var_config_t *config, const char nameclass[256],
                    var_cb_t lookup, void *lookup_context,
                    int force_expand, tokenbuf_t *result)
{
    const char *p = begin;
    const char *data;
    size_t len, buffer_size;
    int rc, rc2;

    /* Clear the result tokenbuf to make sure we're in a defined
       state. */

    tokenbuf_init(result);

    /* Expect VARINIT. */

    if (p == end || *p != config->varinit)
        return 0;

    if (++p == end)
        return VAR_ERR_INCOMPLETE_VARIABLE_SPEC;

    /* Try to read the variable name. If that fails, we're parsing a
       complex expression. */

    rc = varname(p, end, nameclass);
    if (rc < 0)
        return rc;
    else if (rc > 0) {
        rc2 = (*lookup) (lookup_context, p, rc, &data, &len, &buffer_size);
        if (rc2 < 0)
            return rc2;
        else if (rc2 == 0) {
            if (force_expand)
                return VAR_ERR_UNDEFINED_VARIABLE;
            else {
                result->begin = begin;
                result->end = begin + 1 + rc;
                result->buffer_size = 0;
                return 1 + rc;
            }
        } else {
            result->begin = data;
            result->end = data + len;
            result->buffer_size = buffer_size;
            return 1 + rc;
        }
    }

    /* OK, we're dealing with a complex expression here. */

    rc = expression(p, end, config, nameclass, lookup, lookup_context,
                    force_expand, result);
    if (rc > 0)
        ++rc;
    return rc;
}

static int exptext_or_variable(const char *begin, const char *end,
                               const var_config_t *config,
                               const char nameclass[256], var_cb_t lookup,
                               void *lookup_context, int force_expand,
                               tokenbuf_t *result)
{
    const char *p = begin;
    tokenbuf_t tmp;
    int rc;

    tokenbuf_init(result);
    tokenbuf_init(&tmp);

    if (begin == end)
        return 0;

    do {
        rc = exptext(p, end, config);
        if (rc < 0)
            goto error_return;
        else if (rc > 0) {
            if (!tokenbuf_append(result, p, rc)) {
                rc = VAR_ERR_OUT_OF_MEMORY;
                goto error_return;
            } else
                p += rc;
        }

        rc = variable(p, end, config, nameclass, lookup, lookup_context,
                      force_expand, &tmp);
        if (rc < 0)
            goto error_return;
        else if (rc > 0) {
            p += rc;
            if (!tokenbuf_append
                (result, tmp.begin, tmp.end - tmp.begin)) {
                rc = VAR_ERR_OUT_OF_MEMORY;
                goto error_return;
            }
        }
    }
    while (rc > 0);

    tokenbuf_free(&tmp);
    return p - begin;

  error_return:
    tokenbuf_free(&tmp);
    tokenbuf_free(result);
    return rc;
}

static int substext_or_variable(const char *begin, const char *end,
                                const var_config_t *config,
                                const char nameclass[256], var_cb_t lookup,
                                void *lookup_context, int force_expand,
                                tokenbuf_t *result)
{
    const char *p = begin;
    tokenbuf_t tmp;
    int rc;

    tokenbuf_init(result);
    tokenbuf_init(&tmp);

    if (begin == end)
        return 0;

    do {
        rc = substext(p, end, config);
        if (rc < 0)
            goto error_return;
        else if (rc > 0) {
            if (!tokenbuf_append(result, p, rc)) {
                rc = VAR_ERR_OUT_OF_MEMORY;
                goto error_return;
            } else
                p += rc;
        }

        rc = variable(p, end, config, nameclass, lookup, lookup_context,
                      force_expand, &tmp);
        if (rc < 0)
            goto error_return;
        else if (rc > 0) {
            p += rc;
            if (!tokenbuf_append
                (result, tmp.begin, tmp.end - tmp.begin)) {
                rc = VAR_ERR_OUT_OF_MEMORY;
                goto error_return;
            }
        }
    }
    while (rc > 0);

    tokenbuf_free(&tmp);
    return p - begin;

  error_return:
    tokenbuf_free(&tmp);
    tokenbuf_free(result);
    return rc;
}


static int expand_class_description(tokenbuf_t *src, tokenbuf_t *dst)
{
    unsigned char c, d;
    const char *p = src->begin;
    while (p != src->end) {
        if ((src->end - p) >= 3 && p[1] == '-') {
            if (*p > p[2])
                return VAR_ERR_INCORRECT_TRANSPOSE_CLASS_SPEC;
            for (c = *p, d = p[2]; c <= d; ++c) {
                if (!tokenbuf_append(dst, (char *) &c, 1))
                    return VAR_ERR_OUT_OF_MEMORY;
            }
            p += 3;
        } else {
            if (!tokenbuf_append(dst, p, 1))
                return VAR_ERR_OUT_OF_MEMORY;
            else
                ++p;
        }
    }
    return VAR_OK;
}

static int transpose(tokenbuf_t *data, tokenbuf_t *search,
                     tokenbuf_t *replace)
{
    tokenbuf_t srcclass, dstclass;
    const char *p;
    int rc;
    size_t i;

    tokenbuf_init(&srcclass);
    tokenbuf_init(&dstclass);

    if ((rc = expand_class_description(search, &srcclass)) != VAR_OK)
        goto error_return;
    if ((rc = expand_class_description(replace, &dstclass)) != VAR_OK)
        goto error_return;

    if (srcclass.begin == srcclass.end) {
        rc = VAR_ERR_EMPTY_TRANSPOSE_CLASS;
        goto error_return;
    }
    if ((srcclass.end - srcclass.begin) != (dstclass.end - dstclass.begin)) {
        rc = VAR_ERR_TRANSPOSE_CLASSES_MISMATCH;
        goto error_return;
    }

    if (data->buffer_size == 0) {
        tokenbuf_t tmp;
        if (!tokenbuf_assign
            (&tmp, data->begin, data->end - data->begin)) {
            rc = VAR_ERR_OUT_OF_MEMORY;
            goto error_return;
        }
        tokenbuf_move(&tmp, data);
    }

    for (p = data->begin; p != data->end; ++p) {
        for (i = 0; i <= (srcclass.end - srcclass.begin); ++i) {
            if (*p == srcclass.begin[i]) {
                *((char *) p) = dstclass.begin[i];
                break;
            }
        }
    }

    tokenbuf_free(&srcclass);
    tokenbuf_free(&dstclass);
    return VAR_OK;

  error_return:
    tokenbuf_free(search);
    tokenbuf_free(replace);
    tokenbuf_free(&srcclass);
    tokenbuf_free(&dstclass);
    return rc;
}

static int cut_out_offset(tokenbuf_t *data, tokenbuf_t *number1,
                          tokenbuf_t *number2, int isrange)
{
    tokenbuf_t res;
    const char *p;
    size_t num1 = tokenbuf_toint(number1);
    size_t num2 = tokenbuf_toint(number2);

    /* Determine begin of result string. */

    if ((data->end - data->begin) < num1)
        return VAR_ERR_OFFSET_OUT_OF_BOUNDS;
    else
        p = data->begin + num1;

    /* If num2 is zero, we copy the rest from there. */

    if (num2 == 0) {
        if (!tokenbuf_assign(&res, p, data->end - p))
            return VAR_ERR_OUT_OF_MEMORY;
    } else {                    /* OK, then use num2. */

        if (isrange) {
            if ((p + num2) > data->end)
                return VAR_ERR_RANGE_OUT_OF_BOUNDS;
            if (!tokenbuf_assign(&res, p, num2))
                return VAR_ERR_OUT_OF_MEMORY;
        } else {
            if (num2 < num1)
                return VAR_ERR_OFFSET_LOGIC;
            if ((data->begin + num2) > data->end)
                return VAR_ERR_RANGE_OUT_OF_BOUNDS;
            if (!tokenbuf_assign(&res, p, (data->begin + num2) - p))
                return VAR_ERR_OUT_OF_MEMORY;
        }
    }
    tokenbuf_free(data);
    tokenbuf_move(&res, data);
    return VAR_OK;
}

static int expand_regex_replace(const char *data, tokenbuf_t *orig,
                                regmatch_t *pmatch, tokenbuf_t *expanded)
{
    const char *p = orig->begin;
    size_t i;

    tokenbuf_init(expanded);

    while (p != orig->end) {
        if (*p == '\\') {
            if (orig->end - p <= 1) {
                tokenbuf_free(expanded);
                return VAR_ERR_INCOMPLETE_QUOTED_PAIR;
            } else
                ++p;
            if (*p == '\\') {
                if (!tokenbuf_append(expanded, p, 1)) {
                    tokenbuf_free(expanded);
                    return VAR_ERR_OUT_OF_MEMORY;
                }
                ++p;
                continue;
            }
            if (!isdigit((int)*p)) {
                tokenbuf_free(expanded);
                return VAR_ERR_UNKNOWN_QUOTED_PAIR_IN_REPLACE;
            }
            i = *p - '0';
            ++p;
            if (pmatch[i].rm_so == -1) {
                tokenbuf_free(expanded);
                return VAR_ERR_SUBMATCH_OUT_OF_RANGE;
            }
            if (!tokenbuf_append(expanded, data + pmatch[i].rm_so,
                                    pmatch[i].rm_eo - pmatch[i].rm_so)) {
                tokenbuf_free(expanded);
                return VAR_ERR_OUT_OF_MEMORY;
            }
        } else {
            if (!tokenbuf_append(expanded, p, 1)) {
                tokenbuf_free(expanded);
                return VAR_ERR_OUT_OF_MEMORY;
            }
            ++p;
        }
    }

    return VAR_OK;
}

static int search_and_replace(tokenbuf_t *data, tokenbuf_t *search,
                              tokenbuf_t *replace, tokenbuf_t *flags)
{
    const char *p;
    int case_insensitive = 0;
    int global = 0;
    int no_regex = 0;
    int rc;

    if (search->begin == search->end)
        return VAR_ERR_EMPTY_SEARCH_STRING;

    for (p = flags->begin; p != flags->end; ++p) {
        switch (tolower(*p)) {
        case 'i':
            case_insensitive = 1;
            break;
        case 'g':
            global = 1;
            break;
        case 't':
            no_regex = 1;
            break;
        default:
            return VAR_ERR_UNKNOWN_REPLACE_FLAG;
        }
    }

    if (no_regex) {
        tokenbuf_t tmp;
        tokenbuf_init(&tmp);

        for (p = data->begin; p != data->end;) {
            if (case_insensitive)
                rc = strncasecmp(p, search->begin,
                                 search->end - search->begin);
            else
                rc = strncmp(p, search->begin,
                             search->end - search->begin);
            if (rc != 0) {      /* no match, copy character */
                if (!tokenbuf_append(&tmp, p, 1)) {
                    tokenbuf_free(&tmp);
                    return VAR_ERR_OUT_OF_MEMORY;
                }
                ++p;
            } else {
                tokenbuf_append(&tmp, replace->begin,
                                   replace->end - replace->begin);
                p += search->end - search->begin;
                if (!global) {
                    if (!tokenbuf_append(&tmp, p, data->end - p)) {
                        tokenbuf_free(&tmp);
                        return VAR_ERR_OUT_OF_MEMORY;
                    }
                    break;
                }
            }
        }

        tokenbuf_free(data);
        tokenbuf_move(&tmp, data);
    } else {
        tokenbuf_t tmp;
        tokenbuf_t mydata;
        tokenbuf_t myreplace;
        regex_t preg;
        regmatch_t pmatch[10];
        int regexec_flag;

        /* Copy the pattern and the data to our own buffer to make
           sure they're terminated with a null byte. */

        if (!tokenbuf_assign
            (&tmp, search->begin, search->end - search->begin))
            return VAR_ERR_OUT_OF_MEMORY;
        if (!tokenbuf_assign
            (&mydata, data->begin, data->end - data->begin)) {
            tokenbuf_free(&tmp);
            return VAR_ERR_OUT_OF_MEMORY;
        }

        /* Compile the pattern. */

        rc = regcomp(&preg, tmp.begin,
                     REG_EXTENDED | ((case_insensitive) ? REG_ICASE : 0));
        tokenbuf_free(&tmp);
        if (rc != 0) {
            tokenbuf_free(&mydata);
            return VAR_ERR_INVALID_REGEX_IN_REPLACE;
        }

        /* Match the pattern and create the result string in the tmp
           buffer. */

        for (p = mydata.begin; p != mydata.end;) {
            if (p == mydata.begin || p[-1] == '\n')
                regexec_flag = 0;
            else
                regexec_flag = REG_NOTBOL;
            if (regexec
                (&preg, p, sizeof(pmatch) / sizeof(regmatch_t), pmatch,
                 regexec_flag) == REG_NOMATCH) {
                tokenbuf_append(&tmp, p, mydata.end - p);
                break;
            } else {
                rc = expand_regex_replace(p, replace, pmatch, &myreplace);
                if (rc != VAR_OK) {
                    regfree(&preg);
                    tokenbuf_free(&tmp);
                    tokenbuf_free(&mydata);
                    return rc;
                }
                if (!tokenbuf_append(&tmp, p, pmatch[0].rm_so) ||
                    !tokenbuf_append(&tmp, myreplace.begin,
                                        myreplace.end - myreplace.begin)) {
                    regfree(&preg);
                    tokenbuf_free(&tmp);
                    tokenbuf_free(&mydata);
                    tokenbuf_free(&myreplace);
                    return VAR_ERR_OUT_OF_MEMORY;
                } else {
                    p += (pmatch[0].rm_eo > 0) ? pmatch[0].rm_eo : 1;
                    tokenbuf_free(&myreplace);
                }
                if (!global) {
                    tokenbuf_append(&tmp, p, mydata.end - p);
                    break;
                }
            }
        }

        regfree(&preg);
        tokenbuf_free(data);
        tokenbuf_move(&tmp, data);
        tokenbuf_free(&mydata);
    }

    return VAR_OK;
}

static int padding(tokenbuf_t *data, tokenbuf_t *widthstr, tokenbuf_t *fill,
                   char position)
{
    tokenbuf_t result;
    size_t width = tokenbuf_toint(widthstr);
    int i;

    if (fill->begin == fill->end)
        return VAR_ERR_EMPTY_PADDING_FILL_STRING;

    tokenbuf_init(&result);

    if (position == 'l') {
        i = width - (data->end - data->begin);
        if (i > 0) {
            i = i / (fill->end - fill->begin);
            while (i > 0) {
                if (!tokenbuf_append
                    (data, fill->begin, fill->end - fill->begin))
                    return VAR_ERR_OUT_OF_MEMORY;
                --i;
            }
            i = (width - (data->end - data->begin)) % (fill->end -
                                                       fill->begin);
            if (!tokenbuf_append(data, fill->begin, i))
                return VAR_ERR_OUT_OF_MEMORY;
        }
    } else if (position == 'r') {
        i = width - (data->end - data->begin);
        if (i > 0) {
            i = i / (fill->end - fill->begin);
            while (i > 0) {
                if (!tokenbuf_append
                    (&result, fill->begin, fill->end - fill->begin)) {
                    tokenbuf_free(&result);
                    return VAR_ERR_OUT_OF_MEMORY;
                }
                --i;
            }
            i = (width - (data->end - data->begin)) % (fill->end -
                                                       fill->begin);
            if (!tokenbuf_append(&result, fill->begin, i)) {
                tokenbuf_free(&result);
                return VAR_ERR_OUT_OF_MEMORY;
            }
            if (!tokenbuf_append
                (&result, data->begin, data->end - data->begin)) {
                tokenbuf_free(&result);
                return VAR_ERR_OUT_OF_MEMORY;
            }

            tokenbuf_free(data);
            tokenbuf_move(&result, data);
        }
    } else if (position == 'c') {
        i = (width - (data->end - data->begin)) / 2;
        if (i > 0) {
            /* Create the prefix. */

            i = i / (fill->end - fill->begin);
            while (i > 0) {
                if (!tokenbuf_append
                    (&result, fill->begin, fill->end - fill->begin)) {
                    tokenbuf_free(&result);
                    return VAR_ERR_OUT_OF_MEMORY;
                }
                --i;
            }
            i = ((width - (data->end - data->begin)) / 2) % (fill->end -
                                                             fill->begin);
            if (!tokenbuf_append(&result, fill->begin, i)) {
                tokenbuf_free(&result);
                return VAR_ERR_OUT_OF_MEMORY;
            }

            /* Append the actual data string. */

            if (!tokenbuf_append
                (&result, data->begin, data->end - data->begin)) {
                tokenbuf_free(&result);
                return VAR_ERR_OUT_OF_MEMORY;
            }

            /* Append the suffix. */

            i = width - (result.end - result.begin);
            i = i / (fill->end - fill->begin);
            while (i > 0) {
                if (!tokenbuf_append
                    (&result, fill->begin, fill->end - fill->begin)) {
                    tokenbuf_free(&result);
                    return VAR_ERR_OUT_OF_MEMORY;
                }
                --i;
            }
            i = width - (result.end - result.begin);
            if (!tokenbuf_append(&result, fill->begin, i)) {
                tokenbuf_free(&result);
                return VAR_ERR_OUT_OF_MEMORY;
            }

            /* Move string from temporary buffer to data buffer. */

            tokenbuf_free(data);
            tokenbuf_move(&result, data);
        }
    }

    return VAR_OK;
}

static int command(const char *begin, const char *end,
                   const var_config_t *config, const char nameclass[256],
                   var_cb_t lookup, void *lookup_context, int force_expand,
                   tokenbuf_t *data)
{
    const char *p = begin;
    tokenbuf_t tmptokbuf;
    tokenbuf_t search, replace, flags;
    tokenbuf_t number1, number2;
    int isrange;
    int rc;

    tokenbuf_init(&tmptokbuf);
    tokenbuf_init(&search);
    tokenbuf_init(&replace);
    tokenbuf_init(&flags);
    tokenbuf_init(&number1);
    tokenbuf_init(&number2);

    if (begin == end)
        return 0;

    switch (tolower(*p)) {
    case 'l':                   /* Turn data to lowercase. */
        if (data->begin) {
            char *ptr;
            /* If the buffer does not life in an allocated buffer,
               we have to copy it before modifying the contents. */

            if (data->buffer_size == 0) {
                if (!tokenbuf_assign
                    (data, data->begin, data->end - data->begin)) {
                    rc = VAR_ERR_OUT_OF_MEMORY;
                    goto error_return;
                }
            }
            for (ptr = (char *) data->begin; ptr != data->end; ++ptr)
                *ptr = tolower(*ptr);
        }
        ++p;
        break;

    case 'u':                   /* Turn data to uppercase. */
        if (data->begin) {
            char *ptr;
            if (data->buffer_size == 0) {
                if (!tokenbuf_assign
                    (data, data->begin, data->end - data->begin)) {
                    rc = VAR_ERR_OUT_OF_MEMORY;
                    goto error_return;
                }
            }
            for (ptr = (char *) data->begin; ptr != data->end; ++ptr)
                *ptr = toupper(*ptr);
        }
        ++p;
        break;

    case 'o':                   /* Cut out substrings. */
        ++p;
        rc = number(p, end);
        if (rc == 0) {
            rc = VAR_ERR_MISSING_START_OFFSET;
            goto error_return;
        } else {
            number1.begin = p;
            number1.end = p + rc;
            number1.buffer_size = 0;
            p += rc;
        }

        if (*p == ',') {
            isrange = 0;
            ++p;
        } else if (*p == '-') {
            isrange = 1;
            ++p;
        } else {
            rc = VAR_ERR_INVALID_OFFSET_DELIMITER;
            goto error_return;
        }

        rc = number(p, end);
        number2.begin = p;
        number2.end = p + rc;
        number2.buffer_size = 0;
        p += rc;
        if (data->begin) {
            rc = cut_out_offset(data, &number1, &number2, isrange);
            if (rc < 0)
                goto error_return;
        }
        break;

    case '#':                   /* Substitute length of the string. */
        if (data->begin) {
            char buf[1024];
            sprintf(buf, "%d", data->end - data->begin);
            tokenbuf_free(data);
            if (!tokenbuf_assign(data, buf, strlen(buf))) {
                rc = VAR_ERR_OUT_OF_MEMORY;
                goto error_return;
            }
        }
        ++p;
        break;

    case '-':                   /* Substitute parameter if data is empty. */
        ++p;
        rc = exptext_or_variable(p, end, config, nameclass, lookup,
                                 lookup_context, force_expand, &tmptokbuf);
        if (rc < 0)
            goto error_return;
        else if (rc == 0) {
            rc = VAR_ERR_MISSING_PARAMETER_IN_COMMAND;
            goto error_return;
        } else
            p += rc;
        if (data->begin != NULL && data->begin == data->end) {
            tokenbuf_free(data);
            tokenbuf_move(&tmptokbuf, data);
        }
        break;

    case '*':                   /* Return "" if data is not empty, parameter otherwise. */
        ++p;
        rc = exptext_or_variable(p, end, config, nameclass, lookup,
                                 lookup_context, force_expand, &tmptokbuf);
        if (rc < 0)
            goto error_return;
        else if (rc == 0) {
            rc = VAR_ERR_MISSING_PARAMETER_IN_COMMAND;
            goto error_return;
        } else
            p += rc;
        if (data->begin != NULL) {
            if (data->begin == data->end) {
                tokenbuf_free(data);
                tokenbuf_move(&tmptokbuf, data);
            } else {
                tokenbuf_free(data);
                data->begin = data->end = "";
                data->buffer_size = 0;
            }
        }
        break;

    case '+':                   /* Substitute parameter if data is not empty. */
        ++p;
        rc = exptext_or_variable(p, end, config, nameclass, lookup,
                                 lookup_context, force_expand, &tmptokbuf);
        if (rc < 0)
            goto error_return;
        else if (rc == 0) {
            rc = VAR_ERR_MISSING_PARAMETER_IN_COMMAND;
            goto error_return;
        } else
            p += rc;
        if (data->begin != NULL) {
            if (data->begin != data->end) {
                tokenbuf_free(data);
                tokenbuf_move(&tmptokbuf, data);
            }
        }
        break;

    case 's':                   /* Search and replace. */
        ++p;

        if (*p != '/')
            return VAR_ERR_MALFORMATTED_REPLACE;
        else
            ++p;

        rc = substext_or_variable(p, end, config, nameclass, lookup,
                                  lookup_context, force_expand, &search);
        if (rc < 0)
            goto error_return;
        else
            p += rc;

        if (*p != '/') {
            rc = VAR_ERR_MALFORMATTED_REPLACE;
            goto error_return;
        } else
            ++p;

        rc = substext_or_variable(p, end, config, nameclass, lookup,
                                  lookup_context, force_expand, &replace);
        if (rc < 0)
            goto error_return;
        else
            p += rc;

        if (*p != '/') {
            rc = VAR_ERR_MALFORMATTED_REPLACE;
            goto error_return;
        } else
            ++p;

        rc = exptext(p, end, config);
        if (rc < 0)
            goto error_return;
        else {
            flags.begin = p;
            flags.end = p + rc;
            flags.buffer_size = 0;
            p += rc;
        }

        if (data->begin) {
            rc = search_and_replace(data, &search, &replace, &flags);
            if (rc < 0)
                goto error_return;
        }
        break;

    case 'y':                   /* Transpose characters from class A to class B. */
        ++p;

        if (*p != '/')
            return VAR_ERR_MALFORMATTED_TRANSPOSE;
        else
            ++p;

        rc = substext_or_variable(p, end, config, nameclass, lookup,
                                  lookup_context, force_expand, &search);
        if (rc < 0)
            goto error_return;
        else
            p += rc;

        if (*p != '/') {
            rc = VAR_ERR_MALFORMATTED_TRANSPOSE;
            goto error_return;
        } else
            ++p;

        rc = substext_or_variable(p, end, config, nameclass, lookup,
                                  lookup_context, force_expand, &replace);
        if (rc < 0)
            goto error_return;
        else
            p += rc;

        if (*p != '/') {
            rc = VAR_ERR_MALFORMATTED_TRANSPOSE;
            goto error_return;
        } else
            ++p;

        if (data->begin) {
            rc = transpose(data, &search, &replace);
            if (rc < 0)
                goto error_return;
        }
        break;


    case 'p':                   /* Padding. */
        ++p;

        if (*p != '/')
            return VAR_ERR_MALFORMATTED_PADDING;
        else
            ++p;

        rc = number(p, end);
        if (rc == 0) {
            rc = VAR_ERR_MISSING_PADDING_WIDTH;
            goto error_return;
        } else {
            number1.begin = p;
            number1.end = p + rc;
            number1.buffer_size = 0;
            p += rc;
        }

        if (*p != '/') {
            rc = VAR_ERR_MALFORMATTED_PADDING;
            goto error_return;
        } else
            ++p;

        rc = substext_or_variable(p, end, config, nameclass, lookup,
                                  lookup_context, force_expand, &replace);
        if (rc < 0)
            goto error_return;
        else
            p += rc;

        if (*p != '/') {
            rc = VAR_ERR_MALFORMATTED_PADDING;
            goto error_return;
        } else
            ++p;

        if (*p != 'l' && *p != 'c' && *p != 'r') {
            rc = VAR_ERR_MALFORMATTED_PADDING;
            goto error_return;
        } else
            ++p;

        if (data->begin) {
            rc = padding(data, &number1, &replace, p[-1]);
            if (rc < 0)
                goto error_return;
        }
        break;

    default:
        return VAR_ERR_UNKNOWN_COMMAND_CHAR;
    }

    /* Exit gracefully. */

    tokenbuf_free(&tmptokbuf);
    tokenbuf_free(&search);
    tokenbuf_free(&replace);
    tokenbuf_free(&flags);
    tokenbuf_free(&number1);
    tokenbuf_free(&number2);
    return p - begin;

  error_return:
    tokenbuf_free(data);
    tokenbuf_free(&tmptokbuf);
    tokenbuf_free(&search);
    tokenbuf_free(&replace);
    tokenbuf_free(&flags);
    tokenbuf_free(&number1);
    tokenbuf_free(&number2);
    return rc;
}

static var_rc_t input(const char *begin, const char *end,
                      const var_config_t *config,
                      const char nameclass[256], var_cb_t lookup,
                      void *lookup_context, int force_expand,
                      tokenbuf_t *output)
{
    int rc;
    tokenbuf_t result;

    tokenbuf_init(&result);

    do {
        rc = text(begin, end, config->varinit, config->escape);
        if (rc > 0) {
            if (!tokenbuf_append(output, begin, rc)) {
                rc = VAR_ERR_OUT_OF_MEMORY;
                goto error_return;
            }
            begin += rc;
        } else if (rc < 0)
            goto error_return;

        rc = variable(begin, end, config, nameclass, lookup,
                      lookup_context, force_expand, &result);
        if (rc > 0) {
            if (!tokenbuf_append
                (output, result.begin, result.end - result.begin)) {
                rc = VAR_ERR_OUT_OF_MEMORY;
                goto error_return;
            } else
                begin += rc;
        } else if (rc < 0)
            goto error_return;
    }
    while (rc > 0);

    if (begin != end) {
        rc = VAR_ERR_INPUT_ISNT_TEXT_NOR_VARIABLE;
        goto error_return;
    }

    return VAR_OK;

  error_return:
    tokenbuf_free(&result);
    return rc;
}

var_rc_t var_expand(const char *input_buf, size_t input_len,
                    char **result, size_t *result_len,
                    var_cb_t lookup, void *lookup_context,
                    const var_config_t *config, int force_expand)
{
    char nameclass[256];
    var_rc_t rc;
    tokenbuf_t output;

    /* Argument sanity checks */
    if (input_buf == NULL || input_len == 0 || 
        result == NULL || result_len == NULL ||
        lookup == NULL || lookup_context == NULL)
        return VAR_ERR_INVALID_ARGUMENT;

    /* Optionally use default configuration */
    if (config == NULL)
        config = &var_config_default;

    /* Expand the class description for valid variable names. */
    if ((rc = expand_character_class(config->namechars, nameclass)) != VAR_OK)
        return rc;

    /* Make sure that the specials defined in the configuration do not
       appear in the character name class. */
    if (nameclass[(int)config->varinit] ||
        nameclass[(int)config->startdelim] ||
        nameclass[(int)config->enddelim] ||
        nameclass[(int)config->escape])
        return VAR_ERR_INVALID_CONFIGURATION;

    /* Call the parser. */
    tokenbuf_init(&output);
    if ((rc = input(input_buf, input_buf + input_len, config, nameclass,
                    lookup, lookup_context, force_expand, &output)) != VAR_OK) {
        tokenbuf_free(&output);
        return rc;
    }
    *result = (char *)output.begin;
    *result_len = output.end - output.begin;

    return VAR_OK;
}

CVSTrac 2.0.1