diff options
Diffstat (limited to 'src/config_parse.c')
-rw-r--r-- | src/config_parse.c | 576 |
1 files changed, 0 insertions, 576 deletions
diff --git a/src/config_parse.c b/src/config_parse.c deleted file mode 100644 index 9f95e67d7..000000000 --- a/src/config_parse.c +++ /dev/null @@ -1,576 +0,0 @@ -/* - * Copyright (C) the libgit2 contributors. All rights reserved. - * - * This file is part of libgit2, distributed under the GNU GPL v2 with - * a Linking Exception. For full terms see the included COPYING file. - */ - -#include "config_parse.h" - -#include <ctype.h> - -const char *git_config_escapes = "ntb\"\\"; -const char *git_config_escaped = "\n\t\b\"\\"; - -static void set_parse_error(git_config_parser *reader, int col, const char *error_str) -{ - if (col) - git_error_set(GIT_ERROR_CONFIG, - "failed to parse config file: %s (in %s:%"PRIuZ", column %d)", - error_str, reader->path, reader->ctx.line_num, col); - else - git_error_set(GIT_ERROR_CONFIG, - "failed to parse config file: %s (in %s:%"PRIuZ")", - error_str, reader->path, reader->ctx.line_num); -} - - -GIT_INLINE(int) config_keychar(int c) -{ - return isalnum(c) || c == '-'; -} - -static int strip_comments(char *line, int in_quotes) -{ - int quote_count = in_quotes, backslash_count = 0; - char *ptr; - - for (ptr = line; *ptr; ++ptr) { - if (ptr[0] == '"' && ptr > line && ptr[-1] != '\\') - quote_count++; - - if ((ptr[0] == ';' || ptr[0] == '#') && - (quote_count % 2) == 0 && - (backslash_count % 2) == 0) { - ptr[0] = '\0'; - break; - } - - if (ptr[0] == '\\') - backslash_count++; - else - backslash_count = 0; - } - - /* skip any space at the end */ - while (ptr > line && git__isspace(ptr[-1])) { - ptr--; - } - ptr[0] = '\0'; - - return quote_count; -} - - -static int parse_subsection_header(git_config_parser *reader, const char *line, size_t pos, const char *base_name, char **section_name) -{ - int c, rpos; - const char *first_quote, *last_quote; - const char *line_start = line; - git_buf buf = GIT_BUF_INIT; - size_t quoted_len, alloc_len, base_name_len = strlen(base_name); - - /* Skip any additional whitespace before our section name */ - while (git__isspace(line[pos])) - pos++; - - /* We should be at the first quotation mark. */ - if (line[pos] != '"') { - set_parse_error(reader, 0, "missing quotation marks in section header"); - goto end_error; - } - - first_quote = &line[pos]; - last_quote = strrchr(line, '"'); - quoted_len = last_quote - first_quote; - - if ((last_quote - line) > INT_MAX) { - set_parse_error(reader, 0, "invalid section header, line too long"); - goto end_error; - } - - if (quoted_len == 0) { - set_parse_error(reader, 0, "missing closing quotation mark in section header"); - goto end_error; - } - - GIT_ERROR_CHECK_ALLOC_ADD(&alloc_len, base_name_len, quoted_len); - GIT_ERROR_CHECK_ALLOC_ADD(&alloc_len, alloc_len, 2); - - if (git_buf_grow(&buf, alloc_len) < 0 || - git_buf_printf(&buf, "%s.", base_name) < 0) - goto end_error; - - rpos = 0; - - line = first_quote; - c = line[++rpos]; - - /* - * At the end of each iteration, whatever is stored in c will be - * added to the string. In case of error, jump to out - */ - do { - - switch (c) { - case 0: - set_parse_error(reader, 0, "unexpected end-of-line in section header"); - goto end_error; - - case '"': - goto end_parse; - - case '\\': - c = line[++rpos]; - - if (c == 0) { - set_parse_error(reader, rpos, "unexpected end-of-line in section header"); - goto end_error; - } - - default: - break; - } - - git_buf_putc(&buf, (char)c); - c = line[++rpos]; - } while (line + rpos < last_quote); - -end_parse: - if (git_buf_oom(&buf)) - goto end_error; - - if (line[rpos] != '"' || line[rpos + 1] != ']') { - set_parse_error(reader, rpos, "unexpected text after closing quotes"); - git_buf_dispose(&buf); - return -1; - } - - *section_name = git_buf_detach(&buf); - return (int)(&line[rpos + 2] - line_start); /* rpos is at the closing quote */ - -end_error: - git_buf_dispose(&buf); - - return -1; -} - -static int parse_section_header(git_config_parser *reader, char **section_out) -{ - char *name, *name_end; - int name_length, c, pos; - int result; - char *line; - size_t line_len; - - git_parse_advance_ws(&reader->ctx); - line = git__strndup(reader->ctx.line, reader->ctx.line_len); - if (line == NULL) - return -1; - - /* find the end of the variable's name */ - name_end = strrchr(line, ']'); - if (name_end == NULL) { - git__free(line); - set_parse_error(reader, 0, "missing ']' in section header"); - return -1; - } - - GIT_ERROR_CHECK_ALLOC_ADD(&line_len, (size_t)(name_end - line), 1); - name = git__malloc(line_len); - GIT_ERROR_CHECK_ALLOC(name); - - name_length = 0; - pos = 0; - - /* Make sure we were given a section header */ - c = line[pos++]; - GIT_ASSERT(c == '['); - - c = line[pos++]; - - do { - if (git__isspace(c)){ - name[name_length] = '\0'; - result = parse_subsection_header(reader, line, pos, name, section_out); - git__free(line); - git__free(name); - return result; - } - - if (!config_keychar(c) && c != '.') { - set_parse_error(reader, pos, "unexpected character in header"); - goto fail_parse; - } - - name[name_length++] = (char)git__tolower(c); - - } while ((c = line[pos++]) != ']'); - - if (line[pos - 1] != ']') { - set_parse_error(reader, pos, "unexpected end of file"); - goto fail_parse; - } - - git__free(line); - - name[name_length] = 0; - *section_out = name; - - return pos; - -fail_parse: - git__free(line); - git__free(name); - return -1; -} - -static int skip_bom(git_parse_ctx *parser) -{ - git_buf buf = GIT_BUF_INIT_CONST(parser->content, parser->content_len); - git_buf_bom_t bom; - int bom_offset = git_buf_detect_bom(&bom, &buf); - - if (bom == GIT_BUF_BOM_UTF8) - git_parse_advance_chars(parser, bom_offset); - - /* TODO: reference implementation is pretty stupid with BoM */ - - return 0; -} - -/* - (* basic types *) - digit = "0".."9" - integer = digit { digit } - alphabet = "a".."z" + "A" .. "Z" - - section_char = alphabet | "." | "-" - extension_char = (* any character except newline *) - any_char = (* any character *) - variable_char = "alphabet" | "-" - - - (* actual grammar *) - config = { section } - - section = header { definition } - - header = "[" section [subsection | subsection_ext] "]" - - subsection = "." section - subsection_ext = "\"" extension "\"" - - section = section_char { section_char } - extension = extension_char { extension_char } - - definition = variable_name ["=" variable_value] "\n" - - variable_name = variable_char { variable_char } - variable_value = string | boolean | integer - - string = quoted_string | plain_string - quoted_string = "\"" plain_string "\"" - plain_string = { any_char } - - boolean = boolean_true | boolean_false - boolean_true = "yes" | "1" | "true" | "on" - boolean_false = "no" | "0" | "false" | "off" -*/ - -/* '\"' -> '"' etc */ -static int unescape_line( - char **out, bool *is_multi, const char *ptr, int quote_count) -{ - char *str, *fixed, *esc; - size_t ptr_len = strlen(ptr), alloc_len; - - *is_multi = false; - - if (GIT_ADD_SIZET_OVERFLOW(&alloc_len, ptr_len, 1) || - (str = git__malloc(alloc_len)) == NULL) { - return -1; - } - - fixed = str; - - while (*ptr != '\0') { - if (*ptr == '"') { - quote_count++; - } else if (*ptr != '\\') { - *fixed++ = *ptr; - } else { - /* backslash, check the next char */ - ptr++; - /* if we're at the end, it's a multiline, so keep the backslash */ - if (*ptr == '\0') { - *is_multi = true; - goto done; - } - if ((esc = strchr(git_config_escapes, *ptr)) != NULL) { - *fixed++ = git_config_escaped[esc - git_config_escapes]; - } else { - git__free(str); - git_error_set(GIT_ERROR_CONFIG, "invalid escape at %s", ptr); - return -1; - } - } - ptr++; - } - -done: - *fixed = '\0'; - *out = str; - - return 0; -} - -static int parse_multiline_variable(git_config_parser *reader, git_buf *value, int in_quotes) -{ - int quote_count; - bool multiline = true; - - while (multiline) { - char *line = NULL, *proc_line = NULL; - int error; - - /* Check that the next line exists */ - git_parse_advance_line(&reader->ctx); - line = git__strndup(reader->ctx.line, reader->ctx.line_len); - GIT_ERROR_CHECK_ALLOC(line); - - /* - * We've reached the end of the file, there is no continuation. - * (this is not an error). - */ - if (line[0] == '\0') { - error = 0; - goto out; - } - - /* If it was just a comment, pretend it didn't exist */ - quote_count = strip_comments(line, in_quotes); - if (line[0] == '\0') - goto next; - - if ((error = unescape_line(&proc_line, &multiline, - line, in_quotes)) < 0) - goto out; - - /* Add this line to the multiline var */ - if ((error = git_buf_puts(value, proc_line)) < 0) - goto out; - -next: - git__free(line); - git__free(proc_line); - in_quotes = quote_count; - continue; - -out: - git__free(line); - git__free(proc_line); - return error; - } - - return 0; -} - -GIT_INLINE(bool) is_namechar(char c) -{ - return isalnum(c) || c == '-'; -} - -static int parse_name( - char **name, const char **value, git_config_parser *reader, const char *line) -{ - const char *name_end = line, *value_start; - - *name = NULL; - *value = NULL; - - while (*name_end && is_namechar(*name_end)) - name_end++; - - if (line == name_end) { - set_parse_error(reader, 0, "invalid configuration key"); - return -1; - } - - value_start = name_end; - - while (*value_start && git__isspace(*value_start)) - value_start++; - - if (*value_start == '=') { - *value = value_start + 1; - } else if (*value_start) { - set_parse_error(reader, 0, "invalid configuration key"); - return -1; - } - - if ((*name = git__strndup(line, name_end - line)) == NULL) - return -1; - - return 0; -} - -static int parse_variable(git_config_parser *reader, char **var_name, char **var_value) -{ - const char *value_start = NULL; - char *line = NULL, *name = NULL, *value = NULL; - int quote_count, error; - bool multiline; - - *var_name = NULL; - *var_value = NULL; - - git_parse_advance_ws(&reader->ctx); - line = git__strndup(reader->ctx.line, reader->ctx.line_len); - GIT_ERROR_CHECK_ALLOC(line); - - quote_count = strip_comments(line, 0); - - if ((error = parse_name(&name, &value_start, reader, line)) < 0) - goto out; - - /* - * Now, let's try to parse the value - */ - if (value_start != NULL) { - while (git__isspace(value_start[0])) - value_start++; - - if ((error = unescape_line(&value, &multiline, value_start, 0)) < 0) - goto out; - - if (multiline) { - git_buf multi_value = GIT_BUF_INIT; - git_buf_attach(&multi_value, value, 0); - value = NULL; - - if (parse_multiline_variable(reader, &multi_value, quote_count % 2) < 0 || - git_buf_oom(&multi_value)) { - error = -1; - git_buf_dispose(&multi_value); - goto out; - } - - value = git_buf_detach(&multi_value); - } - } - - *var_name = name; - *var_value = value; - name = NULL; - value = NULL; - -out: - git__free(name); - git__free(value); - git__free(line); - return error; -} - -int git_config_parser_init(git_config_parser *out, const char *path, const char *data, size_t datalen) -{ - out->path = path; - return git_parse_ctx_init(&out->ctx, data, datalen); -} - -void git_config_parser_dispose(git_config_parser *parser) -{ - git_parse_ctx_clear(&parser->ctx); -} - -int git_config_parse( - git_config_parser *parser, - git_config_parser_section_cb on_section, - git_config_parser_variable_cb on_variable, - git_config_parser_comment_cb on_comment, - git_config_parser_eof_cb on_eof, - void *payload) -{ - git_parse_ctx *ctx; - char *current_section = NULL, *var_name = NULL, *var_value = NULL; - int result = 0; - - ctx = &parser->ctx; - - skip_bom(ctx); - - for (; ctx->remain_len > 0; git_parse_advance_line(ctx)) { - const char *line_start; - size_t line_len; - char c; - - restart: - line_start = ctx->line; - line_len = ctx->line_len; - - /* - * Get either first non-whitespace character or, if that does - * not exist, the first whitespace character. This is required - * to preserve whitespaces when writing back the file. - */ - if (git_parse_peek(&c, ctx, GIT_PARSE_PEEK_SKIP_WHITESPACE) < 0 && - git_parse_peek(&c, ctx, 0) < 0) - continue; - - switch (c) { - case '[': /* section header, new section begins */ - git__free(current_section); - current_section = NULL; - - result = parse_section_header(parser, ¤t_section); - if (result < 0) - break; - - git_parse_advance_chars(ctx, result); - - if (on_section) - result = on_section(parser, current_section, line_start, line_len, payload); - /* - * After we've parsed the section header we may not be - * done with the line. If there's still data in there, - * run the next loop with the rest of the current line - * instead of moving forward. - */ - - if (!git_parse_peek(&c, ctx, GIT_PARSE_PEEK_SKIP_WHITESPACE)) - goto restart; - - break; - - case '\n': /* comment or whitespace-only */ - case '\r': - case ' ': - case '\t': - case ';': - case '#': - if (on_comment) { - result = on_comment(parser, line_start, line_len, payload); - } - break; - - default: /* assume variable declaration */ - if ((result = parse_variable(parser, &var_name, &var_value)) == 0 && on_variable) { - result = on_variable(parser, current_section, var_name, var_value, line_start, line_len, payload); - git__free(var_name); - git__free(var_value); - } - - break; - } - - if (result < 0) - goto out; - } - - if (on_eof) - result = on_eof(parser, current_section, payload); - -out: - git__free(current_section); - return result; -} |