always transmit const source_position_t * instead of source_position_t
[cparser] / format_check.c
index a3f10dc..52aad75 100644 (file)
@@ -1,12 +1,33 @@
+/*
+ * This file is part of cparser.
+ * Copyright (C) 2007-2008 Matthias Braun <matze@braunis.de>
+ *
+ * This program is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU General Public License
+ * as published by the Free Software Foundation; either version 2
+ * of the License, or (at your option) any later version.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this program; if not, write to the Free Software
+ * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA
+ * 02111-1307, USA.
+ */
+#include <ctype.h>
 #include <wctype.h>
 
+#include "format_check.h"
+#include "symbol_t.h"
 #include "ast_t.h"
 #include "diagnostic.h"
-#include "format_check.h"
 #include "types.h"
 #include "type_t.h"
 #include "warning.h"
-
+#include "lang_features.h"
 
 typedef enum format_flag_t {
        FMT_FLAG_NONE  = 0,
@@ -30,7 +51,12 @@ typedef enum format_length_modifier_t {
        FMT_MOD_j,
        FMT_MOD_t,
        FMT_MOD_z,
-       FMT_MOD_q
+       FMT_MOD_q,
+       /* only in microsoft mode */
+       FMT_MOD_w,
+       FMT_MOD_I,
+       FMT_MOD_I32,
+       FMT_MOD_I64
 } format_length_modifier_t;
 
 static const char* get_length_modifier_name(const format_length_modifier_t mod)
@@ -45,13 +71,18 @@ static const char* get_length_modifier_name(const format_length_modifier_t mod)
                [FMT_MOD_j]    = "j",
                [FMT_MOD_t]    = "t",
                [FMT_MOD_z]    = "z",
-               [FMT_MOD_q]    = "q"
+               [FMT_MOD_q]    = "q",
+               /* only in microsoft mode */
+               [FMT_MOD_w]    = "w",
+               [FMT_MOD_I]    = "I",
+               [FMT_MOD_I32]  = "I32",
+               [FMT_MOD_I64]  = "I64"
        };
        assert(mod < sizeof(names) / sizeof(*names));
        return names[mod];
 }
 
-static void warn_invalid_length_modifier(const source_position_t pos,
+static void warn_invalid_length_modifier(const source_position_t *pos,
                                          const format_length_modifier_t mod,
                                          const wchar_rep_t conversion)
 {
@@ -61,6 +92,56 @@ static void warn_invalid_length_modifier(const source_position_t pos,
        );
 }
 
+typedef struct vchar_t vchar_t;
+struct vchar_t {
+       const void *string;   /**< the string; read as string_t or wide_string_t by the callbacks below */
+       size_t     position;  /**< index of the current character */
+       size_t     size;      /**< size of the string */
+
+       /** return the first character of the string and set the position to 0. */
+       unsigned (*first)(vchar_t *self);
+       /** advance the position by one and return the character found there */
+       unsigned (*next)(vchar_t *self);
+       /** return non-zero if the given character is a digit */
+       int (*is_digit)(unsigned vchar);
+};
+
+static unsigned string_first(vchar_t *self) { /* rewind a narrow-string cursor */
+       const string_t *const str = self->string;
+       self->position = 0; /* restart at the first character */
+       return str->begin[self->position];
+}
+
+static unsigned string_next(vchar_t *self) { /* step a narrow-string cursor */
+       const string_t *const str = self->string;
+       self->position += 1; /* no bounds check is performed here */
+       return str->begin[self->position];
+}
+
+static int string_isdigit(unsigned vchar) { /* non-zero if the narrow-string character is a decimal digit */
+       return isdigit((unsigned char)vchar); /* <ctype.h> requires an unsigned char value (or EOF); a negative char widened to unsigned would be out of range */
+}
+
+static unsigned wstring_first(vchar_t *self) { /* rewind a wide-string cursor */
+       const wide_string_t *const wstr = self->string;
+       self->position = 0; /* restart at the first character */
+       return wstr->begin[self->position];
+}
+
+static unsigned wstring_next(vchar_t *self) { /* step a wide-string cursor */
+       const wide_string_t *const wstr = self->string;
+       self->position += 1; /* no bounds check is performed here */
+       return wstr->begin[self->position];
+}
+
+static int wstring_isdigit(unsigned vchar) { /* non-zero if the wide-string character is a decimal digit */
+       return iswdigit((wint_t)vchar);
+}
+
+static bool atend(vchar_t *self) { /* true when the cursor sits on the last index, i.e. size - 1 */
+       return self->size - self->position == 1;
+}
+
 static void check_format_arguments(const call_argument_t *const fmt_arg, const call_argument_t* arg)
 {
        const expression_t *fmt_expr = fmt_arg->expression;
@@ -68,34 +149,46 @@ static void check_format_arguments(const call_argument_t *const fmt_arg, const c
                fmt_expr = fmt_expr->unary.value;
        }
 
-       if (fmt_expr->kind != EXPR_WIDE_STRING_LITERAL)
+       vchar_t vchar;
+       if (fmt_expr->kind == EXPR_WIDE_STRING_LITERAL) {
+               vchar.string   = &fmt_expr->wide_string.value;
+               vchar.size     = fmt_expr->wide_string.value.size;
+               vchar.first    = wstring_first;
+               vchar.next     = wstring_next;
+               vchar.is_digit = wstring_isdigit;
+       } else if (fmt_expr->kind == EXPR_STRING_LITERAL) {
+               vchar.string   = &fmt_expr->string.value;
+               vchar.size     = fmt_expr->string.value.size;
+               vchar.first    = string_first;
+               vchar.next     = string_next;
+               vchar.is_digit = string_isdigit;
+       } else {
                return;
-
-       const source_position_t    pos     = fmt_expr->base.source_position;
-       const wide_string_t *const wstring = &fmt_expr->wide_string.value;
-       const wchar_rep_t *fmt = wstring->begin;
-       for (; *fmt != '\0'; ++fmt) {
-               if (*fmt != '%')
+       }
+       const source_position_t *pos = &fmt_expr->base.source_position;
+       unsigned fmt = vchar.first(&vchar);
+       for (; fmt != '\0'; fmt = vchar.next(&vchar)) {
+               if (fmt != '%')
                        continue;
-               ++fmt;
+               fmt = vchar.next(&vchar);
 
-               if (*fmt == '%')
+               if (fmt == '%')
                        continue;
 
                format_flags_t fmt_flags = FMT_FLAG_NONE;
-               if (*fmt == '0') {
-                       ++fmt;
+               if (fmt == '0') {
+                       fmt = vchar.next(&vchar);
                        fmt_flags |= FMT_FLAG_ZERO;
                }
 
                /* argument selector or minimum field width */
-               if (iswdigit(*fmt)) {
+               if (vchar.is_digit(fmt)) {
                        do {
-                               ++fmt;
-                       } while (iswdigit(*fmt));
+                               fmt = vchar.next(&vchar);
+                       } while (vchar.is_digit(fmt));
 
                        /* digit string was ... */
-                       if (*fmt == '$') {
+                       if (fmt == '$') {
                                /* ... argument selector */
                                fmt_flags = FMT_FLAG_NONE; /* reset possibly set 0-flag */
                                /* TODO implement */
@@ -106,7 +199,7 @@ static void check_format_arguments(const call_argument_t *const fmt_arg, const c
                        /* flags */
                        for (;;) {
                                format_flags_t flag;
-                               switch (*fmt) {
+                               switch (fmt) {
                                        case '#':  flag = FMT_FLAG_HASH;  break;
                                        case '0':  flag = FMT_FLAG_ZERO;  break;
                                        case '-':  flag = FMT_FLAG_MINUS; break;
@@ -129,59 +222,59 @@ static void check_format_arguments(const call_argument_t *const fmt_arg, const c
                                        default: goto break_fmt_flags;
                                }
                                if (fmt_flags & flag) {
-                                       warningf(pos, "repeated flag '%c' in conversion specification", (char)*fmt);
+                                       warningf(pos, "repeated flag '%c' in conversion specification", (char)fmt);
                                }
                                fmt_flags |= flag;
-                               ++fmt;
+                               fmt = vchar.next(&vchar);
                        }
 break_fmt_flags:
 
                        /* minimum field width */
-                       if (*fmt == '*') {
+                       if (fmt == '*') {
                                if (arg == NULL) {
                                        warningf(pos, "missing argument for '*' field width in conversion specification");
                                        return;
                                }
-                               const type_t *const arg_type = arg->expression->base.datatype;
+                               const type_t *const arg_type = arg->expression->base.type;
                                if (arg_type != type_int) {
                                        warningf(pos, "argument for '*' field width in conversion specification is not an 'int', but an '%T'", arg_type);
                                }
                                arg = arg->next;
                        } else {
-                               while (iswdigit(*fmt)) {
-                                       ++fmt;
+                               while (vchar.is_digit(fmt)) {
+                                       fmt = vchar.next(&vchar);
                                }
                        }
                }
 
                /* precision */
-               if (*fmt == '.') {
-                       ++fmt;
-                       if (*fmt == '*') {
+               if (fmt == '.') {
+                       fmt = vchar.next(&vchar);
+                       if (fmt == '*') {
                                if (arg == NULL) {
                                        warningf(pos, "missing argument for '*' precision in conversion specification");
                                        return;
                                }
-                               const type_t *const arg_type = arg->expression->base.datatype;
+                               const type_t *const arg_type = arg->expression->base.type;
                                if (arg_type != type_int) {
                                        warningf(pos, "argument for '*' precision in conversion specification is not an 'int', but an '%T'", arg_type);
                                }
                                arg = arg->next;
                        } else {
                                /* digit string may be omitted */
-                               while (iswdigit(*fmt)) {
-                                       ++fmt;
+                               while (vchar.is_digit(fmt)) {
+                                       fmt = vchar.next(&vchar);
                                }
                        }
                }
 
                /* length modifier */
                format_length_modifier_t fmt_mod;
-               switch (*fmt) {
+               switch (fmt) {
                        case 'h':
-                               ++fmt;
-                               if (*fmt == 'h') {
-                                       ++fmt;
+                               fmt = vchar.next(&vchar);
+                               if (fmt == 'h') {
+                                       fmt = vchar.next(&vchar);
                                        fmt_mod = FMT_MOD_hh;
                                } else {
                                        fmt_mod = FMT_MOD_h;
@@ -189,24 +282,60 @@ break_fmt_flags:
                                break;
 
                        case 'l':
-                               ++fmt;
-                               if (*fmt == 'l') {
-                                       ++fmt;
+                               fmt = vchar.next(&vchar);
+                               if (fmt == 'l') {
+                                       fmt = vchar.next(&vchar);
                                        fmt_mod = FMT_MOD_ll;
                                } else {
                                        fmt_mod = FMT_MOD_l;
                                }
                                break;
 
-                       case 'L': ++fmt; fmt_mod = FMT_MOD_L;    break;
-                       case 'j': ++fmt; fmt_mod = FMT_MOD_j;    break;
-                       case 't': ++fmt; fmt_mod = FMT_MOD_t;    break;
-                       case 'z': ++fmt; fmt_mod = FMT_MOD_z;    break;
-                       case 'q': ++fmt; fmt_mod = FMT_MOD_q;    break;
-                       default:         fmt_mod = FMT_MOD_NONE; break;
+                       case 'L': fmt = vchar.next(&vchar); fmt_mod = FMT_MOD_L;    break;
+                       case 'j': fmt = vchar.next(&vchar); fmt_mod = FMT_MOD_j;    break;
+                       case 't': fmt = vchar.next(&vchar); fmt_mod = FMT_MOD_t;    break;
+                       case 'z': fmt = vchar.next(&vchar); fmt_mod = FMT_MOD_z;    break;
+                       case 'q': fmt = vchar.next(&vchar); fmt_mod = FMT_MOD_q;    break;
+                       /* microsoft mode */
+                       case 'w':
+                               if (c_mode & _MS) {
+                                       fmt = vchar.next(&vchar); fmt_mod = FMT_MOD_w;
+                               } else {
+                                       fmt_mod = FMT_MOD_NONE;
+                               }
+                               break;
+                       case 'I':
+                               if (c_mode & _MS) {
+                                       fmt = vchar.next(&vchar); fmt_mod = FMT_MOD_I;
+                                       if (fmt == '3') {
+                                               fmt = vchar.next(&vchar);
+                                               if (fmt == '2') {
+                                                       fmt = vchar.next(&vchar);
+                                                       fmt_mod = FMT_MOD_I32;
+                                               } else {
+                                                       /* rewind */
+                                                       --vchar.position;
+                                               }
+                                       } else if (fmt == '6') {
+                                               fmt = vchar.next(&vchar);
+                                               if (fmt == '4') {
+                                                       fmt = vchar.next(&vchar);
+                                                       fmt_mod = FMT_MOD_I64;
+                                               } else {
+                                                       /* rewind */
+                                                       --vchar.position;
+                                               }
+                                       }
+                               } else {
+                                       fmt_mod = FMT_MOD_NONE;
+                               }
+                               break;
+                       default:
+                               fmt_mod = FMT_MOD_NONE;
+                               break;
                }
 
-               if (*fmt == '\0') {
+               if (fmt == '\0') {
                        warningf(pos, "dangling %% in format string");
                        break;
                }
@@ -214,7 +343,7 @@ break_fmt_flags:
                const type_t      *expected_type;
                type_qualifiers_t  expected_qual = TYPE_QUALIFIER_NONE;
                format_flags_t     allowed_flags;
-               switch (*fmt) {
+               switch (fmt) {
                        case 'd':
                        case 'i':
                                switch (fmt_mod) {
@@ -226,9 +355,12 @@ break_fmt_flags:
                                        case FMT_MOD_j:    expected_type = type_intmax_t;  break;
                                        case FMT_MOD_z:    expected_type = type_ssize_t;   break;
                                        case FMT_MOD_t:    expected_type = type_ptrdiff_t; break;
+                                       case FMT_MOD_I:    expected_type = type_ptrdiff_t; break;
+                                       case FMT_MOD_I32:  expected_type = type_int32;     break;
+                                       case FMT_MOD_I64:  expected_type = type_int64;     break;
 
                                        default:
-                                               warn_invalid_length_modifier(pos, fmt_mod, *fmt);
+                                               warn_invalid_length_modifier(pos, fmt_mod, fmt);
                                                goto next_arg;
                                }
                                allowed_flags = FMT_FLAG_MINUS | FMT_FLAG_SPACE | FMT_FLAG_PLUS | FMT_FLAG_ZERO;
@@ -253,9 +385,12 @@ eval_fmt_mod_unsigned:
                                        case FMT_MOD_j:    expected_type = type_uintmax_t;          break;
                                        case FMT_MOD_z:    expected_type = type_size_t;             break;
                                        case FMT_MOD_t:    expected_type = type_uptrdiff_t;         break;
+                                       case FMT_MOD_I:    expected_type = type_size_t;             break;
+                                       case FMT_MOD_I32:  expected_type = type_unsigned_int32;     break;
+                                       case FMT_MOD_I64:  expected_type = type_unsigned_int64;     break;
 
                                        default:
-                                               warn_invalid_length_modifier(pos, fmt_mod, *fmt);
+                                               warn_invalid_length_modifier(pos, fmt_mod, fmt);
                                                goto next_arg;
                                }
                                break;
@@ -274,7 +409,7 @@ eval_fmt_mod_unsigned:
                                        case FMT_MOD_L:    expected_type = type_long_double; break;
 
                                        default:
-                                               warn_invalid_length_modifier(pos, fmt_mod, *fmt);
+                                               warn_invalid_length_modifier(pos, fmt_mod, fmt);
                                                goto next_arg;
                                }
                                allowed_flags = FMT_FLAG_MINUS | FMT_FLAG_SPACE | FMT_FLAG_PLUS | FMT_FLAG_HASH | FMT_FLAG_ZERO;
@@ -282,7 +417,7 @@ eval_fmt_mod_unsigned:
 
                        case 'C':
                                if (fmt_mod != FMT_MOD_NONE) {
-                                       warn_invalid_length_modifier(pos, fmt_mod, *fmt);
+                                       warn_invalid_length_modifier(pos, fmt_mod, fmt);
                                        goto next_arg;
                                }
                                expected_type = type_wchar_t;
@@ -292,11 +427,12 @@ eval_fmt_mod_unsigned:
                        case 'c':
                                expected_type = type_int;
                                switch (fmt_mod) {
-                                       case FMT_MOD_NONE: expected_type = type_int;    break; /* TODO promoted char */
-                                       case FMT_MOD_l:    expected_type = type_wint_t; break;
+                                       case FMT_MOD_NONE: expected_type = type_int;     break; /* TODO promoted char */
+                                       case FMT_MOD_l:    expected_type = type_wint_t;  break;
+                                       case FMT_MOD_w:    expected_type = type_wchar_t; break;
 
                                        default:
-                                               warn_invalid_length_modifier(pos, fmt_mod, *fmt);
+                                               warn_invalid_length_modifier(pos, fmt_mod, fmt);
                                                goto next_arg;
                                }
                                allowed_flags = FMT_FLAG_NONE;
@@ -304,7 +440,7 @@ eval_fmt_mod_unsigned:
 
                        case 'S':
                                if (fmt_mod != FMT_MOD_NONE) {
-                                       warn_invalid_length_modifier(pos, fmt_mod, *fmt);
+                                       warn_invalid_length_modifier(pos, fmt_mod, fmt);
                                        goto next_arg;
                                }
                                expected_type = type_wchar_t_ptr;
@@ -314,11 +450,12 @@ eval_fmt_mod_unsigned:
 
                        case 's':
                                switch (fmt_mod) {
-                                       case FMT_MOD_NONE: expected_type = type_string;      break;
+                                       case FMT_MOD_NONE: expected_type = type_char_ptr;    break;
                                        case FMT_MOD_l:    expected_type = type_wchar_t_ptr; break;
+                                       case FMT_MOD_w:    expected_type = type_wchar_t_ptr; break;
 
                                        default:
-                                               warn_invalid_length_modifier(pos, fmt_mod, *fmt);
+                                               warn_invalid_length_modifier(pos, fmt_mod, fmt);
                                                goto next_arg;
                                }
                                expected_qual = TYPE_QUALIFIER_CONST;
@@ -327,7 +464,7 @@ eval_fmt_mod_unsigned:
 
                        case 'p':
                                if (fmt_mod != FMT_MOD_NONE) {
-                                       warn_invalid_length_modifier(pos, fmt_mod, *fmt);
+                                       warn_invalid_length_modifier(pos, fmt_mod, fmt);
                                        goto next_arg;
                                }
                                expected_type = type_void_ptr;
@@ -346,14 +483,14 @@ eval_fmt_mod_unsigned:
                                        case FMT_MOD_t:    expected_type = type_ptrdiff_t_ptr;   break;
 
                                        default:
-                                               warn_invalid_length_modifier(pos, fmt_mod, *fmt);
+                                               warn_invalid_length_modifier(pos, fmt_mod, fmt);
                                                goto next_arg;
                                }
                                allowed_flags = FMT_FLAG_NONE;
                                break;
 
                        default:
-                               warningf(pos, "encountered unknown conversion specifier '%%%C'", (wint_t)*fmt);
+                               warningf(pos, "encountered unknown conversion specifier '%%%C'", (wint_t)fmt);
                                goto next_arg;
                }
 
@@ -368,7 +505,7 @@ eval_fmt_mod_unsigned:
                }
 
                {       /* create a scope here to prevent warning about the jump to next_arg */
-                       type_t *const arg_type = arg->expression->base.datatype;
+                       type_t *const arg_type = arg->expression->base.type;
                        if (is_type_pointer(expected_type)) {
                                type_t *const arg_skip = skip_typeref(arg_type);
                                if (is_type_pointer(arg_skip)) {
@@ -387,13 +524,13 @@ eval_fmt_mod_unsigned:
                        if (is_type_valid(arg_type)) {
                                warningf(pos,
                                        "argument type '%T' does not match conversion specifier '%%%s%c'",
-                                       arg_type, get_length_modifier_name(fmt_mod), (char)*fmt);
+                                       arg_type, get_length_modifier_name(fmt_mod), (char)fmt);
                        }
                }
 next_arg:
                arg = arg->next;
        }
-       if (fmt + 1 != wstring->begin + wstring->size) {
+       if (!atend(&vchar)) {
                warningf(pos, "format string contains NUL");
        }
        if (arg != NULL) {
@@ -403,7 +540,7 @@ next_arg:
 
 void check_format(const call_expression_t *const call)
 {
-       if (!warning.check_format)
+       if (!warning.format)
                return;
 
        const expression_t *const func_expr = call->function;
@@ -414,8 +551,13 @@ void check_format(const call_expression_t *const call)
        const call_argument_t *      arg  = call->arguments;
        if (strcmp(name, "wprintf") == 0) { /* TODO gammlig */
                check_format_arguments(arg, arg->next);
+       } else if (strcmp(name, "printf") == 0) {
+               check_format_arguments(arg, arg->next);
        } else if (strcmp(name, "swprintf") == 0) {
                arg = arg->next->next; /* skip destination buffer and size */
                check_format_arguments(arg, arg->next);
+       } else if (strcmp(name, "sprintf") == 0) {
+               arg = arg->next->next; /* skip destination buffer and size */
+               check_format_arguments(arg, arg->next);
        }
 }