From 74ca21a41bcb5a49d19e65c9ba88f1f864cb7095 Mon Sep 17 00:00:00 2001
From: "Rafael G. Martins" <rafael@rafaelmartins.eng.br>
Date: Sat, 3 Sep 2016 19:57:54 +0200
Subject: *: big code reorganization.

- source and tests are now splitted by target
- utils lib is now called common

still pending move error.c from blogc to common
---
 tests/common/check_utf8.c | 101 ++++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 101 insertions(+)
 create mode 100644 tests/common/check_utf8.c

(limited to 'tests/common/check_utf8.c')
diff --git a/tests/common/check_utf8.c b/tests/common/check_utf8.c
new file mode 100644
index 0000000..d104265
--- /dev/null
+++ b/tests/common/check_utf8.c
@@ -0,0 +1,101 @@
+/*
+ * blogc: A blog compiler.
+ * Copyright (C) 2015-2016 Rafael G. Martins <rafael@rafaelmartins.eng.br>
+ *
+ * This program can be distributed under the terms of the BSD License.
+ * See the file LICENSE.
+ */
+
+#include <stdarg.h>
+#include <stddef.h>
+#include <setjmp.h>
+#include <cmocka.h>
+#include <stdbool.h>
+#include <stdint.h>
+#include <string.h>
+#include "../../src/common/utf8.h"
+#include "../../src/common/utils.h"
+
+// this file MUST be ASCII
+
+
+static void
+test_utf8_valid(void **state)
+{
+    const char *c = "<a href=\"{{ BASE_URL }}/page/{{ PREVIOUS_PAGE }}/\">"
+        "\xc2\xab Newer posts</a>";
+    assert_true(blogc_utf8_validate((uint8_t*) c, strlen(c)));
+    const uint8_t d[3] = {0xe2, 0x82, 0xac};  // euro sign
+    assert_true(blogc_utf8_validate(d, 3));
+    const uint8_t e[3] = {0xef, 0xbb, 0xbf};  // utf-8 bom
+    assert_true(blogc_utf8_validate(e, 3));
+}
+
+
+static void
+test_utf8_invalid(void **state)
+{
+    const uint8_t c[4] = {0xff, 0xfe, 0xac, 0x20};  // utf-16
+    assert_false(blogc_utf8_validate(c, 4));
+    const uint8_t d[8] = {0xff, 0xfe, 0x00, 0x00, 0xac, 0x20, 0x00, 0x00};  // utf-32
+    assert_false(blogc_utf8_validate(d, 8));
+}
+
+
+static void
+test_utf8_valid_str(void **state)
+{
+    sb_string_t *s = sb_string_new();
+    sb_string_append(s,
+        "<a href=\"{{ BASE_URL }}/page/{{ PREVIOUS_PAGE }}/\">\xc2\xab Newer "
+        "posts</a>");
+    assert_true(blogc_utf8_validate_str(s));
+    sb_string_free(s, true);
+    s = sb_string_new();
+    sb_string_append(s, "\xe2\x82\xac");
+    assert_true(blogc_utf8_validate_str(s));
+    sb_string_free(s, true);
+}
+
+
+static void
+test_utf8_invalid_str(void **state)
+{
+    sb_string_t *s = sb_string_new();
+    sb_string_append(s, "\xff\xfe\xac\x20");  // utf-16
+    assert_false(blogc_utf8_validate_str(s));
+    sb_string_free(s, true);
+    s = sb_string_new();
+    sb_string_append(s, "\xff\xfe\x00\x00\xac\x20\x00\x00");  // utf-32
+    assert_false(blogc_utf8_validate_str(s));
+    sb_string_free(s, true);
+}
+
+
+static void
+test_utf8_skip_bom(void **state)
+{
+    const uint8_t c[4] = {0xef, 0xbb, 0xbf, 0};
+    assert_int_equal(blogc_utf8_skip_bom(c, 2), 0);
+    assert_int_equal(blogc_utf8_skip_bom(c, 3), 3);
+    assert_string_equal(c + 3, "");
+    const uint8_t d[8] = {0xef, 0xbb, 0xbf, 'b', 'o', 'l', 'a', 0};
+    assert_int_equal(blogc_utf8_skip_bom(d, 7), 3);
+    assert_string_equal(d + 3, "bola");
+    const uint8_t e[5] = "bola";
+    assert_int_equal(blogc_utf8_skip_bom(e, 4), 0);
+}
+
+
+int
+main(void)
+{
+    const UnitTest tests[] = {
+        unit_test(test_utf8_valid),
+        unit_test(test_utf8_invalid),
+        unit_test(test_utf8_valid_str),
+        unit_test(test_utf8_invalid_str),
+        unit_test(test_utf8_skip_bom),
+    };
+    return run_tests(tests);
+}
-- 
cgit v1.2.3-18-g5258