[tracker/parser-unicode-libs-review] FTS parser tests: disable some tests if using the glib/pango parser

From: Aleksander Morgado <aleksm src gnome org>
To: commits-list gnome org
Cc:
Subject: [tracker/parser-unicode-libs-review] FTS parser tests: disable some tests if using the glib/pango parser
Date: Thu, 20 May 2010 10:15:08 +0000 (UTC)
commit 83f65b49f2d382a3891bcc8294f2dfeedd63f550
Author: Aleksander Morgado <aleksander lanedo com>
Date:   Thu May 20 12:14:45 2010 +0200

    FTS parser tests: disable some tests if using the glib/pango parser

 tests/libtracker-fts/tracker-parser-test.c |   29 ++++++++++++++++++++++++++++
 1 files changed, 29 insertions(+), 0 deletions(-)
---
diff --git a/tests/libtracker-fts/tracker-parser-test.c b/tests/libtracker-fts/tracker-parser-test.c
index 81189e4..0364fdd 100644
--- a/tests/libtracker-fts/tracker-parser-test.c
+++ b/tests/libtracker-fts/tracker-parser-test.c
@@ -26,6 +26,23 @@
 
 #include <libtracker-fts/tracker-parser.h>
 
+/* Note
+ *  Currently, three different types of parsers are defined in libtracker-fts:
+ *    - GNU libunistring-based parser, up to 20% faster than the others, and full
+ *       unicode compliant.
+ *    - libicu-based parser, full unicode compliant but slower as it needs
+ *       conversions to/from UChars (UTF-16 encoded strings)
+ *    - glib/pango parser, not fully unicode compliant as it doesn't work properly
+ *       with decomposed strings (NFD normalized), doesn't make a unicode-based
+ *       word-breaking and doesn't make full-word casefolding.
+ *
+ * Some of the tests, thus, will be DISABLED for the GLIB/PANGO parser.
+ */
+#undef FULL_UNICODE_TESTS
+#if defined HAVE_LIBUNISTRING || defined HAVE_LIBICU
+#define FULL_UNICODE_TESTS
+#endif
+
 /* -------------- COMMON FOR ALL TESTS ----------------- */
 
 /* Fixture object type */
@@ -185,9 +202,11 @@ static const TestDataExpectedWord test_data_normalization[] = {
 	{ "Ã©cole",                "ecole" },
 	{ "Ã?COLE",                "ecole" },
 	{ "Ã?cole",                "ecole" },
+#ifdef FULL_UNICODE_TESTS /* glib/pango doesn't like NFD strings */
 	{ "e" "\xCC\x81" "cole",  "ecole" },
 	{ "E" "\xCC\x81" "COLE",  "ecole" },
 	{ "E" "\xCC\x81" "cole",  "ecole" },
+#endif
 	{ NULL,                   NULL    }
 };
 
@@ -204,9 +223,11 @@ static const TestDataExpectedWord test_data_normalization[] = {
 	{ "Ã©cole",                "Ã©cole" },
 	{ "Ã?COLE",                "Ã©cole" },
 	{ "Ã?cole",                "Ã©cole" },
+#ifdef FULL_UNICODE_TESTS /* glib/pango doesn't like NFD strings */
 	{ "e" "\xCC\x81" "cole",  "Ã©cole" },
 	{ "E" "\xCC\x81" "COLE",  "Ã©cole" },
 	{ "E" "\xCC\x81" "cole",  "Ã©cole" },
+#endif
 	{ NULL,                   NULL    }
 };
 #endif
@@ -216,19 +237,27 @@ static const TestDataExpectedWord test_data_casefolding[] = {
 	{ "gross", "gross" },
 	{ "GROSS", "gross" },
 	{ "GrOsS", "gross" },
+#ifdef FULL_UNICODE_TESTS /* glib/pango doesn't do full-word casefolding */
 	{ "groÃ?",  "gross" },
+#endif
 	{ NULL,    NULL    }
 };
 
 /* Number of expected words tests */
 static const TestDataExpectedNWords test_data_nwords[] = {
+#ifdef FULL_UNICODE_TESTS /* glib/pango thinks 32.3 are 2 words */
 	{ "The quick (\"brown\") fox canâ??t jump 32.3 feet, right?", TRUE,   8 },
 	{ "The quick (\"brown\") fox canâ??t jump 32.3 feet, right?", FALSE,  9 },
+#endif
 	{ "ã??ã?¢ã?»ã?µã??ã?¨ã?³ã?¹",                                            TRUE,   2 }, /* katakana */
+#ifdef FULL_UNICODE_TESTS /* glib/pango doesn't work properly with chinese */
 	{ "æ?¬å·?æ??ä¸»æµ?ç??é£?å?³",                                          TRUE,   8 }, /* chinese */
+#endif
 	{ "Ð?Ð¼ÐµÑ?Ð¸ÐºÐ°Ð½Ñ?ÐºÐ¸Ðµ Ñ?Ñ?Ð´Ð° Ð½Ð°Ñ?Ð¾Ð´Ñ?Ñ?Ñ?Ñ? Ð² Ð¼ÐµÐ¶Ð´Ñ?Ð½Ð°Ñ?Ð¾Ð´Ð½Ñ?Ñ? Ð²Ð¾Ð´Ð°Ñ?.",     TRUE,   6 }, /* russian */
 	{ "Báº§n chá»? lÃ  má»?t anh nghÃ¨o xÃ¡c",                           TRUE,   7 }, /* vietnamese */
+#ifdef FULL_UNICODE_TESTS /* glib/pango doesn't work properly with chinese */
 	{ "ã??ã?¢ã?»ã?µã??ã?¨ã?³ã?¹ æ?¬å·?æ??ä¸»æµ?ç??é£?å?³ katakana, chinese, english",   TRUE,  13 }, /* mixed */
+#endif
 	{ NULL,                                                     FALSE,  0 }
 };
[Date Prev][Date Next] [Thread Prev][Thread Next] [Thread Index] [Date Index] [Author Index]