From bb98f3fd2887468ada6b3cee7cdccd05b809c545 Mon Sep 17 00:00:00 2001
From: Galen Charlton <gmc@esilibrary.com>
Date: Wed, 10 Apr 2013 20:18:10 -0400
Subject: [PATCH] start adding pgTAP test cases

pgTAP is a unit testing framework for PostgreSQL; more information
about it can be found at http://pgtap.org/

This commit introduces the first pgTAP test case, which exercises
the NACO normalization functions.

To run the tests, install pgTAP, create an Evergreen database that
contains (for now) just the seed data, and from the top of the
source tree run

pg_prove -vr -U evergreen Open-ILS/src/sql/Pg/t/*

Replace '-U evergreen' with the psql command-line switches
needed to access your database.

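To install pgTAP on a Debian Wheezy system, install the distribution's
pgTAP package with apt-get (the exact command is missing from this
message, possibly because it was written on a line beginning with '#').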

Then, to load the pgTAP extension into the database, run

psql> CREATE EXTENSION pgtap;

Signed-off-by: Galen Charlton <gmc@esilibrary.com>
Signed-off-by: Mike Rylander <mrylander@gmail.com>
---
 Open-ILS/src/sql/Pg/t/naco_normalize.sql | 44 ++++++++++++++++++++++++
 1 file changed, 44 insertions(+)
 create mode 100644 Open-ILS/src/sql/Pg/t/naco_normalize.sql

diff --git a/Open-ILS/src/sql/Pg/t/naco_normalize.sql b/Open-ILS/src/sql/Pg/t/naco_normalize.sql
new file mode 100644
index 0000000000..0e59107e99
--- /dev/null
+++ b/Open-ILS/src/sql/Pg/t/naco_normalize.sql
@@ -0,0 +1,44 @@
+BEGIN;
+
+SELECT plan(25); -- must match the number of is() assertions in this script
+
+CREATE FUNCTION nfkd(TEXT) RETURNS TEXT AS $$ -- test helper: returns its argument in Unicode NFKD form
+    use strict;
+    use warnings;
+    use Unicode::Normalize qw(NFKD);
+    # The single TEXT argument arrives as the first element of @_.
+    return NFKD($_[0]);
+$$ LANGUAGE PLPERLU STABLE;
+
+SELECT is( public.naco_normalize('abc'), 'abc', 'regular text' );
+SELECT is( public.naco_normalize('ABC'), 'abc', 'uppercase text is lowercased' );
+SELECT is( public.naco_normalize('åbçdéñœöîøæÇıÂÅÍÎÏÓÔÒÚÆŒè'), 'abcdenoeoioaeciaaiiiooouaeoee', 'European diacritics' ); -- NOTE(review): capitals rebuilt from garbled bytes to fit the expected value; confirm
+SELECT is( public.naco_normalize('“‘„«quotes»’”'), 'quotes', 'special quotes' ); -- NOTE(review): exact quotation marks rebuilt from garbled bytes; confirm
+SELECT is( public.naco_normalize(E'\u0098abc\u009C def'), 'def', 'special non-filing characters designation' ); -- NOTE(review): U+0098/U+009C inferred; escapes are exactly 4 hex digits
+SELECT is( public.naco_normalize(E'\u0098abcdef'), 'abcdef', 'unpaired start of string' ); -- NOTE(review): U+0098 inferred from the description; \u0098 is followed by literal 'abcdef'
+SELECT is( public.naco_normalize('ß'), 'ss', 'sharp S (eszett)' );
+SELECT is( public.naco_normalize('ﬂﬁﬀ'), 'flfiff', 'ligatures' );
+SELECT is( public.naco_normalize('ƠơƯư²Ĳĳ'), 'oouu2ijij', 'NFKD applied correctly' );
+SELECT is( public.naco_normalize('ÆØÞæðøþĐđıŁłŒœʻʼℓ'), 'aeothaedothddilloeoel', 'part 3.6' );
+SELECT is( public.naco_normalize('Ð'), 'd', 'uppercase eth (missing from 3.6?)' );
+SELECT is( public.naco_normalize('ıİ'), 'ii', 'Turkish I' );
+SELECT is( public.naco_normalize('[book''s cover]'), 'books cover', 'square brackets and apostrophe' );
+SELECT is( public.naco_normalize('  grue   food '), 'grue food', 'trim spaces' );
+-- the expected Korean value is passed through nfkd(): the test expects the Hangul back in NFKD (decomposed) form
+SELECT is( public.naco_normalize('한국어 조선말'), nfkd('한국어 조선말'), 'Korean text' );
+SELECT is( public.naco_normalize('普通話 / 普通话'), '普通話 普通话', 'Chinese text' );
+SELECT is( public.naco_normalize('العربية'), 'العربية', 'Arabic text' );
+SELECT is( public.naco_normalize('ქართული ენა'), 'ქართული ენა', 'Georgian text' );
+SELECT is( public.naco_normalize('русский язык'), 'русскии язык', 'Russian text' ); -- expected value has и where the input has й
+SELECT is( public.naco_normalize(E'\r\npa\tper\f'), 'paper', 'other whitespace' );
+SELECT is( public.naco_normalize('#1: — C++, @ home & abroad'), '#1 c++ @ home & abroad', 'other punctuation' ); -- NOTE(review): the mark after "#1:" was unrecoverable; em dash assumed, confirm
+SELECT is( public.naco_normalize('٠١٢٣٤٥'), '012345', 'other decimal digits' );
+SELECT is( public.naco_normalize('²³¹'), '231', 'superscript numbers' );
+SELECT is( public.naco_normalize('♭©®♯'), '♭ ♯', 'other symbols' );
+
+-- Two-argument form: with 'a' as the second argument the test expects the first comma to be kept.
+SELECT is( public.naco_normalize('Smith, Jane. Poet, painter, and author', 'a'), 'smith, jane poet painter and author', 'retain first comma' );
+
+SELECT * FROM finish(); -- emit the pgTAP summary for the planned tests
+
+ROLLBACK; -- discard everything created since BEGIN, including the nfkd() helper
-- 
2.43.2