libtests: Include the Unicode test files directly.

author Mark Wooding <mdw@distorted.org.uk>

Sat, 2 Dec 2017 21:44:38 +0000 (21:44 +0000)

committer Mark Wooding <mdw@distorted.org.uk>

Sat, 2 Dec 2017 22:18:21 +0000 (22:18 +0000)
author Mark Wooding <mdw@distorted.org.uk>
Sat, 2 Dec 2017 21:44:38 +0000 (21:44 +0000)
committer Mark Wooding <mdw@distorted.org.uk>
Sat, 2 Dec 2017 22:18:21 +0000 (22:18 +0000)
diff --git a/README b/README

index 5daf7b71ddc6364281902e594f6323a6b2f6295e..80e8d175421c4a297fd7d8038fdc8e83dd65d111 100644 (file)
--- a/README
+++ b/README
@@ -282,6 +282,8 @@ Portions extracted from MPG321, http://mpg321.sourceforge.net/
    Copyright (C) 2000-2001 Robert Leslie
  Portions Copyright (C) 1997-2006 Free Software Foundation, Inc.
  Portions Copyright (C) 2000 Red Hat, Inc., Jonathan Blandford <jrb@redhat.com>
    Copyright (C) 2000-2001 Robert Leslie
  Portions Copyright (C) 1997-2006 Free Software Foundation, Inc.
  Portions Copyright (C) 2000 Red Hat, Inc., Jonathan Blandford <jrb@redhat.com>
+Unicode test files Copyright (C) 1991-2017 Unicode Inc.; see
+  libtests/COPYING.unicode-tests for details.
  Binaries may derive extra copyright owners through linkage (binary distributors
  are expected to do their own legwork)
  
  Binaries may derive extra copyright owners through linkage (binary distributors
  are expected to do their own legwork)
  
diff --git a/libtests/COPYING.unicode-tests b/libtests/COPYING.unicode-tests

new file mode 100644 (file)

index 0000000..b456a04
--- /dev/null
+++ b/libtests/COPYING.unicode-tests
@@ -0,0 +1,38 @@
+[The Unicode test files GraphemeBreakTest.txt, NormalizationTest.txt,
+and WordBreakTest.txt, included in this directory, are copyright (c)
+1991--2017 Unicode Inc., and subject to the license conditions below, as
+published at https://www.unicode.org/copyright.html.  These files are
+used for testing, but are not required at runtime.  In particular, they
+are not included in binary packages.  -- [mdw]]
+
+Copyright © 1991-2017 Unicode, Inc. All rights reserved.
+Distributed under the Terms of Use in http://www.unicode.org/copyright.html.
+
+Permission is hereby granted, free of charge, to any person obtaining
+a copy of the Unicode data files and any associated documentation
+(the "Data Files") or Unicode software and any associated documentation
+(the "Software") to deal in the Data Files or Software
+without restriction, including without limitation the rights to use,
+copy, modify, merge, publish, distribute, and/or sell copies of
+the Data Files or Software, and to permit persons to whom the Data Files
+or Software are furnished to do so, provided that either
+(a) this copyright and permission notice appear with all copies
+of the Data Files or Software, or
+(b) this copyright and permission notice appear in associated
+Documentation.
+
+THE DATA FILES AND SOFTWARE ARE PROVIDED "AS IS", WITHOUT WARRANTY OF
+ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE
+WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
+NONINFRINGEMENT OF THIRD PARTY RIGHTS.
+IN NO EVENT SHALL THE COPYRIGHT HOLDER OR HOLDERS INCLUDED IN THIS
+NOTICE BE LIABLE FOR ANY CLAIM, OR ANY SPECIAL INDIRECT OR CONSEQUENTIAL
+DAMAGES, OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE,
+DATA OR PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER
+TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR
+PERFORMANCE OF THE DATA FILES OR SOFTWARE.
+
+Except as contained in this notice, the name of a copyright holder
+shall not be used in advertising or otherwise to promote the sale,
+use or other dealings in these Data Files or Software without prior
+written authorization of the copyright holder.
diff --git a/libtests/GraphemeBreakTest.txt.gz b/libtests/GraphemeBreakTest.txt.gz

new file mode 100644 (file)

index 0000000..128d91f

Binary files /dev/null and b/libtests/GraphemeBreakTest.txt.gz differ
diff --git a/libtests/Makefile.am b/libtests/Makefile.am

index e4a9eb0fb779d1c628df2aa7246e591ede7209fd..83a7f97e52184ed63d98725e7cec3a21a29dde32 100644 (file)
--- a/libtests/Makefile.am
+++ b/libtests/Makefile.am
@@ -56,6 +56,7 @@ t_split_SOURCES=t-split.c test.c test.h
  t_syscalls_SOURCES=t-syscalls.c test.c test.h
  t_trackname_SOURCES=t-trackname.c test.c test.h
  t_unicode_SOURCES=t-unicode.c test.c test.h
  t_syscalls_SOURCES=t-syscalls.c test.c test.h
  t_trackname_SOURCES=t-trackname.c test.c test.h
  t_unicode_SOURCES=t-unicode.c test.c test.h
+t_unicode_CFLAGS=$(AM_CFLAGS) -DSRCDIR=\"$(srcdir)\"
  t_url_SOURCES=t-url.c test.c test.h
  t_utf8_SOURCES=t-utf8.c test.c test.h
  t_vector_SOURCES=t-vector.c test.c test.h
  t_url_SOURCES=t-url.c test.c test.h
  t_utf8_SOURCES=t-utf8.c test.c test.h
  t_vector_SOURCES=t-vector.c test.c test.h
@@ -74,9 +75,22 @@ before-check:
  make-coverage-reports: check
         cd ../lib && ${GCOV} *.c | ${PYTHON} ../scripts/format-gcov-report --html . *.c
  
  make-coverage-reports: check
         cd ../lib && ${GCOV} *.c | ${PYTHON} ../scripts/format-gcov-report --html . *.c
  
-EXTRA_DIST=t-macros-1.tmpl t-macros-2
+UNICODE_TEST_FILES=GraphemeBreakTest NormalizationTest WordBreakTest
+UNICODE_TEST_BASE_URL=https://www.unicode.org/Public/6.0.0/ucd
+GraphemeBreakTest_URL=$(UNICODE_TEST_BASE_URL)/auxiliary/GraphemeBreakTest.txt
+NormalizationTest_URL=$(UNICODE_TEST_BASE_URL)/NormalizationTest.txt
+WordBreakTest_URL=$(UNICODE_TEST_BASE_URL)/auxiliary/WordBreakTest.txt
+update-unicode-tests:
+       set -e; \
+       for t in $(foreach t,$(UNICODE_TEST_FILES),$t:$($t_URL)); do \
+         f=$${t%%:*} u=$${t#*:}; \
+         echo $$f $$u; \
+         rm -f $$f.new $$f.new.gz; wget -O$$f.new $$u; \
+         gzip -9cv $$f.new >$$f.new.gz; \
+         mv -f $$f.new.gz $(srcdir)/$$f.txt.gz; rm -f $$f.new; \
+       done
  
  
-CLEANFILES=*.gcda *.gcov *.gcno *.c.html index.html
+EXTRA_DIST=t-macros-1.tmpl t-macros-2 \
+       COPYING.unicode-tests $(addsuffix .txt.gz, $(UNICODE_TEST_FILES))
  
  
-DISTCLEANFILES=GraphemeBreakTest.txt NormalizationTest.txt     \
-              WordBreakTest.txt
+CLEANFILES=*.gcda *.gcov *.gcno *.c.html index.html
diff --git a/libtests/NormalizationTest.txt.gz b/libtests/NormalizationTest.txt.gz

new file mode 100644 (file)

index 0000000..6524991

Binary files /dev/null and b/libtests/NormalizationTest.txt.gz differ
diff --git a/libtests/WordBreakTest.txt.gz b/libtests/WordBreakTest.txt.gz

new file mode 100644 (file)

index 0000000..72c0193

Binary files /dev/null and b/libtests/WordBreakTest.txt.gz differ
diff --git a/libtests/t-unicode.c b/libtests/t-unicode.c

index 2a199e35deaac777272194917290d40c63af2fec..6ab20f5d8270bb258d515ab3ece0c95dc05c1e9c 100644 (file)
--- a/libtests/t-unicode.c
+++ b/libtests/t-unicode.c
@@ -17,30 +17,30 @@
   */
  #include "test.h"
  
   */
  #include "test.h"
  
+#ifndef SRCDIR
+# define SRCDIR "."
+#endif
+
  /** @brief Open a Unicode test file */
  static FILE *open_unicode_test(const char *path) {
  /** @brief Open a Unicode test file */
  static FILE *open_unicode_test(const char *path) {
-  const char *base;
    FILE *fp;
    char buffer[1024];
    FILE *fp;
    char buffer[1024];
-  int w;
  
  
-  if((base = strrchr(path, '/')))
-    ++base;
-  else
-    base = path;
-  if(!(fp = fopen(base, "r"))) {
-    snprintf(buffer, sizeof buffer,
-             "wget http://www.unicode.org/Public/6.0.0/ucd/%s", path);
-    if((w = system(buffer)))
-      disorder_fatal(0, "%s: %s", buffer, wstat(w));
-    if(chmod(base, 0444) < 0)
-      disorder_fatal(errno, "chmod %s", base);
-    if(!(fp = fopen(base, "r")))
-      disorder_fatal(errno, "%s", base);
-  }
+  snprintf(buffer, sizeof buffer, "gzip -dc " SRCDIR "/%s.gz", path);
+  if(!(fp = popen(buffer, "r")))
+    disorder_fatal(errno, "decompressing %s", path);
    return fp;
  }
  
    return fp;
  }
  
+/** @brief Close a Unicode test file, dying if pclose() or gzip failed */
+static void close_unicode_test(const char *path, FILE *fp)
+{
+  int w = pclose(fp);
+  /* -1 is pclose() itself failing (errno set), not a wait status for wstat() */
+  if(w < 0) disorder_fatal(errno, "closing pipe for %s", path);
+  if(w) disorder_fatal(0, "decompressing %s: %s", path, wstat(w));
+}
+
  /** @brief Run breaking tests for utf32_grapheme_boundary() etc */
  static void breaktest(const char *path,
                        int (*breakfn)(const uint32_t *, size_t, size_t)) {
  /** @brief Run breaking tests for utf32_grapheme_boundary() etc */
  static void breaktest(const char *path,
                        int (*breakfn)(const uint32_t *, size_t, size_t)) {
@@ -94,7 +94,7 @@ static void breaktest(const char *path,
      }
      xfree(l);
    }
      }
      xfree(l);
    }
-  fclose(fp);
+  close_unicode_test(path, fp);
  }
  
  /** @brief Tests for @ref lib/unicode.h */
  }
  
  /** @brief Tests for @ref lib/unicode.h */
@@ -179,9 +179,9 @@ static void test_unicode(void) {
      }
      xfree(l);
    }
      }
      xfree(l);
    }
-  fclose(fp);
-  breaktest("auxiliary/GraphemeBreakTest.txt", utf32_is_grapheme_boundary);
-  breaktest("auxiliary/WordBreakTest.txt", utf32_is_word_boundary);
+  close_unicode_test("NormalizationTest.txt", fp);
+  breaktest("GraphemeBreakTest.txt", utf32_is_grapheme_boundary);
+  breaktest("WordBreakTest.txt", utf32_is_word_boundary);
    insist(utf32_combining_class(0x40000) == 0);
    insist(utf32_combining_class(0xE0000) == 0);
  }
    insist(utf32_combining_class(0x40000) == 0);
    insist(utf32_combining_class(0xE0000) == 0);
  }
author	Mark Wooding <mdw@distorted.org.uk>
	Sat, 2 Dec 2017 21:44:38 +0000 (21:44 +0000)
committer	Mark Wooding <mdw@distorted.org.uk>
	Sat, 2 Dec 2017 22:18:21 +0000 (22:18 +0000)
README		patch | blob | blame | history
libtests/COPYING.unicode-tests	[new file with mode: 0644]	patch | blob
libtests/GraphemeBreakTest.txt.gz	[new file with mode: 0644]	patch | blob
libtests/Makefile.am		patch | blob | blame | history
libtests/NormalizationTest.txt.gz	[new file with mode: 0644]	patch | blob
libtests/WordBreakTest.txt.gz	[new file with mode: 0644]	patch | blob
libtests/t-unicode.c		patch | blob | blame | history