Expand parser and Unicode test coverage

2009-07-18 15:59:55 +03:00 · 2009-07-18 15:59:55 +03:00 · 20efe4aa26
parent 9240146c10
commit 20efe4aa26
7 changed files with 123 additions and 17 deletions
--- a/test/run-test
+++ b/test/run-test
@ -16,15 +16,12 @@ run_testprog() {
    esac
 }
-if [ ! -f $TESTFILE ]; then
+for testfile in $TESTFILES; do
-    echo "$TESTFILE cannot be found" >&2
+    mkdir -p $TMPDIR
-    exit 1
+    ${srcdir}/split-testfile.py $testfile $TMPDIR | while read input output; do
-fi
+        run_test load_dump $input $output
-
+        run_test loadf_dumpf $input $output
-mkdir -p $TMPDIR
+        run_test loads_dumps $input $output
-${srcdir}/split-testfile.py $TESTFILE $TMPDIR | \
+    done || exit 1
-while read input output; do
+    rm -rf $TMPDIR
    run_test load_dump $input $output
    run_test loadf_dumpf $input $output
    run_test loads_dumps $input $output
 done
--- a/test/split-testfile.py
+++ b/test/split-testfile.py
@ -17,8 +17,8 @@ def main():
        print 'usage: %s input-file output-directory' % sys.argv[0]
        return 2
-    infile = sys.argv[1]
+    infile = os.path.normpath(sys.argv[1])
-    outdir = sys.argv[2]
+    outdir = os.path.normpath(sys.argv[2])
    if not os.path.exists(outdir):
        print >>sys.stderr, 'output directory %r does not exist!' % outdir
@ -40,7 +40,7 @@ def main():
            current.write(line)
    close_files(input, output)
-    print >>sys.stderr, "%d test cases" % (i + 1)
+    print >>sys.stderr, "%s: %d test cases" % (infile, i + 1)
 if __name__ == '__main__':
    sys.exit(main() or 0)
--- a/test/test-invalid
+++ b/test/test-invalid
@ -1,6 +1,6 @@
 #!/bin/sh
-TESTFILE="${srcdir}/testdata/invalid"
+TESTFILES="${srcdir}/testdata/invalid ${srcdir}/testdata/invalid-unicode"
 TMPDIR="tmp"
 run_test() {
--- a/test/test-valid
+++ b/test/test-valid
@ -1,6 +1,6 @@
 #!/bin/sh
-TESTFILE="${srcdir}/testdata/valid"
+TESTFILES="${srcdir}/testdata/valid"
 TMPDIR="tmp"
 run_test() {
--- a/test/testdata/invalid
+++ b/test/testdata/invalid
@ -77,6 +77,11 @@ unexpected token near end of file
 1
 unexpected newline near '"a'
 ========
 {"a":"a" 123}
 ====
 1
 '}' expected near '123'
 ========
 {[
 ====
 1
@ -132,6 +137,16 @@ invalid token near '0'
 1
 invalid token near '-0'
 ========
 [troo
 ====
 1
 invalid token near 'troo'
 ========
 ["\a <-- invalid escape"]
 ====
 1
 invalid escape near '"\'
 ========
 ["	 <-- tab character"]
 ====
 1
@ -156,3 +171,8 @@ invalid Unicode '\uD888\u3210'
 ====
 1
 invalid Unicode '\uDFAA'
 ========
 å
 ====
 1
 '[' or '{' expected near 'å'
--- a/test/testdata/invalid-unicode
+++ b/test/testdata/invalid-unicode
@ -0,0 +1,89 @@
 å
 ====
 -1
 unable to decode byte 0xe5 at position 0
 ========
 ["å <-- invalid UTF-8"]
 ====
 -1
 unable to decode byte 0xe5 at position 2
 ========
 [å]
 ====
 -1
 unable to decode byte 0xe5 at position 1
 ========
 [aå]
 ====
 -1
 unable to decode byte 0xe5 at position 2
 ========
 ["\uå"]
 ====
 -1
 unable to decode byte 0xe5 at position 4
 ========
 ["\å"]
 ====
 -1
 unable to decode byte 0xe5 at position 3
 ========
 [0å]
 ====
 -1
 unable to decode byte 0xe5 at position 2
 ========
 [123å]
 ====
 -1
 unable to decode byte 0xe5 at position 4
 ========
 [1eå]
 ====
 -1
 unable to decode byte 0xe5 at position 3
 ========
 [1e1å]
 ====
 -1
 unable to decode byte 0xe5 at position 4
 ========
 ["<22>"]
 ====
 -1
 unable to decode byte 0x81 at position 2
 ========
 ["Á"]
 ====
 -1
 unable to decode byte 0xc1 at position 2
 ========
 ["ý"]
 ====
 -1
 unable to decode byte 0xfd at position 2
 ========
 ["ô¿¿¿"]
 ====
 -1
 unable to decode byte 0xf4 at position 2
 ========
 ["à€¢ <-- overlong encoding"]
 ====
 -1
 unable to decode byte 0xe0 at position 2
 ========
 ["ð€€¢ <-- overlong encoding"]
 ====
 -1
 unable to decode byte 0xf0 at position 2
 ========
 ["àÿ <-- truncated UTF-8"]
 ====
 -1
 unable to decode byte 0xe0 at position 2
 ========
 ["í¢« <-- encoded surrogate half"]
 ====
 -1
 unable to decode byte 0xed at position 2
--- a/test/testdata/valid
+++ b/test/testdata/valid
@ -4,7 +4,7 @@
 ========
 ["abcdefghijklmnopqrstuvwxyz1234567890 "]
 ========
-["€þıœəßð some utf-8 ĸʒ×ŋµåäö"]
+["€þıœəßð some utf-8 ĸʒ×ŋµåäö𝄞"]
 ========
 ["\"\\\/\b\f\n\r\t"]
 ========