blob: d596ff3d893452a0abbde1f407de7c0c292ed3b7 [file] [log] [blame]
David K. Bainbridge215e0242017-09-05 23:18:24 -07001// Copyright 2011 The Go Authors. All rights reserved.
2// Use of this source code is governed by a BSD-style
3// license that can be found in the LICENSE file.
4
5package norm
6
7import (
8 "fmt"
9 "testing"
10
11 "golang.org/x/text/transform"
12)
13
14func TestTransform(t *testing.T) {
15 tests := []struct {
16 f Form
17 in, out string
18 eof bool
19 dstSize int
20 err error
21 }{
22 {NFC, "ab", "ab", true, 2, nil},
23 {NFC, "qx", "qx", true, 2, nil},
24 {NFD, "qx", "qx", true, 2, nil},
25 {NFC, "", "", true, 1, nil},
26 {NFD, "", "", true, 1, nil},
27 {NFC, "", "", false, 1, nil},
28 {NFD, "", "", false, 1, nil},
29
30 // Normalized segment does not fit in destination.
31 {NFD, "ö", "", true, 1, transform.ErrShortDst},
32 {NFD, "ö", "", true, 2, transform.ErrShortDst},
33
34 // As an artifact of the algorithm, only full segments are written.
35 // This is not strictly required, and some bytes could be written.
36 // In practice, for Transform to not block, the destination buffer
37 // should be at least MaxSegmentSize to work anyway and these edge
38 // conditions will be relatively rare.
39 {NFC, "ab", "", true, 1, transform.ErrShortDst},
40 // This is even true for inert runes.
41 {NFC, "qx", "", true, 1, transform.ErrShortDst},
42 {NFC, "a\u0300abc", "\u00e0a", true, 4, transform.ErrShortDst},
43
44 // We cannot write a segment if successive runes could still change the result.
45 {NFD, "ö", "", false, 3, transform.ErrShortSrc},
46 {NFC, "a\u0300", "", false, 4, transform.ErrShortSrc},
47 {NFD, "a\u0300", "", false, 4, transform.ErrShortSrc},
48 {NFC, "ö", "", false, 3, transform.ErrShortSrc},
49
50 {NFC, "a\u0300", "", true, 1, transform.ErrShortDst},
51 // Theoretically could fit, but won't due to simplified checks.
52 {NFC, "a\u0300", "", true, 2, transform.ErrShortDst},
53 {NFC, "a\u0300", "", true, 3, transform.ErrShortDst},
54 {NFC, "a\u0300", "\u00e0", true, 4, nil},
55
56 {NFD, "öa\u0300", "o\u0308", false, 8, transform.ErrShortSrc},
57 {NFD, "öa\u0300ö", "o\u0308a\u0300", true, 8, transform.ErrShortDst},
58 {NFD, "öa\u0300ö", "o\u0308a\u0300", false, 12, transform.ErrShortSrc},
59
60 // Illegal input is copied verbatim.
61 {NFD, "\xbd\xb2=\xbc ", "\xbd\xb2=\xbc ", true, 8, nil},
62 }
63 b := make([]byte, 100)
64 for i, tt := range tests {
65 nDst, _, err := tt.f.Transform(b[:tt.dstSize], []byte(tt.in), tt.eof)
66 out := string(b[:nDst])
67 if out != tt.out || err != tt.err {
68 t.Errorf("%d: was %+q (%v); want %+q (%v)", i, out, err, tt.out, tt.err)
69 }
70 if want := tt.f.String(tt.in)[:nDst]; want != out {
71 t.Errorf("%d: incorrect normalization: was %+q; want %+q", i, out, want)
72 }
73 }
74}
75
76var transBufSizes = []int{
77 MaxTransformChunkSize,
78 3 * MaxTransformChunkSize / 2,
79 2 * MaxTransformChunkSize,
80 3 * MaxTransformChunkSize,
81 100 * MaxTransformChunkSize,
82}
83
84func doTransNorm(f Form, buf []byte, b []byte) []byte {
85 acc := []byte{}
86 for p := 0; p < len(b); {
87 nd, ns, _ := f.Transform(buf[:], b[p:], true)
88 p += ns
89 acc = append(acc, buf[:nd]...)
90 }
91 return acc
92}
93
94func TestTransformNorm(t *testing.T) {
95 for _, sz := range transBufSizes {
96 buf := make([]byte, sz)
97 runNormTests(t, fmt.Sprintf("Transform:%d", sz), func(f Form, out []byte, s string) []byte {
98 return doTransNorm(f, buf, append(out, s...))
99 })
100 }
101}