599 lines
11 KiB
Go
599 lines
11 KiB
Go
|
package utf8s
|
|||
|
|
|||
|
import (
|
|||
|
"io"
|
|||
|
"strings"
|
|||
|
|
|||
|
"testing"
|
|||
|
)
|
|||
|
|
|||
|
func TestRuneReader(t *testing.T) {
|
|||
|
|
|||
|
tests := []struct{
|
|||
|
Reader io.Reader
|
|||
|
ExpectedRune rune
|
|||
|
ExpectedInt int
|
|||
|
}{
|
|||
|
{
|
|||
|
Reader: strings.NewReader("a"),
|
|||
|
ExpectedRune: 'a',
|
|||
|
ExpectedInt: 1,
|
|||
|
},
|
|||
|
{
|
|||
|
Reader: strings.NewReader("ap"),
|
|||
|
ExpectedRune: 'a',
|
|||
|
ExpectedInt: 1,
|
|||
|
},
|
|||
|
{
|
|||
|
Reader: strings.NewReader("app"),
|
|||
|
ExpectedRune: 'a',
|
|||
|
ExpectedInt: 1,
|
|||
|
},
|
|||
|
{
|
|||
|
Reader: strings.NewReader("appl"),
|
|||
|
ExpectedRune: 'a',
|
|||
|
ExpectedInt: 1,
|
|||
|
},
|
|||
|
{
|
|||
|
Reader: strings.NewReader("apple"),
|
|||
|
ExpectedRune: 'a',
|
|||
|
ExpectedInt: 1,
|
|||
|
},
|
|||
|
|
|||
|
|
|||
|
|
|||
|
{
|
|||
|
Reader: strings.NewReader("b"),
|
|||
|
ExpectedRune: 'b',
|
|||
|
ExpectedInt: 1,
|
|||
|
},
|
|||
|
{
|
|||
|
Reader: strings.NewReader("ba"),
|
|||
|
ExpectedRune: 'b',
|
|||
|
ExpectedInt: 1,
|
|||
|
},
|
|||
|
{
|
|||
|
Reader: strings.NewReader("ban"),
|
|||
|
ExpectedRune: 'b',
|
|||
|
ExpectedInt: 1,
|
|||
|
},
|
|||
|
{
|
|||
|
Reader: strings.NewReader("bana"),
|
|||
|
ExpectedRune: 'b',
|
|||
|
ExpectedInt: 1,
|
|||
|
},
|
|||
|
{
|
|||
|
Reader: strings.NewReader("banan"),
|
|||
|
ExpectedRune: 'b',
|
|||
|
ExpectedInt: 1,
|
|||
|
},
|
|||
|
{
|
|||
|
Reader: strings.NewReader("banana"),
|
|||
|
ExpectedRune: 'b',
|
|||
|
ExpectedInt: 1,
|
|||
|
},
|
|||
|
|
|||
|
|
|||
|
|
|||
|
{
|
|||
|
Reader: strings.NewReader("c"),
|
|||
|
ExpectedRune: 'c',
|
|||
|
ExpectedInt: 1,
|
|||
|
},
|
|||
|
{
|
|||
|
Reader: strings.NewReader("ch"),
|
|||
|
ExpectedRune: 'c',
|
|||
|
ExpectedInt: 1,
|
|||
|
},
|
|||
|
{
|
|||
|
Reader: strings.NewReader("che"),
|
|||
|
ExpectedRune: 'c',
|
|||
|
ExpectedInt: 1,
|
|||
|
},
|
|||
|
{
|
|||
|
Reader: strings.NewReader("cher"),
|
|||
|
ExpectedRune: 'c',
|
|||
|
ExpectedInt: 1,
|
|||
|
},
|
|||
|
{
|
|||
|
Reader: strings.NewReader("cherr"),
|
|||
|
ExpectedRune: 'c',
|
|||
|
ExpectedInt: 1,
|
|||
|
},
|
|||
|
{
|
|||
|
Reader: strings.NewReader("cherry"),
|
|||
|
ExpectedRune: 'c',
|
|||
|
ExpectedInt: 1,
|
|||
|
},
|
|||
|
|
|||
|
|
|||
|
|
|||
|
{
|
|||
|
Reader: strings.NewReader("A"),
|
|||
|
ExpectedRune: 'A',
|
|||
|
ExpectedInt: 1,
|
|||
|
},
|
|||
|
|
|||
|
|
|||
|
|
|||
|
{
|
|||
|
Reader: strings.NewReader("r"),
|
|||
|
ExpectedRune: 'r',
|
|||
|
ExpectedInt: 1,
|
|||
|
},
|
|||
|
|
|||
|
|
|||
|
|
|||
|
{
|
|||
|
Reader: strings.NewReader("¡"),
|
|||
|
ExpectedRune: '¡',
|
|||
|
ExpectedInt: 2,
|
|||
|
},
|
|||
|
{
|
|||
|
Reader: strings.NewReader("¡!"),
|
|||
|
ExpectedRune: '¡',
|
|||
|
ExpectedInt: 2,
|
|||
|
},
|
|||
|
|
|||
|
|
|||
|
|
|||
|
{
|
|||
|
Reader: strings.NewReader("۵"),
|
|||
|
ExpectedRune: '۵',
|
|||
|
ExpectedInt: 2,
|
|||
|
},
|
|||
|
{
|
|||
|
Reader: strings.NewReader("۵5"),
|
|||
|
ExpectedRune: '۵',
|
|||
|
ExpectedInt: 2,
|
|||
|
},
|
|||
|
|
|||
|
|
|||
|
|
|||
|
{
|
|||
|
Reader: strings.NewReader("‱"),
|
|||
|
ExpectedRune: '‱',
|
|||
|
ExpectedInt: 3,
|
|||
|
},
|
|||
|
{
|
|||
|
Reader: strings.NewReader("‱%"),
|
|||
|
ExpectedRune: '‱',
|
|||
|
ExpectedInt: 3,
|
|||
|
},
|
|||
|
|
|||
|
|
|||
|
|
|||
|
{
|
|||
|
Reader: strings.NewReader("≡"),
|
|||
|
ExpectedRune: '≡',
|
|||
|
ExpectedInt: 3,
|
|||
|
},
|
|||
|
{
|
|||
|
Reader: strings.NewReader("≡="),
|
|||
|
ExpectedRune: '≡',
|
|||
|
ExpectedInt: 3,
|
|||
|
},
|
|||
|
|
|||
|
|
|||
|
|
|||
|
{
|
|||
|
Reader: strings.NewReader("𐏕"),
|
|||
|
ExpectedRune: '𐏕',
|
|||
|
ExpectedInt: 4,
|
|||
|
},
|
|||
|
{
|
|||
|
Reader: strings.NewReader("𐏕100"),
|
|||
|
ExpectedRune: '𐏕',
|
|||
|
ExpectedInt: 4,
|
|||
|
},
|
|||
|
|
|||
|
|
|||
|
|
|||
|
{
|
|||
|
Reader: strings.NewReader("🙂"),
|
|||
|
ExpectedRune: '🙂',
|
|||
|
ExpectedInt: 4,
|
|||
|
},
|
|||
|
{
|
|||
|
Reader: strings.NewReader("🙂:-)"),
|
|||
|
ExpectedRune: '🙂',
|
|||
|
ExpectedInt: 4,
|
|||
|
},
|
|||
|
|
|||
|
|
|||
|
|
|||
|
{
|
|||
|
Reader: strings.NewReader("\u0000"),
|
|||
|
ExpectedRune: 0x0,
|
|||
|
ExpectedInt: 1,
|
|||
|
},
|
|||
|
{
|
|||
|
Reader: strings.NewReader("\u0001"),
|
|||
|
ExpectedRune: 0x1,
|
|||
|
ExpectedInt: 1,
|
|||
|
},
|
|||
|
{
|
|||
|
Reader: strings.NewReader("\u007e"),
|
|||
|
ExpectedRune: 0x7e,
|
|||
|
ExpectedInt: 1,
|
|||
|
},
|
|||
|
{
|
|||
|
Reader: strings.NewReader("\u007f"),
|
|||
|
ExpectedRune: 0x7f,
|
|||
|
ExpectedInt: 1,
|
|||
|
},
|
|||
|
|
|||
|
|
|||
|
|
|||
|
{
|
|||
|
Reader: strings.NewReader("\u0080"),
|
|||
|
ExpectedRune: 0x80,
|
|||
|
ExpectedInt: 2,
|
|||
|
},
|
|||
|
{
|
|||
|
Reader: strings.NewReader("\u0081"),
|
|||
|
ExpectedRune: 0x81,
|
|||
|
ExpectedInt: 2,
|
|||
|
},
|
|||
|
{
|
|||
|
Reader: strings.NewReader("\u07fe"),
|
|||
|
ExpectedRune: 0x7fe,
|
|||
|
ExpectedInt: 2,
|
|||
|
},
|
|||
|
{
|
|||
|
Reader: strings.NewReader("\u07ff"),
|
|||
|
ExpectedRune: 0x7ff,
|
|||
|
ExpectedInt: 2,
|
|||
|
},
|
|||
|
|
|||
|
|
|||
|
|
|||
|
{
|
|||
|
Reader: strings.NewReader("\u0800"),
|
|||
|
ExpectedRune: 0x800,
|
|||
|
ExpectedInt: 3,
|
|||
|
},
|
|||
|
{
|
|||
|
Reader: strings.NewReader("\u0801"),
|
|||
|
ExpectedRune: 0x801,
|
|||
|
ExpectedInt: 3,
|
|||
|
},
|
|||
|
{
|
|||
|
Reader: strings.NewReader("\ufffe"),
|
|||
|
ExpectedRune: 0xfffe,
|
|||
|
ExpectedInt: 3,
|
|||
|
},
|
|||
|
{
|
|||
|
Reader: strings.NewReader("\uffff"),
|
|||
|
ExpectedRune: 0xffff,
|
|||
|
ExpectedInt: 3,
|
|||
|
},
|
|||
|
|
|||
|
|
|||
|
|
|||
|
{
|
|||
|
Reader: strings.NewReader("\U00010000"),
|
|||
|
ExpectedRune: 0x10000,
|
|||
|
ExpectedInt: 4,
|
|||
|
},
|
|||
|
{
|
|||
|
Reader: strings.NewReader("\U00010001"),
|
|||
|
ExpectedRune: 0x10001,
|
|||
|
ExpectedInt: 4,
|
|||
|
},
|
|||
|
{
|
|||
|
Reader: strings.NewReader("\U0010fffe"),
|
|||
|
ExpectedRune: 0x10fffe,
|
|||
|
ExpectedInt: 4,
|
|||
|
},
|
|||
|
{
|
|||
|
Reader: strings.NewReader("\U0010ffff"),
|
|||
|
ExpectedRune: 0x10ffff,
|
|||
|
ExpectedInt: 4,
|
|||
|
},
|
|||
|
}
|
|||
|
|
|||
|
|
|||
|
for testNumber, test := range tests {
|
|||
|
runeReader := NewRuneReader(test.Reader)
|
|||
|
|
|||
|
actualRune, actualInt, err := runeReader.ReadRune()
|
|||
|
if nil != err {
|
|||
|
t.Errorf("For test #%d, did not expect an error, but actually got one: (%T) %q", testNumber, err, err)
|
|||
|
t.Errorf("\tEXPECTED: %s", FormatBinary(test.ExpectedRune))
|
|||
|
t.Errorf("\tACTUAL: %s", FormatBinary(actualRune))
|
|||
|
continue
|
|||
|
}
|
|||
|
if expected, actual := test.ExpectedRune, actualRune; expected != actual {
|
|||
|
t.Errorf("For test #%d, expected %q (0x%X), but actually got %q (0x%X).", testNumber, expected, expected, actual, actual)
|
|||
|
t.Errorf("\tEXPECTED: %s", FormatBinary(test.ExpectedRune))
|
|||
|
t.Errorf("\tACTUAL: %s", FormatBinary(actualRune))
|
|||
|
continue
|
|||
|
}
|
|||
|
if expected, actual := test.ExpectedInt, actualInt; expected != actual {
|
|||
|
t.Errorf("For test #%d, expected %d, but actually got %d.", testNumber, expected, actual)
|
|||
|
t.Errorf("\tEXPECTED: %s", FormatBinary(test.ExpectedRune))
|
|||
|
t.Errorf("\tACTUAL: %s", FormatBinary(actualRune))
|
|||
|
continue
|
|||
|
}
|
|||
|
|
|||
|
}
|
|||
|
}
|
|||
|
|
|||
|
func TestRuneReaders(t *testing.T) {
|
|||
|
|
|||
|
tests := []struct{
|
|||
|
Reader io.Reader
|
|||
|
Expected []rune
|
|||
|
}{
|
|||
|
{ // 0
|
|||
|
Reader: strings.NewReader("a"),
|
|||
|
Expected: []rune{'a'},
|
|||
|
},
|
|||
|
{ // 1
|
|||
|
Reader: strings.NewReader("ap"),
|
|||
|
Expected: []rune{'a','p'},
|
|||
|
},
|
|||
|
{ // 2
|
|||
|
Reader: strings.NewReader("app"),
|
|||
|
Expected: []rune{'a','p','p'},
|
|||
|
},
|
|||
|
{ // 3
|
|||
|
Reader: strings.NewReader("appl"),
|
|||
|
Expected: []rune{'a','p','p','l'},
|
|||
|
},
|
|||
|
{ // 4
|
|||
|
Reader: strings.NewReader("apple"),
|
|||
|
Expected: []rune{'a','p','p','l','e'},
|
|||
|
},
|
|||
|
|
|||
|
|
|||
|
|
|||
|
{ // 5
|
|||
|
Reader: strings.NewReader("b"),
|
|||
|
Expected: []rune{'b'},
|
|||
|
},
|
|||
|
{ // 6
|
|||
|
Reader: strings.NewReader("ba"),
|
|||
|
Expected: []rune{'b','a'},
|
|||
|
},
|
|||
|
{ // 7
|
|||
|
Reader: strings.NewReader("ban"),
|
|||
|
Expected: []rune{'b','a','n'},
|
|||
|
},
|
|||
|
{ // 8
|
|||
|
Reader: strings.NewReader("bana"),
|
|||
|
Expected: []rune{'b','a','n','a'},
|
|||
|
},
|
|||
|
{ // 9
|
|||
|
Reader: strings.NewReader("banan"),
|
|||
|
Expected: []rune{'b','a','n','a','n'},
|
|||
|
},
|
|||
|
{ // 10
|
|||
|
Reader: strings.NewReader("banana"),
|
|||
|
Expected: []rune{'b','a','n','a','n','a'},
|
|||
|
},
|
|||
|
|
|||
|
|
|||
|
|
|||
|
{ // 11
|
|||
|
Reader: strings.NewReader("c"),
|
|||
|
Expected: []rune{'c'},
|
|||
|
},
|
|||
|
{ // 12
|
|||
|
Reader: strings.NewReader("ch"),
|
|||
|
Expected: []rune{'c','h'},
|
|||
|
},
|
|||
|
{ // 13
|
|||
|
Reader: strings.NewReader("che"),
|
|||
|
Expected: []rune{'c','h','e'},
|
|||
|
},
|
|||
|
{ // 14
|
|||
|
Reader: strings.NewReader("cher"),
|
|||
|
Expected: []rune{'c','h','e','r'},
|
|||
|
},
|
|||
|
{ // 15
|
|||
|
Reader: strings.NewReader("cherr"),
|
|||
|
Expected: []rune{'c','h','e','r','r'},
|
|||
|
},
|
|||
|
{ // 16
|
|||
|
Reader: strings.NewReader("cherry"),
|
|||
|
Expected: []rune{'c','h','e','r','r','y'},
|
|||
|
},
|
|||
|
|
|||
|
|
|||
|
|
|||
|
{ // 17
|
|||
|
Reader: strings.NewReader("A"),
|
|||
|
Expected: []rune{'A'},
|
|||
|
},
|
|||
|
|
|||
|
|
|||
|
|
|||
|
{ // 18
|
|||
|
Reader: strings.NewReader("r"),
|
|||
|
Expected: []rune{'r'},
|
|||
|
},
|
|||
|
|
|||
|
|
|||
|
|
|||
|
{ // 19
|
|||
|
Reader: strings.NewReader("¡"),
|
|||
|
Expected: []rune{'¡'},
|
|||
|
},
|
|||
|
{ // 20
|
|||
|
Reader: strings.NewReader("¡!"),
|
|||
|
Expected: []rune{'¡','!'},
|
|||
|
},
|
|||
|
|
|||
|
|
|||
|
|
|||
|
{ // 21
|
|||
|
Reader: strings.NewReader("۵"),
|
|||
|
Expected: []rune{'۵'},
|
|||
|
},
|
|||
|
{ // 22
|
|||
|
Reader: strings.NewReader("۵5"),
|
|||
|
Expected: []rune{'۵','5'},
|
|||
|
},
|
|||
|
|
|||
|
|
|||
|
|
|||
|
{ // 23
|
|||
|
Reader: strings.NewReader("‱"),
|
|||
|
Expected: []rune{'‱'},
|
|||
|
},
|
|||
|
{ // 24
|
|||
|
Reader: strings.NewReader("‱%"),
|
|||
|
Expected: []rune{'‱','%'},
|
|||
|
},
|
|||
|
|
|||
|
|
|||
|
|
|||
|
{ // 25
|
|||
|
Reader: strings.NewReader("≡"),
|
|||
|
Expected: []rune{'≡'},
|
|||
|
},
|
|||
|
{ // 26
|
|||
|
Reader: strings.NewReader("≡="),
|
|||
|
Expected: []rune{'≡', '='},
|
|||
|
},
|
|||
|
|
|||
|
|
|||
|
|
|||
|
{ // 27
|
|||
|
Reader: strings.NewReader("𐏕"),
|
|||
|
Expected: []rune{'𐏕'},
|
|||
|
},
|
|||
|
{ // 28
|
|||
|
Reader: strings.NewReader("𐏕100"),
|
|||
|
Expected: []rune{'𐏕','1','0','0'},
|
|||
|
},
|
|||
|
|
|||
|
|
|||
|
|
|||
|
{ // 29
|
|||
|
Reader: strings.NewReader("🙂"),
|
|||
|
Expected: []rune{'🙂'},
|
|||
|
},
|
|||
|
{ // 30
|
|||
|
Reader: strings.NewReader("🙂:-)"),
|
|||
|
Expected: []rune{'🙂',':','-',')'},
|
|||
|
},
|
|||
|
|
|||
|
|
|||
|
|
|||
|
{ // 31
|
|||
|
Reader: strings.NewReader("\u0000"),
|
|||
|
Expected: []rune{0x0},
|
|||
|
},
|
|||
|
{ // 32
|
|||
|
Reader: strings.NewReader("\u0001"),
|
|||
|
Expected: []rune{0x1},
|
|||
|
},
|
|||
|
{ // 33
|
|||
|
Reader: strings.NewReader("\u007e"),
|
|||
|
Expected: []rune{0x7e},
|
|||
|
},
|
|||
|
{ // 34
|
|||
|
Reader: strings.NewReader("\u007f"),
|
|||
|
Expected: []rune{0x7f},
|
|||
|
},
|
|||
|
|
|||
|
|
|||
|
|
|||
|
{ // 35
|
|||
|
Reader: strings.NewReader("\u0080"),
|
|||
|
Expected: []rune{0x80},
|
|||
|
},
|
|||
|
{ // 36
|
|||
|
Reader: strings.NewReader("\u0081"),
|
|||
|
Expected: []rune{0x81},
|
|||
|
},
|
|||
|
{ // 37
|
|||
|
Reader: strings.NewReader("\u07fe"),
|
|||
|
Expected: []rune{0x7fe},
|
|||
|
},
|
|||
|
{ // 38
|
|||
|
Reader: strings.NewReader("\u07ff"),
|
|||
|
Expected: []rune{0x7ff},
|
|||
|
},
|
|||
|
|
|||
|
|
|||
|
|
|||
|
{ // 39
|
|||
|
Reader: strings.NewReader("\u0800"),
|
|||
|
Expected: []rune{0x800},
|
|||
|
},
|
|||
|
{ // 40
|
|||
|
Reader: strings.NewReader("\u0801"),
|
|||
|
Expected: []rune{0x801},
|
|||
|
},
|
|||
|
{ // 41
|
|||
|
Reader: strings.NewReader("\ufffe"),
|
|||
|
Expected: []rune{0xfffe},
|
|||
|
},
|
|||
|
{ // 42
|
|||
|
Reader: strings.NewReader("\uffff"),
|
|||
|
Expected: []rune{0xffff},
|
|||
|
},
|
|||
|
|
|||
|
|
|||
|
|
|||
|
{ // 43
|
|||
|
Reader: strings.NewReader("\U00010000"),
|
|||
|
Expected: []rune{0x10000},
|
|||
|
},
|
|||
|
{ // 44
|
|||
|
Reader: strings.NewReader("\U00010001"),
|
|||
|
Expected: []rune{0x10001},
|
|||
|
},
|
|||
|
{ // 45
|
|||
|
Reader: strings.NewReader("\U0010fffe"),
|
|||
|
Expected: []rune{0x10fffe},
|
|||
|
},
|
|||
|
{ // 46
|
|||
|
Reader: strings.NewReader("\U0010ffff"),
|
|||
|
Expected: []rune{0x10ffff},
|
|||
|
},
|
|||
|
}
|
|||
|
|
|||
|
|
|||
|
TestLoop: for testNumber, test := range tests {
|
|||
|
|
|||
|
var runeNumber int
|
|||
|
for {
|
|||
|
runeReader := NewRuneReader(test.Reader)
|
|||
|
|
|||
|
actualRune, actualInt, err := runeReader.ReadRune()
|
|||
|
if nil != err && io.EOF != err {
|
|||
|
t.Errorf("For test #%d and rune #%d, did not expect an error, but actually got one: (%T) %q", testNumber, runeNumber, err, err)
|
|||
|
t.Errorf("\tEXPECTED: %s", FormatBinary(test.Expected[runeNumber]))
|
|||
|
t.Errorf("\tACTUAL: %s", FormatBinary(actualRune))
|
|||
|
continue TestLoop
|
|||
|
}
|
|||
|
if io.EOF == err {
|
|||
|
if expected, actual := len(test.Expected), runeNumber; expected != actual {
|
|||
|
t.Errorf("For test #%d and rune #%d, expected %d, but actually got %d.", testNumber, runeNumber, expected, actual)
|
|||
|
}
|
|||
|
|
|||
|
break
|
|||
|
}
|
|||
|
if expected, actual := test.Expected[runeNumber], actualRune; expected != actual {
|
|||
|
t.Errorf("For test #%d and rune #%d, expected %q (0x%X), but actually got %q (0x%X).", testNumber, runeNumber, expected, expected, actual, actual)
|
|||
|
t.Errorf("\tEXPECTED: %s", FormatBinary(test.Expected[runeNumber]))
|
|||
|
t.Errorf("\tACTUAL: %s", FormatBinary(actualRune))
|
|||
|
continue TestLoop
|
|||
|
}
|
|||
|
if expected, actual := Len(test.Expected[runeNumber]), actualInt; expected != actual {
|
|||
|
t.Errorf("For test #%d and rune #%d, expected %d, but actually got %d.", testNumber, runeNumber, expected, actual)
|
|||
|
t.Errorf("\tEXPECTED: %s", FormatBinary(test.Expected[runeNumber]))
|
|||
|
t.Errorf("\tACTUAL: %s", FormatBinary(actualRune))
|
|||
|
continue TestLoop
|
|||
|
}
|
|||
|
|
|||
|
runeNumber++
|
|||
|
}
|
|||
|
}
|
|||
|
}
|