summaryrefslogtreecommitdiffstats
path: root/modules/mahonia/big5.go
blob: 07044fe9e26b0955818068d713fc143daab43f4e (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
package mahonia

// Converters for Big 5 encoding.

import (
	"sync"
)

func init() {
	RegisterCharset(&Charset{
		Name:    "Big5",
		Aliases: []string{"csBig5"},
		NewDecoder: func() Decoder {
			return decodeBig5Rune
		},
		NewEncoder: func() Encoder {
			big5Once.Do(reverseBig5Table)
			return encodeBig5Rune
		},
	})
}

func decodeBig5Rune(p []byte) (r rune, size int, status Status) {
	if len(p) == 0 {
		status = NO_ROOM
		return
	}

	b := p[0]
	if b < 128 {
		return rune(b), 1, SUCCESS
	}

	if len(p) < 2 {
		status = NO_ROOM
		return
	}

	c := int(p[0])<<8 + int(p[1])
	c = int(big5ToUnicode[c])
	if c > 0 {
		return rune(c), 2, SUCCESS
	}

	return 0xfffd, 1, INVALID_CHAR
}

func encodeBig5Rune(p []byte, r rune) (size int, status Status) {
	if len(p) == 0 {
		status = NO_ROOM
		return
	}

	if r < 128 {
		p[0] = byte(r)
		return 1, SUCCESS
	}

	if len(p) < 2 {
		status = NO_ROOM
		return
	}

	if r < 0x10000 {
		c := unicodeToBig5[r]
		if c > 0 {
			p[0] = byte(c >> 8)
			p[1] = byte(c)
			return 2, SUCCESS
		}
	}

	p[0] = '?'
	return 1, INVALID_CHAR
}

var big5Once sync.Once

var unicodeToBig5 []uint16

func reverseBig5Table() {
	unicodeToBig5 = make([]uint16, 65536)

	for big5, unicode := range big5ToUnicode {
		if unicode > 0 {
			unicodeToBig5[unicode] = uint16(big5)
		}
	}
}