summaryrefslogtreecommitdiffstats
path: root/modules/mahonia/gbk.go
blob: ffb13b286e8d6723136c2176950aa5c8260085ae (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
package mahonia

// Converters for GBK encoding.

func init() {
	RegisterCharset(&Charset{
		Name:    "GBK",
		Aliases: []string{"GB2312"}, // GBK is a superset of GB2312.
		NewDecoder: func() Decoder {
			return decodeGBKRune
		},
		NewEncoder: func() Encoder {
			return encodeGBKRune
		},
	})
}

// decodeGBKRune decodes the character at the start of p.
//
// A leading byte below 0x80 is returned unchanged as a one-byte character.
// Any other leading byte is combined with the following byte into a 16-bit
// code (leading byte in the high half), which is looked up in gbkToUnicode
// and, when that entry is zero, in gbkToUnicodeExtra.
//
// Results:
//   - (0, 0, NO_ROOM) when p is empty, or when a second byte is needed but
//     p holds only one;
//   - (r, 1, SUCCESS) or (r, 2, SUCCESS) for a decoded character;
//   - (0xfffd, 1, INVALID_CHAR) when neither table has a non-zero entry for
//     the two-byte code; only the first byte is reported as consumed.
func decodeGBKRune(p []byte) (r rune, size int, status Status) {
	switch {
	case len(p) == 0:
		return 0, 0, NO_ROOM
	case p[0] < 0x80:
		return rune(p[0]), 1, SUCCESS
	case len(p) < 2:
		return 0, 0, NO_ROOM
	}

	code := uint16(p[0])<<8 | uint16(p[1])

	// A zero table entry means "no mapping here", so try the extra table
	// before declaring the sequence invalid.
	if mapped := rune(gbkToUnicode[code]); mapped != 0 {
		return mapped, 2, SUCCESS
	}
	if mapped := gbkToUnicodeExtra[code]; mapped != 0 {
		return mapped, 2, SUCCESS
	}

	return 0xfffd, 1, INVALID_CHAR
}

// encodeGBKRune writes the encoding of r to the start of p.
//
// Runes in [0, 128) are written as a single byte equal to r. Other runes are
// looked up in unicodeToGBK (for r below 0x10000) or unicodeToGBKExtra
// (otherwise); a non-zero entry is written as two bytes, high byte first.
//
// Results:
//   - (0, NO_ROOM) when p is empty, or when r is 128 or above and p has room
//     for only one byte;
//   - (1, SUCCESS) or (2, SUCCESS) when r was encoded;
//   - (1, INVALID_CHAR) when r has no mapping; the byte 0x1a (ASCII SUB) is
//     written in its place.
//
// Negative runes are not valid code points and are reported as INVALID_CHAR
// rather than being truncated to an arbitrary byte.
func encodeGBKRune(p []byte, r rune) (size int, status Status) {
	if len(p) == 0 {
		return 0, NO_ROOM
	}

	switch {
	case r < 0:
		// rune is a signed type; without this guard a negative value would
		// pass the "< 128" test below and byte(r) would emit garbage while
		// reporting success.
		p[0] = 0x1a
		return 1, INVALID_CHAR
	case r < 128:
		p[0] = byte(r)
		return 1, SUCCESS
	}

	if len(p) < 2 {
		return 0, NO_ROOM
	}

	var c uint16
	if r < 0x10000 {
		c = unicodeToGBK[r]
	} else {
		c = unicodeToGBKExtra[r]
	}

	// A zero table entry means r has no GBK representation.
	if c == 0 {
		p[0] = 0x1a
		return 1, INVALID_CHAR
	}

	p[0] = byte(c >> 8)
	p[1] = byte(c)
	return 2, SUCCESS
}