forked from Shiloh/githaven
103 lines
1.7 KiB
Go
103 lines
1.7 KiB
Go
package mahonia
|
|
|
|
import (
|
|
"unicode/utf8"
|
|
)
|
|
|
|
// Converters for the EUC-JP encoding
|
|
|
|
func init() {
|
|
RegisterCharset(&Charset{
|
|
Name: "EUC-JP",
|
|
Aliases: []string{"extended_unix_code_packed_format_for_japanese", "cseucpkdfmtjapanese"},
|
|
NewDecoder: func() Decoder {
|
|
return decodeEucJP
|
|
},
|
|
NewEncoder: func() Encoder {
|
|
jis0208Table.Reverse()
|
|
jis0212Table.Reverse()
|
|
return encodeEucJP
|
|
},
|
|
})
|
|
}
|
|
|
|
func decodeEucJP(p []byte) (c rune, size int, status Status) {
|
|
if len(p) == 0 {
|
|
return 0, 0, NO_ROOM
|
|
}
|
|
|
|
b := p[0]
|
|
switch {
|
|
case b < 0x80:
|
|
return rune(b), 1, SUCCESS
|
|
|
|
case b == 0x8e:
|
|
if len(p) < 2 {
|
|
return 0, 0, NO_ROOM
|
|
}
|
|
b2 := p[1]
|
|
if b2 < 0xa1 || b2 > 0xdf {
|
|
return utf8.RuneError, 1, INVALID_CHAR
|
|
}
|
|
return rune(b2) + (0xff61 - 0xa1), 2, SUCCESS
|
|
|
|
case b == 0x8f:
|
|
if len(p) < 3 {
|
|
return 0, 0, NO_ROOM
|
|
}
|
|
c, size, status = jis0212Table.DecodeHigh(p[1:3])
|
|
if status == SUCCESS {
|
|
size = 3
|
|
}
|
|
return
|
|
|
|
case 0xa1 <= b && b <= 0xfe:
|
|
return jis0208Table.DecodeHigh(p)
|
|
}
|
|
|
|
return utf8.RuneError, 1, INVALID_CHAR
|
|
}
|
|
|
|
func encodeEucJP(p []byte, c rune) (size int, status Status) {
|
|
if len(p) == 0 {
|
|
return 0, NO_ROOM
|
|
}
|
|
|
|
if c < 0x80 {
|
|
p[0] = byte(c)
|
|
return 1, SUCCESS
|
|
}
|
|
|
|
if len(p) < 2 {
|
|
return 0, NO_ROOM
|
|
}
|
|
|
|
if c > 0xffff {
|
|
p[0] = '?'
|
|
return 1, INVALID_CHAR
|
|
}
|
|
|
|
if 0xff61 <= c && c <= 0xff9f {
|
|
p[0] = 0x8e
|
|
p[1] = byte(c - (0xff61 - 0xa1))
|
|
return 2, SUCCESS
|
|
}
|
|
|
|
size, status = jis0208Table.EncodeHigh(p, c)
|
|
if status == SUCCESS {
|
|
return size, status
|
|
}
|
|
|
|
size, status = jis0212Table.EncodeHigh(p[1:], c)
|
|
switch status {
|
|
case SUCCESS:
|
|
p[0] = 0x8f
|
|
return size + 1, SUCCESS
|
|
|
|
case INVALID_CHAR:
|
|
p[0] = '?'
|
|
return 1, INVALID_CHAR
|
|
}
|
|
return size, status
|
|
}
|