Платформа ЦРНП "Мирокод" для разработки проектов
https://git.mirocod.ru
You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
102 lines
1.7 KiB
102 lines
1.7 KiB
package mahonia |
|
|
|
import ( |
|
"unicode/utf8" |
|
) |
|
|
|
// Converters for the EUC-JP encoding |
|
|
|
func init() { |
|
RegisterCharset(&Charset{ |
|
Name: "EUC-JP", |
|
Aliases: []string{"extended_unix_code_packed_format_for_japanese", "cseucpkdfmtjapanese"}, |
|
NewDecoder: func() Decoder { |
|
return decodeEucJP |
|
}, |
|
NewEncoder: func() Encoder { |
|
jis0208Table.Reverse() |
|
jis0212Table.Reverse() |
|
return encodeEucJP |
|
}, |
|
}) |
|
} |
|
|
|
func decodeEucJP(p []byte) (c rune, size int, status Status) { |
|
if len(p) == 0 { |
|
return 0, 0, NO_ROOM |
|
} |
|
|
|
b := p[0] |
|
switch { |
|
case b < 0x80: |
|
return rune(b), 1, SUCCESS |
|
|
|
case b == 0x8e: |
|
if len(p) < 2 { |
|
return 0, 0, NO_ROOM |
|
} |
|
b2 := p[1] |
|
if b2 < 0xa1 || b2 > 0xdf { |
|
return utf8.RuneError, 1, INVALID_CHAR |
|
} |
|
return rune(b2) + (0xff61 - 0xa1), 2, SUCCESS |
|
|
|
case b == 0x8f: |
|
if len(p) < 3 { |
|
return 0, 0, NO_ROOM |
|
} |
|
c, size, status = jis0212Table.DecodeHigh(p[1:3]) |
|
if status == SUCCESS { |
|
size = 3 |
|
} |
|
return |
|
|
|
case 0xa1 <= b && b <= 0xfe: |
|
return jis0208Table.DecodeHigh(p) |
|
} |
|
|
|
return utf8.RuneError, 1, INVALID_CHAR |
|
} |
|
|
|
func encodeEucJP(p []byte, c rune) (size int, status Status) { |
|
if len(p) == 0 { |
|
return 0, NO_ROOM |
|
} |
|
|
|
if c < 0x80 { |
|
p[0] = byte(c) |
|
return 1, SUCCESS |
|
} |
|
|
|
if len(p) < 2 { |
|
return 0, NO_ROOM |
|
} |
|
|
|
if c > 0xffff { |
|
p[0] = '?' |
|
return 1, INVALID_CHAR |
|
} |
|
|
|
if 0xff61 <= c && c <= 0xff9f { |
|
p[0] = 0x8e |
|
p[1] = byte(c - (0xff61 - 0xa1)) |
|
return 2, SUCCESS |
|
} |
|
|
|
size, status = jis0208Table.EncodeHigh(p, c) |
|
if status == SUCCESS { |
|
return size, status |
|
} |
|
|
|
size, status = jis0212Table.EncodeHigh(p[1:], c) |
|
switch status { |
|
case SUCCESS: |
|
p[0] = 0x8f |
|
return size + 1, SUCCESS |
|
|
|
case INVALID_CHAR: |
|
p[0] = '?' |
|
return 1, INVALID_CHAR |
|
} |
|
return size, status |
|
}
|
|
|