forked from l2x/golang-chinese-to-pinyin
/
pinyin.go
87 lines (72 loc) · 1.26 KB
/
pinyin.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
package Pinyin
import (
"github.com/qiniu/iconv"
"strings"
)
var (
pyTableLen = len(pyValue)
)
type Pinyin struct {
//分隔符
Split string
//是否首字母大写
Upper bool
}
func New() Pinyin {
return Pinyin{
Split: " ",
Upper: true,
}
}
func (c *Pinyin) Convert(s string) (string, error) {
var pyStr string
gbk, err := utf8ToGbk(s)
if err != nil {
return pyStr, err
}
pyArr := c.gbkToPinyin(gbk)
pyStr = strings.Join(pyArr, c.Split)
return pyStr, nil
}
func (c *Pinyin) gbkToPinyin(gbk string) []string {
var pyStr []string
for i := 0; i < len(gbk); i++ {
p := int(gbk[i])
if p > 0 && p < 160 {
pyStr = append(pyStr, string(gbk[i]))
} else {
i++
q := int(gbk[i])
p = p*256 + q - 65536
py := pinyinSearch(p)
if py != "" {
if c.Upper == false {
py = strings.ToLower(py)
}
pyStr = append(pyStr, py)
}
}
}
return pyStr
}
func utf8ToGbk(s string) (string, error) {
cd, err := iconv.Open("gbk", "utf-8")
if err != nil {
return "", err
}
defer cd.Close()
gbk := cd.ConvString(s)
return gbk, nil
}
func pinyinSearch(p int) string {
if v, ok := tableMap[p]; ok {
return v
} else {
for i := pyTableLen - 1; i >= 0; i-- {
if pyValue[i] <= p {
return pyName[i]
}
}
}
return ""
}