-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathtranslit.go
104 lines (85 loc) · 2.08 KB
/
translit.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
package tlit
import (
"bufio"
"bytes"
"io"
"regexp"
"strings"
)
// Encoder transliterates input and writes the result to an output stream.
//
// It embeds *bufio.Writer, so the writer's methods (WriteString, WriteRune,
// Flush, ...) are promoted onto Encoder.
type Encoder struct {
	// Writer buffers output in front of the destination stream.
	*bufio.Writer

	// sys is the transliteration system this encoder was created with; it is
	// passed to fixRuleRune during Encode.
	sys System

	// tbl maps a source rune to its replacement string.
	tbl map[rune]string
}
// NewEncoder builds an Encoder whose output goes to w through a buffered
// writer. The rune table is looked up in tableTransliteration using sys; sys
// itself is stored on the encoder for later use by Encode.
func NewEncoder(w io.Writer, sys System) *Encoder {
	enc := new(Encoder)
	enc.Writer = bufio.NewWriter(w)
	enc.sys = sys
	enc.tbl = tableTransliteration[sys]
	return enc
}
// Encode writes the transliteration of data to the stream and then flushes
// the underlying buffered writer.
//
// data is decoded into runes. For each rune that has an entry in the
// encoder's table, the table's replacement string is written, unless
// fixRuleRune reports an override for the (previous, current, next) rune
// context, in which case the override is written instead. Runes without a
// table entry are written through unchanged.
//
// The "previous" rune is 0 for the first rune and the "next" rune is 0 for
// the last rune. It returns the first write or flush error encountered.
func (enc *Encoder) Encode(data []byte) error {
	runes := bytes.Runes(data)
	last := len(runes) - 1

	var prev rune
	for i, cur := range runes {
		// Look one rune ahead; at the end of input there is no successor,
		// so next stays 0.
		var next rune
		if i < last {
			next = runes[i+1]
		}

		if repl, found := enc.tbl[cur]; found {
			// A context-dependent rule, when one applies, takes precedence
			// over the plain table entry.
			if fixed, ok := fixRuleRune(prev, cur, next, enc.sys); ok {
				repl = fixed
			}
			if _, err := enc.WriteString(repl); err != nil {
				return err
			}
		} else if _, err := enc.WriteRune(cur); err != nil {
			return err
		}

		prev = cur
	}

	return enc.Flush()
}
// EncodeString transliterates s by converting it to a byte slice and
// delegating to Encode; it returns whatever error Encode returns.
func (enc *Encoder) EncodeString(s string) error {
	data := []byte(s)
	return enc.Encode(data)
}
// Marshal transliterates data with a fresh Encoder for sys, collecting the
// output in an in-memory buffer. It returns the buffered bytes, or nil and
// the error if encoding fails.
func Marshal(data []byte, sys System) ([]byte, error) {
	out := new(bytes.Buffer)
	enc := NewEncoder(out, sys)

	err := enc.Encode(data)
	if err != nil {
		return nil, err
	}
	return out.Bytes(), nil
}
// MarshalString is the string counterpart of Marshal: it takes the input as
// a string and returns the transliteration as a string, along with any error
// from Marshal.
func MarshalString(s string, sys System) (string, error) {
	raw := []byte(s)
	encoded, err := Marshal(raw, sys)
	// Marshal yields nil bytes on failure, so the string is empty in that case.
	return string(encoded), err
}
// urlStripPattern matches every run of characters other than ASCII letters,
// ASCII digits and the space character. It is compiled once at package
// initialisation instead of on every MarshalStringURL call.
var urlStripPattern = regexp.MustCompile("[^A-Za-z0-9 ]+")

// MarshalStringURL transforms s into a string suitable for use as part of a
// URL.
//
// Steps, in order:
//  1. every "-" in s is replaced by a space, so hyphens act as word
//     separators rather than being stripped;
//  2. the result is transliterated with MarshalString using sys;
//  3. every character that is not an ASCII letter, digit or space is removed;
//  4. the remaining whitespace-separated words are joined with "-" and the
//     whole string is lower-cased.
func MarshalStringURL(s string, sys System) string {
	spaced := strings.Replace(s, "-", " ", -1)

	// The error is deliberately dropped: this function has no error return.
	// Whatever string MarshalString yields is processed as-is.
	translit, _ := MarshalString(spaced, sys)

	cleaned := urlStripPattern.ReplaceAllString(translit, "")
	words := strings.Fields(cleaned)
	return strings.ToLower(strings.Join(words, "-"))
}
// MarshalStringURLru is shorthand for MarshalStringURL with the Default
// transliteration system.
func MarshalStringURLru(s string) string {
	slug := MarshalStringURL(s, Default)
	return slug
}
// MarshalStringURLua is shorthand for MarshalStringURL with the UkrainianWeb
// transliteration system.
func MarshalStringURLua(s string) string {
	slug := MarshalStringURL(s, UkrainianWeb)
	return slug
}