-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathtokenizer.go
51 lines (41 loc) · 1.42 KB
/
tokenizer.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
package at
import (
"github.com/flipb/at/multibuf"
)
type TwoBufferTokenizer func(firstBuf []byte, secondBuf []byte) (advance int, token []byte, matched bool)
type Tokenizer func(readData []byte) (advance int, token []byte, matched bool)
func PatternSplitTokenizer(pattern []byte) TwoBufferTokenizer {
return func(buf []byte, inputData []byte) (advance int, token []byte, matched bool) {
if i := multibuf.PatternIndex(pattern, buf, inputData); i >= 0 {
advance = i + len(pattern)
data := multibuf.Slice(0, advance, buf, inputData)
return advance, data, true
}
return 0, inputData, false
}
}
func tokenizerToTwoBuffers(t Tokenizer) TwoBufferTokenizer {
return func(readData []byte, moreData []byte) (advance int, token []byte, matched bool) {
buf := multibuf.Slice(0, -1, readData, moreData)
return t(buf)
}
}
func matchAdvanceBuffer(buf *[]byte, inputData []byte, tokenizer TwoBufferTokenizer) (advance int, token []byte, matched bool) {
advance, token, matched = tokenizer(*buf, inputData)
// at this stage we have to remove any bytes taken from "buf"
// as well as decrease the advance count with the same number of bytes
if advance > 0 && len(*buf) > 0 && len(token) > 0 {
consumed := len(*buf)
if len(*buf) > len(token) {
consumed = len(token)
}
nBuf := *buf
nBuf = nBuf[consumed:]
*buf = nBuf
advance -= (consumed)
if advance < 0 {
advance = 0
}
}
return advance, token, matched
}