mirror of
https://github.com/ollama/ollama.git
synced 2026-04-30 17:58:49 -05:00
move tokenizers to separate package (#13825)
This commit is contained in:
17
tokenizer/tokenizer.go
Normal file
17
tokenizer/tokenizer.go
Normal file
@@ -0,0 +1,17 @@
|
||||
package tokenizer
|
||||
|
||||
// Token type identifiers.
//
// These are untyped integer constants. Numbering starts at 1 (iota + 1) and
// increases by one in declaration order, so the zero value does not correspond
// to any declared token type.
//
// NOTE(review): the numeric values presumably have to match the token-type
// numbering stored in model vocabulary metadata; confirm before reordering,
// inserting, or removing entries, since that would renumber everything after
// the change.
const (
	TOKEN_TYPE_NORMAL       = iota + 1 // 1
	TOKEN_TYPE_UNKNOWN                 // 2
	TOKEN_TYPE_CONTROL                 // 3
	TOKEN_TYPE_USER_DEFINED            // 4
	TOKEN_TYPE_UNUSED                  // 5
	TOKEN_TYPE_BYTE                    // 6
)
|
||||
|
||||
type Tokenizer interface {
|
||||
Encode(s string, addSpecial bool) ([]int32, error)
|
||||
Decode([]int32) (string, error)
|
||||
Is(int32, Special) bool
|
||||
Vocabulary() *Vocabulary
|
||||
}
|
||||
Reference in New Issue
Block a user