Documentation
¶
Index ¶
- type EncodeOption
- type Encoding
- type Offset
- type Tokenizer
- func (t *Tokenizer) Close() error
- func (t *Tokenizer) Decode(tokenIDs []uint32, skipSpecialTokens bool) string
- func (t *Tokenizer) Encode(str string, addSpecialTokens bool) ([]uint32, []string)
- func (t *Tokenizer) EncodeWithOptions(str string, addSpecialTokens bool, opts ...EncodeOption) Encoding
- func (t *Tokenizer) VocabSize() uint32
- type TokenizerOption
- type TruncationDirection
Constants ¶
This section is empty.
Variables ¶
This section is empty.
Functions ¶
This section is empty.
Types ¶
type EncodeOption ¶
type EncodeOption func(eo *encodeOpts)
func WithReturnAllAttributes ¶
func WithReturnAllAttributes() EncodeOption
func WithReturnAttentionMask ¶
func WithReturnAttentionMask() EncodeOption
func WithReturnOffsets ¶
func WithReturnOffsets() EncodeOption
func WithReturnSpecialTokensMask ¶
func WithReturnSpecialTokensMask() EncodeOption
func WithReturnTokens ¶
func WithReturnTokens() EncodeOption
func WithReturnTypeIDs ¶
func WithReturnTypeIDs() EncodeOption
type Tokenizer ¶
type Tokenizer struct {
// contains filtered or unexported fields
}
func FromBytesWithTruncation ¶
func FromBytesWithTruncation(data []byte, maxLen uint32, dir TruncationDirection) (*Tokenizer, error)
func (*Tokenizer) EncodeWithOptions ¶
func (t *Tokenizer) EncodeWithOptions(str string, addSpecialTokens bool, opts ...EncodeOption) Encoding
type TokenizerOption ¶
type TokenizerOption func(to *tokenizerOpts)
func WithEncodeSpecialTokens ¶
func WithEncodeSpecialTokens() TokenizerOption
type TruncationDirection ¶
type TruncationDirection int
const (
	TruncationDirectionLeft TruncationDirection = iota
	TruncationDirectionRight
)
Click to show internal directories.
Click to hide internal directories.