mirror of https://github.com/milvus-io/milvus.git
54 lines
1.2 KiB
Go
54 lines
1.2 KiB
Go
package ctokenizer
|
|
|
|
/*
|
|
#cgo pkg-config: milvus_core
|
|
#include <stdlib.h> // free
|
|
#include "segcore/token_stream_c.h"
|
|
*/
|
|
import "C"
|
|
|
|
import (
|
|
"unsafe"
|
|
|
|
"github.com/milvus-io/milvus-proto/go-api/v2/milvuspb"
|
|
"github.com/milvus-io/milvus/internal/util/tokenizerapi"
|
|
)
|
|
|
|
var _ tokenizerapi.TokenStream = (*CTokenStream)(nil)
|
|
|
|
type CTokenStream struct {
|
|
ptr C.CTokenStream
|
|
}
|
|
|
|
func NewCTokenStream(ptr C.CTokenStream) *CTokenStream {
|
|
return &CTokenStream{
|
|
ptr: ptr,
|
|
}
|
|
}
|
|
|
|
func (impl *CTokenStream) Advance() bool {
|
|
return bool(C.token_stream_advance(impl.ptr))
|
|
}
|
|
|
|
func (impl *CTokenStream) Token() string {
|
|
token := C.token_stream_get_token(impl.ptr)
|
|
defer C.free_token(unsafe.Pointer(token))
|
|
return C.GoString(token)
|
|
}
|
|
|
|
func (impl *CTokenStream) DetailedToken() *milvuspb.AnalyzerToken {
|
|
token := C.token_stream_get_detailed_token(impl.ptr)
|
|
defer C.free_token(unsafe.Pointer(token.token))
|
|
return &milvuspb.AnalyzerToken{
|
|
Token: C.GoString(token.token),
|
|
StartOffset: int64(token.start_offset),
|
|
EndOffset: int64(token.end_offset),
|
|
Position: int64(token.position),
|
|
PositionLength: int64(token.position_length),
|
|
}
|
|
}
|
|
|
|
func (impl *CTokenStream) Destroy() {
|
|
C.free_token_stream(impl.ptr)
|
|
}
|