milvus/internal/util/indexcgowrapper/dataset.go

138 lines
3.1 KiB
Go

package indexcgowrapper
import (
"github.com/milvus-io/milvus-proto/go-api/v2/schemapb"
"github.com/milvus-io/milvus/internal/storage"
)
const (
keyRawArr = "key_raw_arr"
)
type Dataset struct {
DType schemapb.DataType
Data map[string]interface{}
}
func GenFloatVecDataset(vectors []float32) *Dataset {
return &Dataset{
DType: schemapb.DataType_FloatVector,
Data: map[string]interface{}{
keyRawArr: vectors,
},
}
}
func GenFloat16VecDataset(vectors []byte) *Dataset {
return &Dataset{
DType: schemapb.DataType_Float16Vector,
Data: map[string]interface{}{
keyRawArr: vectors,
},
}
}
func GenBFloat16VecDataset(vectors []byte) *Dataset {
return &Dataset{
DType: schemapb.DataType_BFloat16Vector,
Data: map[string]interface{}{
keyRawArr: vectors,
},
}
}
func GenSparseFloatVecDataset(data *storage.SparseFloatVectorFieldData) *Dataset {
// TODO(SPARSE): This is used only for testing. In order to make any golang
// tests that uses this method work, we'll need to expose
// knowhere::sparse::SparseRow to Go, which is the accepted format in cgo
// wrapper. Such tests are skipping sparse vector for now.
return &Dataset{
DType: schemapb.DataType_SparseFloatVector,
}
}
func GenBinaryVecDataset(vectors []byte) *Dataset {
return &Dataset{
DType: schemapb.DataType_BinaryVector,
Data: map[string]interface{}{
keyRawArr: vectors,
},
}
}
func GenDataset(data storage.FieldData) *Dataset {
switch f := data.(type) {
case *storage.BoolFieldData:
return &Dataset{
DType: schemapb.DataType_Bool,
Data: map[string]interface{}{
keyRawArr: f.Data,
},
}
case *storage.Int8FieldData:
return &Dataset{
DType: schemapb.DataType_Int8,
Data: map[string]interface{}{
keyRawArr: f.Data,
},
}
case *storage.Int16FieldData:
return &Dataset{
DType: schemapb.DataType_Int16,
Data: map[string]interface{}{
keyRawArr: f.Data,
},
}
case *storage.Int32FieldData:
return &Dataset{
DType: schemapb.DataType_Int32,
Data: map[string]interface{}{
keyRawArr: f.Data,
},
}
case *storage.Int64FieldData:
return &Dataset{
DType: schemapb.DataType_Int64,
Data: map[string]interface{}{
keyRawArr: f.Data,
},
}
case *storage.FloatFieldData:
return &Dataset{
DType: schemapb.DataType_Float,
Data: map[string]interface{}{
keyRawArr: f.Data,
},
}
case *storage.DoubleFieldData:
return &Dataset{
DType: schemapb.DataType_Double,
Data: map[string]interface{}{
keyRawArr: f.Data,
},
}
case *storage.StringFieldData:
return &Dataset{
DType: schemapb.DataType_VarChar,
Data: map[string]interface{}{
keyRawArr: f.Data,
},
}
case *storage.BinaryVectorFieldData:
return GenBinaryVecDataset(f.Data)
case *storage.FloatVectorFieldData:
return GenFloatVecDataset(f.Data)
case *storage.Float16VectorFieldData:
return GenFloat16VecDataset(f.Data)
case *storage.BFloat16VectorFieldData:
return GenBFloat16VecDataset(f.Data)
case *storage.SparseFloatVectorFieldData:
return GenSparseFloatVecDataset(f)
default:
return &Dataset{
DType: schemapb.DataType_None,
Data: nil,
}
}
}