2023-03-24 09:09:58 +00:00
|
|
|
package proxy
|
|
|
|
|
|
|
|
import (
|
|
|
|
"fmt"
|
|
|
|
|
|
|
|
"github.com/milvus-io/milvus-proto/go-api/schemapb"
|
2023-04-06 11:14:32 +00:00
|
|
|
"github.com/milvus-io/milvus/pkg/util/funcutil"
|
|
|
|
"github.com/milvus-io/milvus/pkg/util/merr"
|
2023-05-12 03:33:20 +00:00
|
|
|
"github.com/milvus-io/milvus/pkg/util/paramtable"
|
2023-04-06 11:14:32 +00:00
|
|
|
"github.com/milvus-io/milvus/pkg/util/typeutil"
|
2023-03-24 09:09:58 +00:00
|
|
|
)
|
|
|
|
|
|
|
|
type validateUtil struct {
|
|
|
|
checkNAN bool
|
|
|
|
checkMaxLen bool
|
|
|
|
}
|
|
|
|
|
|
|
|
type validateOption func(*validateUtil)
|
|
|
|
|
|
|
|
func withNANCheck() validateOption {
|
|
|
|
return func(v *validateUtil) {
|
|
|
|
v.checkNAN = true
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func withMaxLenCheck() validateOption {
|
|
|
|
return func(v *validateUtil) {
|
|
|
|
v.checkMaxLen = true
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func (v *validateUtil) apply(opts ...validateOption) {
|
|
|
|
for _, opt := range opts {
|
|
|
|
opt(v)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func (v *validateUtil) Validate(data []*schemapb.FieldData, schema *schemapb.CollectionSchema, numRows uint64) error {
|
|
|
|
helper, err := typeutil.CreateSchemaHelper(schema)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
if err := v.checkAligned(data, helper, numRows); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
for _, field := range data {
|
|
|
|
fieldSchema, err := helper.GetFieldFromName(field.GetFieldName())
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
switch fieldSchema.GetDataType() {
|
|
|
|
case schemapb.DataType_FloatVector:
|
|
|
|
if err := v.checkFloatVectorFieldData(field, fieldSchema); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
case schemapb.DataType_BinaryVector:
|
|
|
|
if err := v.checkBinaryVectorFieldData(field, fieldSchema); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
case schemapb.DataType_VarChar:
|
|
|
|
if err := v.checkVarCharFieldData(field, fieldSchema); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
2023-05-12 03:33:20 +00:00
|
|
|
case schemapb.DataType_JSON:
|
|
|
|
if err := v.checkJSONFieldData(field, fieldSchema); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
2023-03-24 09:09:58 +00:00
|
|
|
default:
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (v *validateUtil) checkAligned(data []*schemapb.FieldData, schema *typeutil.SchemaHelper, numRows uint64) error {
|
|
|
|
errNumRowsMismatch := func(fieldName string, fieldNumRows, passedNumRows uint64) error {
|
|
|
|
msg := fmt.Sprintf("the num_rows (%d) of field (%s) is not equal to passed num_rows (%d)", fieldNumRows, fieldName, passedNumRows)
|
|
|
|
return merr.WrapErrParameterInvalid(passedNumRows, numRows, msg)
|
|
|
|
}
|
|
|
|
|
|
|
|
for _, field := range data {
|
|
|
|
switch field.GetType() {
|
|
|
|
case schemapb.DataType_FloatVector:
|
|
|
|
f, err := schema.GetFieldFromName(field.GetFieldName())
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
dim, err := typeutil.GetDim(f)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
n, err := funcutil.GetNumRowsOfFloatVectorField(field.GetVectors().GetFloatVector().GetData(), dim)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
if n != numRows {
|
|
|
|
return errNumRowsMismatch(field.GetFieldName(), n, numRows)
|
|
|
|
}
|
|
|
|
|
|
|
|
case schemapb.DataType_BinaryVector:
|
|
|
|
f, err := schema.GetFieldFromName(field.GetFieldName())
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
dim, err := typeutil.GetDim(f)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
n, err := funcutil.GetNumRowsOfBinaryVectorField(field.GetVectors().GetBinaryVector(), dim)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
if n != numRows {
|
|
|
|
return errNumRowsMismatch(field.GetFieldName(), n, numRows)
|
|
|
|
}
|
|
|
|
|
|
|
|
default:
|
|
|
|
// error won't happen here.
|
|
|
|
n, err := funcutil.GetNumRowOfFieldData(field)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
if n != numRows {
|
|
|
|
return errNumRowsMismatch(field.GetFieldName(), n, numRows)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (v *validateUtil) checkFloatVectorFieldData(field *schemapb.FieldData, fieldSchema *schemapb.FieldSchema) error {
|
|
|
|
floatArray := field.GetVectors().GetFloatVector().GetData()
|
|
|
|
if floatArray == nil {
|
|
|
|
msg := fmt.Sprintf("float vector field '%v' is illegal, array type mismatch", field.GetFieldName())
|
|
|
|
return merr.WrapErrParameterInvalid("need float vector", "got nil", msg)
|
|
|
|
}
|
|
|
|
|
|
|
|
if v.checkNAN {
|
|
|
|
return typeutil.VerifyFloats32(floatArray)
|
|
|
|
}
|
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (v *validateUtil) checkBinaryVectorFieldData(field *schemapb.FieldData, fieldSchema *schemapb.FieldSchema) error {
|
|
|
|
// TODO
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (v *validateUtil) checkVarCharFieldData(field *schemapb.FieldData, fieldSchema *schemapb.FieldSchema) error {
|
|
|
|
strArr := field.GetScalars().GetStringData().GetData()
|
|
|
|
if strArr == nil {
|
|
|
|
msg := fmt.Sprintf("varchar field '%v' is illegal, array type mismatch", field.GetFieldName())
|
|
|
|
return merr.WrapErrParameterInvalid("need string array", "got nil", msg)
|
|
|
|
}
|
|
|
|
|
|
|
|
if v.checkMaxLen {
|
|
|
|
maxLength, err := GetMaxLength(fieldSchema)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
return verifyLengthPerRow(strArr, maxLength)
|
|
|
|
}
|
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2023-05-12 03:33:20 +00:00
|
|
|
func (v *validateUtil) checkJSONFieldData(field *schemapb.FieldData, fieldSchema *schemapb.FieldSchema) error {
|
|
|
|
jsonArray := field.GetScalars().GetJsonData().GetData()
|
|
|
|
if jsonArray == nil {
|
|
|
|
msg := fmt.Sprintf("varchar field '%v' is illegal, array type mismatch", field.GetFieldName())
|
|
|
|
return merr.WrapErrParameterInvalid("need string array", "got nil", msg)
|
|
|
|
}
|
|
|
|
|
|
|
|
if v.checkMaxLen {
|
|
|
|
return verifyLengthPerRow(jsonArray, paramtable.Get().CommonCfg.JSONMaxLength.GetAsInt64())
|
|
|
|
}
|
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func verifyLengthPerRow[E interface{ ~string | ~[]byte }](strArr []E, maxLength int64) error {
|
2023-03-24 09:09:58 +00:00
|
|
|
for i, s := range strArr {
|
|
|
|
if int64(len(s)) > maxLength {
|
|
|
|
msg := fmt.Sprintf("the length (%d) of %dth string exceeds max length (%d)", len(s), i, maxLength)
|
|
|
|
return merr.WrapErrParameterInvalid("valid length string", "string length exceeds max length", msg)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func newValidateUtil(opts ...validateOption) *validateUtil {
|
|
|
|
v := &validateUtil{
|
|
|
|
checkNAN: true,
|
|
|
|
checkMaxLen: false,
|
|
|
|
}
|
|
|
|
|
|
|
|
v.apply(opts...)
|
|
|
|
|
|
|
|
return v
|
|
|
|
}
|