Support ScaNN index (#26099)

Signed-off-by: chasingegg <chao.gao@zilliz.com>
pull/25384/head
Gao 2023-08-11 14:21:29 +08:00 committed by GitHub
parent 54d6f0ea23
commit b6fcbb0998
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
9 changed files with 38 additions and 4 deletions

View File

@ -11,7 +11,7 @@
# or implied. See the License for the specific language governing permissions and limitations under the License. # or implied. See the License for the specific language governing permissions and limitations under the License.
#------------------------------------------------------------------------------- #-------------------------------------------------------------------------------
set( KNOWHERE_VERSION b7d0b0a ) set( KNOWHERE_VERSION 4f99dc0)
message(STATUS "Building knowhere-${KNOWHERE_SOURCE_VER} from source") message(STATUS "Building knowhere-${KNOWHERE_SOURCE_VER} from source")
message(STATUS ${CMAKE_BUILD_TYPE}) message(STATUS ${CMAKE_BUILD_TYPE})
@ -30,7 +30,7 @@ endif ()
set( CMAKE_PREFIX_PATH ${CONAN_BOOST_ROOT} ) set( CMAKE_PREFIX_PATH ${CONAN_BOOST_ROOT} )
FetchContent_Declare( FetchContent_Declare(
knowhere knowhere
GIT_REPOSITORY "https://github.com/milvus-io/knowhere.git" GIT_REPOSITORY "https://github.com/zilliztech/knowhere.git"
GIT_TAG ${KNOWHERE_VERSION} GIT_TAG ${KNOWHERE_VERSION}
SOURCE_DIR ${CMAKE_CURRENT_BINARY_DIR}/knowhere-src SOURCE_DIR ${CMAKE_CURRENT_BINARY_DIR}/knowhere-src
BINARY_DIR ${CMAKE_CURRENT_BINARY_DIR}/knowhere-build BINARY_DIR ${CMAKE_CURRENT_BINARY_DIR}/knowhere-build

View File

@ -50,6 +50,7 @@ const (
IndexFaissIDMap = "FLAT" IndexFaissIDMap = "FLAT"
IndexFaissIVFFlat = "IVF_FLAT" IndexFaissIVFFlat = "IVF_FLAT"
IndexFaissIVFPQ = "IVF_PQ" IndexFaissIVFPQ = "IVF_PQ"
IndexScaNN = "SCANN"
IndexFaissIVFSQ8 = "IVF_SQ8" IndexFaissIVFSQ8 = "IVF_SQ8"
IndexFaissBinIDMap = "BIN_FLAT" IndexFaissBinIDMap = "BIN_FLAT"
IndexFaissBinIVFFlat = "BIN_IVF_FLAT" IndexFaissBinIVFFlat = "BIN_IVF_FLAT"

View File

@ -56,6 +56,7 @@ const (
IndexFaissIVFFlat = "IVF_FLAT" IndexFaissIVFFlat = "IVF_FLAT"
IndexFaissIVFPQ = "IVF_PQ" IndexFaissIVFPQ = "IVF_PQ"
IndexFaissIVFSQ8 = "IVF_SQ8" IndexFaissIVFSQ8 = "IVF_SQ8"
IndexScaNN = "SCANN"
IndexFaissBinIDMap = "BIN_FLAT" IndexFaissBinIDMap = "BIN_FLAT"
IndexFaissBinIVFFlat = "BIN_IVF_FLAT" IndexFaissBinIVFFlat = "BIN_IVF_FLAT"
IndexHNSW = "HNSW" IndexHNSW = "HNSW"

View File

@ -18,6 +18,7 @@ const (
IndexFaissIVFFlat = "IVF_FLAT" IndexFaissIVFFlat = "IVF_FLAT"
IndexFaissIVFPQ = "IVF_PQ" IndexFaissIVFPQ = "IVF_PQ"
IndexFaissIVFSQ8 = "IVF_SQ8" IndexFaissIVFSQ8 = "IVF_SQ8"
IndexScaNN = "SCANN"
IndexFaissBinIDMap = "BIN_FLAT" IndexFaissBinIDMap = "BIN_FLAT"
IndexFaissBinIVFFlat = "BIN_IVF_FLAT" IndexFaissBinIVFFlat = "BIN_IVF_FLAT"
@ -52,6 +53,8 @@ func generateFloatVectorTestCases() []vecTestCase {
{IndexFaissIVFPQ, metric.IP, false, schemapb.DataType_FloatVector}, {IndexFaissIVFPQ, metric.IP, false, schemapb.DataType_FloatVector},
{IndexFaissIVFSQ8, metric.L2, false, schemapb.DataType_FloatVector}, {IndexFaissIVFSQ8, metric.L2, false, schemapb.DataType_FloatVector},
{IndexFaissIVFSQ8, metric.IP, false, schemapb.DataType_FloatVector}, {IndexFaissIVFSQ8, metric.IP, false, schemapb.DataType_FloatVector},
{IndexScaNN, metric.L2, false, schemapb.DataType_FloatVector},
{IndexScaNN, metric.IP, false, schemapb.DataType_FloatVector},
{IndexHNSW, metric.L2, false, schemapb.DataType_FloatVector}, {IndexHNSW, metric.L2, false, schemapb.DataType_FloatVector},
{IndexHNSW, metric.IP, false, schemapb.DataType_FloatVector}, {IndexHNSW, metric.IP, false, schemapb.DataType_FloatVector},
} }
@ -89,6 +92,9 @@ func generateParams(indexType, metricType string) (map[string]string, map[string
indexParams[common.DimKey] = strconv.Itoa(dim) indexParams[common.DimKey] = strconv.Itoa(dim)
indexParams["nlist"] = strconv.Itoa(nlist) indexParams["nlist"] = strconv.Itoa(nlist)
indexParams["nbits"] = strconv.Itoa(nbits) indexParams["nbits"] = strconv.Itoa(nbits)
} else if indexType == IndexScaNN {
indexParams[common.DimKey] = strconv.Itoa(dim)
indexParams["nlist"] = strconv.Itoa(nlist)
} else if indexType == IndexHNSW { } else if indexType == IndexHNSW {
indexParams[common.DimKey] = strconv.Itoa(dim) indexParams[common.DimKey] = strconv.Itoa(dim)
indexParams["M"] = strconv.Itoa(16) indexParams["M"] = strconv.Itoa(16)

View File

@ -48,6 +48,7 @@ func (mgr *indexCheckerMgrImpl) registerIndexChecker() {
mgr.checkers[IndexFaissIDMap] = newFlatChecker() mgr.checkers[IndexFaissIDMap] = newFlatChecker()
mgr.checkers[IndexFaissIvfFlat] = newIVFBaseChecker() mgr.checkers[IndexFaissIvfFlat] = newIVFBaseChecker()
mgr.checkers[IndexFaissIvfPQ] = newIVFPQChecker() mgr.checkers[IndexFaissIvfPQ] = newIVFPQChecker()
mgr.checkers[IndexScaNN] = newIVFBaseChecker()
mgr.checkers[IndexFaissIvfSQ8] = newIVFSQChecker() mgr.checkers[IndexFaissIvfSQ8] = newIVFSQChecker()
mgr.checkers[IndexFaissBinIDMap] = newBinFlatChecker() mgr.checkers[IndexFaissBinIDMap] = newBinFlatChecker()
mgr.checkers[IndexFaissBinIvfFlat] = newBinIVFFlatChecker() mgr.checkers[IndexFaissBinIvfFlat] = newBinIVFFlatChecker()

View File

@ -41,6 +41,12 @@ func Test_GetConfAdapterMgrInstance(t *testing.T) {
_, ok = adapter.(*ivfBaseChecker) _, ok = adapter.(*ivfBaseChecker)
assert.Equal(t, true, ok) assert.Equal(t, true, ok)
adapter, err = adapterMgr.GetChecker(IndexScaNN)
assert.Equal(t, nil, err)
assert.NotEqual(t, nil, adapter)
_, ok = adapter.(*ivfBaseChecker)
assert.Equal(t, true, ok)
adapter, err = adapterMgr.GetChecker(IndexFaissIvfPQ) adapter, err = adapterMgr.GetChecker(IndexFaissIvfPQ)
assert.Equal(t, nil, err) assert.Equal(t, nil, err)
assert.NotEqual(t, nil, adapter) assert.NotEqual(t, nil, adapter)
@ -95,6 +101,12 @@ func TestConfAdapterMgrImpl_GetAdapter(t *testing.T) {
_, ok = adapter.(*ivfBaseChecker) _, ok = adapter.(*ivfBaseChecker)
assert.Equal(t, true, ok) assert.Equal(t, true, ok)
adapter, err = adapterMgr.GetChecker(IndexScaNN)
assert.Equal(t, nil, err)
assert.NotEqual(t, nil, adapter)
_, ok = adapter.(*ivfBaseChecker)
assert.Equal(t, true, ok)
adapter, err = adapterMgr.GetChecker(IndexFaissIvfPQ) adapter, err = adapterMgr.GetChecker(IndexFaissIvfPQ)
assert.Equal(t, nil, err) assert.Equal(t, nil, err)
assert.NotEqual(t, nil, adapter) assert.NotEqual(t, nil, adapter)

View File

@ -21,6 +21,7 @@ const (
IndexFaissIDMap IndexType = "FLAT" // no index is built. IndexFaissIDMap IndexType = "FLAT" // no index is built.
IndexFaissIvfFlat IndexType = "IVF_FLAT" IndexFaissIvfFlat IndexType = "IVF_FLAT"
IndexFaissIvfPQ IndexType = "IVF_PQ" IndexFaissIvfPQ IndexType = "IVF_PQ"
IndexScaNN IndexType = "SCANN"
IndexFaissIvfSQ8 IndexType = "IVF_SQ8" IndexFaissIvfSQ8 IndexType = "IVF_SQ8"
IndexFaissBinIDMap IndexType = "BIN_FLAT" IndexFaissBinIDMap IndexType = "BIN_FLAT"
IndexFaissBinIvfFlat IndexType = "BIN_IVF_FLAT" IndexFaissBinIvfFlat IndexType = "BIN_IVF_FLAT"

View File

@ -287,6 +287,17 @@ func (s *TestGetVectorSuite) TestGetVector_IVF_PQ() {
s.run() s.run()
} }
func (s *TestGetVectorSuite) TestGetVector_SCANN() {
s.nq = 10
s.topK = 10
s.indexType = integration.IndexScaNN
s.metricType = metric.L2
s.pkType = schemapb.DataType_Int64
s.vecType = schemapb.DataType_FloatVector
s.searchFailed = false
s.run()
}
func (s *TestGetVectorSuite) TestGetVector_IVF_SQ8() { func (s *TestGetVectorSuite) TestGetVector_IVF_SQ8() {
s.nq = 10 s.nq = 10
s.topK = 10 s.topK = 10

View File

@ -35,6 +35,7 @@ const (
IndexFaissIDMap = indexparamcheck.IndexFaissIDMap IndexFaissIDMap = indexparamcheck.IndexFaissIDMap
IndexFaissIvfFlat = indexparamcheck.IndexFaissIvfFlat IndexFaissIvfFlat = indexparamcheck.IndexFaissIvfFlat
IndexFaissIvfPQ = indexparamcheck.IndexFaissIvfPQ IndexFaissIvfPQ = indexparamcheck.IndexFaissIvfPQ
IndexScaNN = indexparamcheck.IndexScaNN
IndexFaissIvfSQ8 = indexparamcheck.IndexFaissIvfSQ8 IndexFaissIvfSQ8 = indexparamcheck.IndexFaissIvfSQ8
IndexFaissBinIDMap = indexparamcheck.IndexFaissBinIDMap IndexFaissBinIDMap = indexparamcheck.IndexFaissBinIDMap
IndexFaissBinIvfFlat = indexparamcheck.IndexFaissBinIvfFlat IndexFaissBinIvfFlat = indexparamcheck.IndexFaissBinIvfFlat
@ -124,7 +125,7 @@ func ConstructIndexParam(dim int, indexType string, metricType string) []*common
switch indexType { switch indexType {
case IndexFaissIDMap, IndexFaissBinIDMap: case IndexFaissIDMap, IndexFaissBinIDMap:
// no index param is required // no index param is required
case IndexFaissIvfFlat, IndexFaissBinIvfFlat, IndexFaissIvfSQ8: case IndexFaissIvfFlat, IndexFaissBinIvfFlat, IndexFaissIvfSQ8, IndexScaNN:
params = append(params, &commonpb.KeyValuePair{ params = append(params, &commonpb.KeyValuePair{
Key: "nlist", Key: "nlist",
Value: "100", Value: "100",
@ -163,7 +164,7 @@ func GetSearchParams(indexType string, metricType string) map[string]any {
switch indexType { switch indexType {
case IndexFaissIDMap, IndexFaissBinIDMap: case IndexFaissIDMap, IndexFaissBinIDMap:
params[common.MetricTypeKey] = metricType params[common.MetricTypeKey] = metricType
case IndexFaissIvfFlat, IndexFaissBinIvfFlat, IndexFaissIvfSQ8, IndexFaissIvfPQ: case IndexFaissIvfFlat, IndexFaissBinIvfFlat, IndexFaissIvfSQ8, IndexFaissIvfPQ, IndexScaNN:
params["nprobe"] = 8 params["nprobe"] = 8
case IndexHNSW: case IndexHNSW:
params["ef"] = 200 params["ef"] = 200