123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191 |
/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements. See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership. The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License. You may obtain a copy of the License at
 *
 *   http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 * KIND, either express or implied. See the License for the
 * specific language governing permissions and limitations
 * under the License.
 */
- package io.milvus;
- import io.milvus.client.MilvusServiceClient;
- import io.milvus.common.clientenum.ConsistencyLevelEnum;
- import io.milvus.grpc.*;
- import io.milvus.param.*;
- import io.milvus.param.collection.*;
- import io.milvus.param.dml.InsertParam;
- import io.milvus.param.dml.QueryParam;
- import io.milvus.param.dml.SearchParam;
- import io.milvus.param.index.CreateIndexParam;
- import io.milvus.response.FieldDataWrapper;
- import io.milvus.response.QueryResultsWrapper;
- import io.milvus.response.SearchResultsWrapper;
- import java.util.*;
- public class SparseVectorExample {
- private static final String COLLECTION_NAME = "java_sdk_example_sparse";
- private static final String ID_FIELD = "id";
- private static final String VECTOR_FIELD = "vector";
- public static void main(String[] args) {
- // Connect to Milvus server. Replace the "localhost" and port with your Milvus server address.
- MilvusServiceClient milvusClient = new MilvusServiceClient(ConnectParam.newBuilder()
- .withHost("localhost")
- .withPort(19530)
- .build());
- // drop the collection if you don't need the collection anymore
- R<Boolean> hasR = milvusClient.hasCollection(HasCollectionParam.newBuilder()
- .withCollectionName(COLLECTION_NAME)
- .build());
- CommonUtils.handleResponseStatus(hasR);
- if (hasR.getData()) {
- milvusClient.dropCollection(DropCollectionParam.newBuilder()
- .withCollectionName(COLLECTION_NAME)
- .build());
- }
- // Define fields
- List<FieldType> fieldsSchema = Arrays.asList(
- FieldType.newBuilder()
- .withName(ID_FIELD)
- .withDataType(DataType.Int64)
- .withPrimaryKey(true)
- .withAutoID(false)
- .build(),
- FieldType.newBuilder()
- .withName(VECTOR_FIELD)
- .withDataType(DataType.SparseFloatVector)
- .build()
- );
- // Create the collection
- R<RpcStatus> ret = milvusClient.createCollection(CreateCollectionParam.newBuilder()
- .withCollectionName(COLLECTION_NAME)
- .withConsistencyLevel(ConsistencyLevelEnum.STRONG)
- .withFieldTypes(fieldsSchema)
- .build());
- CommonUtils.handleResponseStatus(ret);
- System.out.println("Collection created");
- // Insert entities
- int rowCount = 10000;
- List<Long> ids = new ArrayList<>();
- for (long i = 0L; i < rowCount; ++i) {
- ids.add(i);
- }
- List<SortedMap<Long, Float>> vectors = CommonUtils.generateSparseVectors(rowCount);
- List<InsertParam.Field> fieldsInsert = new ArrayList<>();
- fieldsInsert.add(new InsertParam.Field(ID_FIELD, ids));
- fieldsInsert.add(new InsertParam.Field(VECTOR_FIELD, vectors));
- InsertParam insertParam = InsertParam.newBuilder()
- .withCollectionName(COLLECTION_NAME)
- .withFields(fieldsInsert)
- .build();
- R<MutationResult> insertR = milvusClient.insert(insertParam);
- CommonUtils.handleResponseStatus(insertR);
- // Flush the data to storage for testing purpose
- // Note that no need to manually call flush interface in practice
- R<FlushResponse> flushR = milvusClient.flush(FlushParam.newBuilder().
- addCollectionName(COLLECTION_NAME).
- build());
- CommonUtils.handleResponseStatus(flushR);
- System.out.println("Entities inserted");
- // Specify an index type on the vector field.
- ret = milvusClient.createIndex(CreateIndexParam.newBuilder()
- .withCollectionName(COLLECTION_NAME)
- .withFieldName(VECTOR_FIELD)
- .withIndexType(IndexType.SPARSE_WAND)
- .withMetricType(MetricType.IP)
- .withExtraParam("{\"drop_ratio_build\":0.2}")
- .build());
- CommonUtils.handleResponseStatus(ret);
- System.out.println("Index created");
- // Call loadCollection() to enable automatically loading data into memory for searching
- ret = milvusClient.loadCollection(LoadCollectionParam.newBuilder()
- .withCollectionName(COLLECTION_NAME)
- .build());
- CommonUtils.handleResponseStatus(ret);
- System.out.println("Collection loaded");
- // Pick some vectors from the inserted vectors to search
- // Ensure the returned top1 item's ID should be equal to target vector's ID
- for (int i = 0; i < 10; i++) {
- Random ran = new Random();
- int k = ran.nextInt(rowCount);
- SortedMap<Long, Float> targetVector = vectors.get(k);
- R<SearchResults> searchRet = milvusClient.search(SearchParam.newBuilder()
- .withCollectionName(COLLECTION_NAME)
- .withMetricType(MetricType.IP)
- .withTopK(3)
- .withSparseFloatVectors(Collections.singletonList(targetVector))
- .withVectorFieldName(VECTOR_FIELD)
- .addOutField(VECTOR_FIELD)
- .withParams("{\"drop_ratio_search\":0.2}")
- .build());
- CommonUtils.handleResponseStatus(searchRet);
- // The search() allows multiple target vectors to search in a batch.
- // Here we only input one vector to search, get the result of No.0 vector to check
- SearchResultsWrapper resultsWrapper = new SearchResultsWrapper(searchRet.getData().getResults());
- List<SearchResultsWrapper.IDScore> scores = resultsWrapper.getIDScore(0);
- System.out.printf("The result of No.%d target vector:\n", i);
- for (SearchResultsWrapper.IDScore score : scores) {
- System.out.println(score);
- }
- if (scores.get(0).getLongID() != k) {
- throw new RuntimeException(String.format("The top1 ID %d is not equal to target vector's ID %d",
- scores.get(0).getLongID(), k));
- }
- }
- System.out.println("Search result is correct");
- // Retrieve some data
- int n = 99;
- R<QueryResults> queryR = milvusClient.query(QueryParam.newBuilder()
- .withCollectionName(COLLECTION_NAME)
- .withExpr(String.format("id == %d", n))
- .addOutField(VECTOR_FIELD)
- .build());
- CommonUtils.handleResponseStatus(queryR);
- QueryResultsWrapper queryWrapper = new QueryResultsWrapper(queryR.getData());
- FieldDataWrapper field = queryWrapper.getFieldWrapper(VECTOR_FIELD);
- List<?> r = field.getFieldData();
- if (r.isEmpty()) {
- throw new RuntimeException("The query result is empty");
- } else {
- SortedMap<Long, Float> sparse = (SortedMap<Long, Float>) r.get(0);
- if (!sparse.equals(vectors.get(n))) {
- throw new RuntimeException("The query result is incorrect");
- }
- }
- System.out.println("Query result is correct");
- // drop the collection if you don't need the collection anymore
- milvusClient.dropCollection(DropCollectionParam.newBuilder()
- .withCollectionName(COLLECTION_NAME)
- .build());
- System.out.println("Collection dropped");
- milvusClient.close();
- }
- }
|