BinaryVectorExample.java 7.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172
  1. package io.milvus.v2;
  2. import com.google.gson.Gson;
  3. import com.google.gson.JsonObject;
  4. import io.milvus.v1.CommonUtils;
  5. import io.milvus.v2.client.ConnectConfig;
  6. import io.milvus.v2.client.MilvusClientV2;
  7. import io.milvus.v2.common.ConsistencyLevel;
  8. import io.milvus.v2.common.DataType;
  9. import io.milvus.v2.common.IndexParam;
  10. import io.milvus.v2.service.collection.request.AddFieldReq;
  11. import io.milvus.v2.service.collection.request.CreateCollectionReq;
  12. import io.milvus.v2.service.collection.request.DropCollectionReq;
  13. import io.milvus.v2.service.vector.request.InsertReq;
  14. import io.milvus.v2.service.vector.request.QueryReq;
  15. import io.milvus.v2.service.vector.request.SearchReq;
  16. import io.milvus.v2.service.vector.request.data.BinaryVec;
  17. import io.milvus.v2.service.vector.response.QueryResp;
  18. import io.milvus.v2.service.vector.response.SearchResp;
  19. import java.nio.ByteBuffer;
  20. import java.util.*;
  21. public class BinaryVectorExample {
  22. private static final String COLLECTION_NAME = "java_sdk_example_binary_vector_v2";
  23. private static final String ID_FIELD = "id";
  24. private static final String VECTOR_FIELD = "vector";
  25. private static final Integer VECTOR_DIM = 512;
  26. public static void main(String[] args) {
  27. ConnectConfig config = ConnectConfig.builder()
  28. .uri("http://localhost:19530")
  29. .build();
  30. MilvusClientV2 client = new MilvusClientV2(config);
  31. // Drop collection if exists
  32. client.dropCollection(DropCollectionReq.builder()
  33. .collectionName(COLLECTION_NAME)
  34. .build());
  35. // Create collection
  36. CreateCollectionReq.CollectionSchema collectionSchema = CreateCollectionReq.CollectionSchema.builder()
  37. .build();
  38. collectionSchema.addField(AddFieldReq.builder()
  39. .fieldName(ID_FIELD)
  40. .dataType(DataType.Int64)
  41. .isPrimaryKey(Boolean.TRUE)
  42. .build());
  43. collectionSchema.addField(AddFieldReq.builder()
  44. .fieldName(VECTOR_FIELD)
  45. .dataType(DataType.BinaryVector)
  46. .dimension(VECTOR_DIM)
  47. .build());
  48. List<IndexParam> indexes = new ArrayList<>();
  49. Map<String,Object> extraParams = new HashMap<>();
  50. extraParams.put("nlist",64);
  51. indexes.add(IndexParam.builder()
  52. .fieldName(VECTOR_FIELD)
  53. .indexType(IndexParam.IndexType.BIN_IVF_FLAT)
  54. .metricType(IndexParam.MetricType.HAMMING)
  55. .extraParams(extraParams)
  56. .build());
  57. CreateCollectionReq requestCreate = CreateCollectionReq.builder()
  58. .collectionName(COLLECTION_NAME)
  59. .collectionSchema(collectionSchema)
  60. .indexParams(indexes)
  61. .consistencyLevel(ConsistencyLevel.BOUNDED)
  62. .build();
  63. client.createCollection(requestCreate);
  64. System.out.println("Collection created");
  65. // Insert entities by rows
  66. int rowCount = 10000;
  67. List<JsonObject> rows = new ArrayList<>();
  68. Gson gson = new Gson();
  69. List<ByteBuffer> vectors = new ArrayList<>();
  70. for (long i = 0L; i < rowCount; ++i) {
  71. JsonObject row = new JsonObject();
  72. row.addProperty(ID_FIELD, i);
  73. ByteBuffer vector = CommonUtils.generateBinaryVector(VECTOR_DIM);
  74. vectors.add(vector);
  75. row.add(VECTOR_FIELD, gson.toJsonTree(vector.array()));
  76. rows.add(row);
  77. }
  78. client.insert(InsertReq.builder()
  79. .collectionName(COLLECTION_NAME)
  80. .data(rows)
  81. .build());
  82. // Get row count, set ConsistencyLevel.STRONG to sync the data to query node so that data is visible
  83. QueryResp countR = client.query(QueryReq.builder()
  84. .collectionName(COLLECTION_NAME)
  85. .filter("")
  86. .outputFields(Collections.singletonList("count(*)"))
  87. .consistencyLevel(ConsistencyLevel.STRONG)
  88. .build());
  89. System.out.printf("%d rows persisted\n", (long)countR.getQueryResults().get(0).getEntity().get("count(*)"));
  90. // Pick some vectors from the inserted vectors to search
  91. // Ensure the returned top1 item's ID should be equal to target vector's ID
  92. for (int i = 0; i < 10; i++) {
  93. Random ran = new Random();
  94. int k = ran.nextInt(rowCount);
  95. ByteBuffer targetVector = vectors.get(k);
  96. Map<String,Object> params = new HashMap<>();
  97. params.put("nprobe",16);
  98. SearchResp searchResp = client.search(SearchReq.builder()
  99. .collectionName(COLLECTION_NAME)
  100. .data(Collections.singletonList(new BinaryVec(targetVector)))
  101. .annsField(VECTOR_FIELD)
  102. .outputFields(Collections.singletonList(VECTOR_FIELD))
  103. .searchParams(params)
  104. .topK(3)
  105. .build());
  106. // The search() allows multiple target vectors to search in a batch.
  107. // Here we only input one vector to search, get the result of No.0 vector to check
  108. List<List<SearchResp.SearchResult>> searchResults = searchResp.getSearchResults();
  109. List<SearchResp.SearchResult> results = searchResults.get(0);
  110. System.out.printf("The result of No.%d target vector:\n", i);
  111. for (SearchResp.SearchResult result : results) {
  112. System.out.println(result.getEntity());
  113. System.out.printf("ID: %d, Score: %f, Vector: ", result.getId(), result.getScore());
  114. ByteBuffer vector = (ByteBuffer) result.getEntity().get(VECTOR_FIELD);
  115. vector.rewind();
  116. while (vector.hasRemaining()) {
  117. System.out.print(Integer.toBinaryString(vector.get()));
  118. }
  119. System.out.println();
  120. }
  121. SearchResp.SearchResult firstResult = results.get(0);
  122. if ((long)firstResult.getId() != k) {
  123. throw new RuntimeException(String.format("The top1 ID %d is not equal to target vector's ID %d",
  124. firstResult.getId(), k));
  125. }
  126. }
  127. System.out.println("Search result is correct");
  128. // Retrieve some data
  129. int n = 99;
  130. QueryResp queryResp = client.query(QueryReq.builder()
  131. .collectionName(COLLECTION_NAME)
  132. .filter(String.format("id == %d", n))
  133. .outputFields(Collections.singletonList(VECTOR_FIELD))
  134. .build());
  135. List<QueryResp.QueryResult> queryResults = queryResp.getQueryResults();
  136. if (queryResults.isEmpty()) {
  137. throw new RuntimeException("The query result is empty");
  138. } else {
  139. ByteBuffer vector = (ByteBuffer) queryResults.get(0).getEntity().get(VECTOR_FIELD);
  140. if (vector.compareTo(vectors.get(n)) != 0) {
  141. throw new RuntimeException("The query result is incorrect");
  142. }
  143. }
  144. System.out.println("Query result is correct");
  145. // Drop the collection if you don't need the collection anymore
  146. client.dropCollection(DropCollectionReq.builder()
  147. .collectionName(COLLECTION_NAME)
  148. .build());
  149. client.close();
  150. }
  151. }