ANNS

ANNS Library Usage

// ... ... ...
int main() {
  std::vector<vdim_t> base_vectors, queries_vectors;
  std::vector<id_t> groundtruth;
  auto [nb, d0] = utils::LoadFromFile(base_vectors, base_vectors_path);
  auto [nq, d1] = utils::LoadFromFile(queries_vectors, queries_vectors_path);
  auto [ng, d2] = utils::LoadFromFile(groundtruth, groundtruth_path);
  auto nest_queries_vectors = utils::Nest(std::move(queries_vectors), nq, d1);
  utils::STimer build_timer;
  utils::STimer query_timer;
  auto cspg = std::make_unique<anns::graph::RandomPartitionGraph<vdim_t, subgraph_t>> (d0, part);
  build_timer.Start();
  cspg->BuildIndex(base_vectors, num_threads, {default_params.max_degree, default_params.efc, default_params.dedup});
  build_timer.Stop();
  std::vector<std::vector<id_t>> knn;
  query_timer.Start();
  cspg->GetTopkNNParallel(nest_queries_vectors, k, num_threads, 1, efq, knn);
  query_timer.Stop();
  std::cout << "Query TIme: " << query_timer.GetTime() << std::endl;
  std::cout << "Recall@10: " << utils::GetRecall(k, d2, groundtruth, knn) << std::endl;
  // ... ... ...
  return 0;
}

This is an example of how to use the ANNS library to build and query an index. The main function takes in the path to the base vectors, queries vectors, and groundtruth file, as well as the number of partitions, maximum degree, and effective query count for the index. It then builds the index and performs queries on the queries vectors, and outputs the results to a CSV file.

To use the ANNS library simply, we wrap the CPP APIs with Python API, which you can use as follow. Example for ANNS Python API

# Include the library modules
import sys
mpath = 'Path/To/CSPG/ANNS/modules'
if mpath not in sys.path:
  sys.path.append(mpath)

# Import important modules
import anns
import numpy as np
from binary_io import  *

# Data path
base = "/var/lib/docker/anns/dataset/sift1m/base.fvecs"
query = "/var/lib/docker/anns/query/sift1m/query.fvecs"
gt = "/var/lib/docker/anns/query/sift1m/gt.ivecs"

# Read data from files
base = fvecs_read(base)
query = fvecs_read(query)
gt = ivecs_read(gt)
nb, d = base.shape
nq, _ = query.shape
_, ngt = gt.shape

# Parameters
m = 2
threads = 24
k = 10

# Reshape the data to adjust to the library APIs
base = base.flatten().tolist()
query = query.flatten().tolist()
gt = gt.flatten().tolist()

# Initialize your index and build
index = anns.CSPG_HNSW_FLOAT(d, m)
index.build(base, threads, [32, 128, 0.5])

# Search k-NN
knn = index.search(query, k, 1, ef1 = 1, ef2 = 128)

# Get recall by groudtruth
print(anns.get_recall(k, ngt, gt, knn))

Name		Name	Last commit message	Last commit date
parent directory ..
include		include
modules		modules
CMakeLists.txt		CMakeLists.txt
README.md		README.md
anns_bindings.cpp		anns_bindings.cpp
test_anns.ipynb		test_anns.ipynb

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

README.md

ANNS Library Usage

FilesExpand file tree

ANNS

Directory actions

More options

Directory actions

More options

Latest commit

History

ANNS

Folders and files

parent directory

README.md

ANNS Library Usage