Python CuHNSW示例

编程语言: Python

命名空间/包名称: cuhnsw

类/类型: CuHNSW

hotexamples.com的示例: 4

Python CuHNSW - 已找到4个示例。这些是从开源项目中提取的、最受好评的 cuhnsw.CuHNSW 真实 Python 示例。您可以为示例评分，以帮助我们提高示例质量。

常用方法

显示/隐藏

CuHNSW(4)

load_index(3)

search_knn(3)

build(1)

save_index(1)

set_data(1)

示例#1

显示文件

def run_gpu_inference(topk=100, index_file=INDEX_FILE, ef_search=300):
  """Run a timed CuHNSW k-NN search and score it against stored neighbors.

  Loads the index at ``RES_DIR/index_file``, reads the "test" and
  "neighbors" datasets from the HDF5 file at ``RES_DIR/DATA_FILE``, divides
  every query row by its L2 norm, and searches for ``topk`` neighbors.

  Args:
    topk: number of neighbors requested per query; also the number of
      columns kept from the "neighbors" dataset and the accuracy divisor.
    index_file: index file name, resolved relative to ``RES_DIR``.
    ef_search: third positional argument forwarded to ``search_knn``.

  Returns:
    Tuple ``(elapsed_seconds, mean_accuracy)`` where the elapsed time covers
    only the ``search_knn`` call.
  """
  print("=" * BARRIER_SIZE)
  data_path = pjoin(RES_DIR, DATA_FILE)
  index_path = pjoin(RES_DIR, index_file)
  LOGGER.info("gpu inference on %s with index %s", data_path, index_path)
  ch0 = CuHNSW(OPT)
  LOGGER.info("load model from %s by cuhnsw", index_path)
  ch0.load_index(index_path)

  # The context manager closes the file even when a dataset is missing or
  # the conversion fails, which the manual open/close pair did not.
  with h5py.File(data_path, "r") as h5f:
    queries = h5f["test"][:, :].astype(np.float32)
    # presumably the ground-truth neighbor ids per query -- TODO confirm
    neighbors = h5f["neighbors"][:, :topk].astype(np.int32)
  num_queries = queries.shape[0]
  # Scale each query row to unit L2 norm (in place).
  queries /= np.linalg.norm(queries, axis=1)[:, None]

  start = time.time()
  pred_nn, _, _ = ch0.search_knn(queries, topk, ef_search)
  el0 = time.time() - start
  LOGGER.info("elapsed for inferencing %d queries of top@%d (ef_search: %d): "
              "%.4e sec", num_queries, topk, ef_search, el0)

  # Per-query accuracy: fraction of the topk slots whose predicted id also
  # appears in the stored neighbor list for that query.
  accs = [len(set(_pred_nn) & set(_gt_nn)) / float(topk)
          for _pred_nn, _gt_nn in zip(pred_nn, neighbors)]
  mean_acc = np.mean(accs)
  LOGGER.info("accuracy mean: %.4e, std: %.4e", mean_acc, np.std(accs))
  return el0, mean_acc

示例#2

显示文件

文件： example1.py 项目： js1010/cuhnsw

def run_gpu_inference2(topk=5, index_file="cuhnsw.index", ef_search=300):
  """Search the first five test queries and print library vs. recomputed distances.

  Loads the index at ``RES_DIR/index_file``, reads the "train" dataset and
  the first five rows of "test" from ``RES_DIR/DATA_FILE``, runs
  ``search_knn`` and prints, for each returned neighbor, the distance
  reported by the library next to one recomputed with NumPy.

  Args:
    topk: number of neighbors requested per query.
    index_file: index file name, resolved relative to ``RES_DIR``.
    ef_search: third positional argument forwarded to ``search_knn``.

  Raises:
    ValueError: if the module-level ``DIST_TYPE`` is neither "l2" nor "dot"
      when a neighbor is about to be printed (previously this surfaced as an
      UnboundLocalError on ``real_dist``).
  """
  print("=" * BARRIER_SIZE)
  data_path = pjoin(RES_DIR, DATA_FILE)
  index_path = pjoin(RES_DIR, index_file)
  LOGGER.info("gpu inference on %s with index %s", data_path, index_path)
  ch0 = CuHNSW(OPT)
  LOGGER.info("load model from %s by cuhnsw", index_path)
  ch0.load_index(index_path)

  # The context manager closes the file even if a dataset lookup fails.
  with h5py.File(data_path, "r") as h5f:
    data = h5f["train"][:, :].astype(np.float32)
    queries = h5f["test"][:5, :].astype(np.float32)
  if NRZ:
    # Only the train rows are normalized here; queries are left untouched.
    # NOTE(review): confirm that leaving queries unnormalized is intended.
    data /= np.linalg.norm(data, axis=1)[:, None]

  # queries already holds at most five rows, so no further slicing is needed.
  nns, distances, found_cnt = ch0.search_knn(queries, topk, ef_search)
  for idx, (nn0, distance, cnt) in \
      enumerate(zip(nns, distances, found_cnt)):
    print("=" * BARRIER_SIZE)
    print(f"query {idx + 1}")
    print("-" * BARRIER_SIZE)
    # Only the first cnt entries of each result row are printed.
    for _idx, (_nn, _dist) in enumerate(zip(nn0[:cnt], distance[:cnt])):
      if DIST_TYPE == "l2":
        real_dist = np.linalg.norm(data[_nn] - queries[idx])
        # presumably the library reports squared L2 distance -- TODO confirm
        _dist = np.sqrt(_dist)
      elif DIST_TYPE == "dot":
        real_dist = data[_nn].dot(queries[idx])
      else:
        raise ValueError(f"unsupported DIST_TYPE: {DIST_TYPE!r}")
      print(f"rank {_idx + 1}. neighbor: {_nn}, dist by lib: {_dist}, "
            f"actual dist: {real_dist}")

示例#3

显示文件

def run_gpu_inference_large(topk=100, index_file=INDEX_FILE, ef_search=300,
                            num_queries=1000000, num_dims=50):
  """Time a CuHNSW k-NN search over randomly generated, unit-norm queries.

  Args:
    topk: number of neighbors requested per query.
    index_file: index file name, resolved relative to ``RES_DIR``.
    ef_search: third positional argument forwarded to ``search_knn``.
    num_queries: number of random query rows to generate.
    num_dims: number of columns in each random query.

  Returns:
    Wall-clock seconds spent inside the ``search_knn`` call.
  """
  print("=" * BARRIER_SIZE)
  index_path = pjoin(RES_DIR, index_file)
  # The data path is only reported in the log line; no file is read here.
  data_path = pjoin(RES_DIR, DATA_FILE)
  LOGGER.info("gpu inference on %s with index %s", data_path, index_path)
  searcher = CuHNSW(OPT)
  LOGGER.info("load model from %s by cuhnsw", index_path)
  searcher.load_index(index_path)

  # Draw standard-normal queries, then scale each row to unit L2 norm.
  query_shape = (num_queries, num_dims)
  queries = np.random.normal(size=query_shape).astype(np.float32)
  row_norms = np.linalg.norm(queries, axis=1, keepdims=True)
  queries /= row_norms
  query_count = queries.shape[0]

  began = time.time()
  # Results are discarded; only the timing matters in this benchmark.
  _nns, _dists, _counts = searcher.search_knn(queries, topk, ef_search)
  elapsed = time.time() - began
  LOGGER.info("elapsed for inferencing %d queries of top@%d (ef_search: %d): "
              "%.4e sec", query_count, topk, ef_search, elapsed)
  return elapsed

示例#4

显示文件

def run_gpu_training(ef_const=150):
  """Build a CuHNSW index from the "train" dataset and save it to disk.

  Reads the "train" dataset from ``RES_DIR/DATA_FILE``, builds the index and
  writes it to ``RES_DIR/CUHNSW_INDEX_FILE``.

  Args:
    ef_const: value stored under ``OPT["ef_construction"]`` before the
      ``CuHNSW`` object is created.

  Returns:
    Wall-clock seconds spent inside the ``build`` call (loading the data and
    saving the index are not included).
  """
  print("=" * BARRIER_SIZE)
  data_path = pjoin(RES_DIR, DATA_FILE)
  LOGGER.info("gpu training on %s with ef const %d", data_path, ef_const)
  # NOTE: this mutates the shared module-level OPT dict, so the new
  # ef_construction value stays visible to later users of OPT.
  OPT["ef_construction"] = ef_const
  ch0 = CuHNSW(OPT)
  # The context manager closes the file even if the dataset lookup or the
  # float32 conversion raises.
  with h5py.File(data_path, "r") as h5f:
    data = h5f["train"][:, :].astype(np.float32)
  ch0.set_data(data)
  start = time.time()
  ch0.build()
  el0 = time.time() - start
  LOGGER.info("elpased time to build by cuhnsw: %.4e sec", el0)
  index_path = pjoin(RES_DIR, CUHNSW_INDEX_FILE)
  ch0.save_index(index_path)
  return el0