# library(testthat); library(BiocNeighbors); source("setup.R"); source("test-findNeighbors.R")
set.seed(999999)
test_that("findNeighbors works with basic options", {
Y <- matrix(rnorm(10000), ncol=20)
d <- median(findDistance(Y, k=8))
out <- findNeighbors(Y, threshold=d)
ref <- refFindNeighbors(Y, threshold=d)
expect_equal(out, ref)
d <- median(findDistance(Y, k=8, BNPARAM=KmknnParam(distance="Manhattan")))
out <- findNeighbors(Y, threshold=d, BNPARAM=KmknnParam(distance="Manhattan"))
ref <- refFindNeighbors(Y, threshold=d, type="manhattan")
expect_equal(out, ref)
d <- median(findDistance(Y, k=8, BNPARAM=KmknnParam(distance="Cosine")))
out <- findNeighbors(Y, threshold=d, BNPARAM=KmknnParam(distance="Cosine"))
Y1 <- Y/sqrt(rowSums(Y^2))
ref <- findNeighbors(Y1, threshold=d)
expect_equal(out, ref)
})
test_that("findNeighbors works in parallel", {
Y <- matrix(rnorm(10000), ncol=20)
d <- median(findDistance(Y, k=5))
out <- findNeighbors(Y, threshold=d)
pout <- findNeighbors(Y, threshold=d, num.threads=2)
expect_identical(out, pout)
pout <- findNeighbors(Y, threshold=d, BPPARAM=BiocParallel::SnowParam(2))
expect_identical(out, pout)
})
test_that("findNeighbors works with subsets", {
Y <- matrix(rnorm(10000), ncol=20)
d <- median(findDistance(Y, k=3))
full <- findNeighbors(Y, threshold=d)
sout <- findNeighbors(Y, subset=1:10, threshold=d)
out <- full
out$index <- out$index[1:10]
out$distance <- out$distance[1:10]
expect_identical(out, sout)
expect_error(findNeighbors(Y, threshold=d, subset=100000), "out-of-range")
out <- findNeighbors(Y[0,,drop=FALSE], threshold=d)
expect_identical(length(out$index), 0L)
expect_identical(length(out$distance), 0L)
# Works with non-integer options.
keep <- rbinom(nrow(Y), 1, 0.5) == 1
sout <- findNeighbors(Y, subset=keep, threshold=d)
out <- full
out$index <- out$index[keep]
out$distance <- out$distance[keep]
expect_identical(out, sout)
Z <- Y
rownames(Z) <- seq_len(nrow(Z))
keep <- sample(rownames(Z), nrow(Z) / 2)
sout <- findNeighbors(Z, subset=keep, threshold=d)
out <- full
out$index <- out$index[as.integer(keep)]
out$distance <- out$distance[as.integer(keep)]
expect_identical(out, sout)
})
test_that("findNeighbors works with prebuilt indices", {
Y <- matrix(rnorm(10000), ncol=20)
d <- median(findDistance(Y, k=3))
built <- buildIndex(Y, threshold=d)
out <- findNeighbors(Y, threshold=d)
preout <- findNeighbors(built, threshold=d)
expect_identical(out, preout)
# Unaffected by BNPARAM settings at this point.
preout <- findNeighbors(built, threshold=d, BNPARAM=AnnoyParam())
expect_identical(out, preout)
# Throws an error for deserialized prebuilt indices.
tmp <- tempfile(fileext=".rds")
saveRDS(built, tmp)
expect_error(findNeighbors(readRDS(tmp), threshold=d), "null pointer")
})
test_that("findNeighbors works with variable thresholds", {
Y <- matrix(rnorm(10000), ncol=20)
d4 <- median(findDistance(Y, k=4))
d10 <- median(findDistance(Y, k=10))
th <- rep(c(d4, d10), length.out=nrow(Y))
out <- findNeighbors(Y, threshold=th)
keep <- th == d4
ref <- findNeighbors(Y, threshold=d4)
expect_identical(out$index[keep], ref$index[keep])
expect_identical(out$distance[keep], ref$distance[keep])
keep <- th == d10
ref <- findNeighbors(Y, threshold=d10)
expect_identical(out$index[keep], ref$index[keep])
expect_identical(out$distance[keep], ref$distance[keep])
expect_error(findNeighbors(Y, threshold=1:10), "length equal")
})
test_that("findNeighbors works with variable outputs", {
Y <- matrix(rnorm(10000), ncol=20)
d <- median(findDistance(Y, k=8))
out <- findNeighbors(Y, threshold=d)
iout <- findNeighbors(Y, threshold=d, get.distance=FALSE)
expect_null(iout$distance)
expect_identical(iout$index, out$index)
dout <- findNeighbors(Y, threshold=d, get.index=FALSE)
expect_null(dout$index)
expect_identical(dout$distance, out$distance)
count <- findNeighbors(Y, threshold=d, get.index=FALSE, get.distance=FALSE)
expect_identical(count, lengths(out$index))
})
Add the following code to your website.
For more information on customizing the embed code, read Embedding Snippets.