inst/unitTests/test_cpp.R

###########################################################################
#
# Test C functions optimized by SSE2/AVX/AVX2
#

library(SeqArray)
library(RUnit)


.popcnt <- function(x)
{
	ans <- 0L
	while(x > 0)
	{
		if (x %% 2) ans <- ans + 1L
		x <- x %/% 2
	}
	ans
}


test_popcnt <- function()
{
	set.seed(1000)
	v1 <- sample.int(2147483647L, 10000L, replace=TRUE)
	v2 <- sample.int(2147483647L, 10000L, replace=TRUE)

	c1 <- sapply(v1, .popcnt)
	c2 <- sapply(v2, .popcnt)

	t1 <- SeqArray:::.cfunction("test_array_popcnt32")(v1)
	t2 <- SeqArray:::.cfunction("test_array_popcnt32")(v2)
	t3 <- SeqArray:::.cfunction2("test_array_popcnt64")(v1, v2)

	checkEquals(c1, t1, "popcount u32")
	checkEquals(c2, t2, "popcount u32")
	checkEquals(c1+c2, t3, "popcount u64")

	invisible()
}


test_byte_count <- function()
{
	set.seed(1000)
	for (st in sample.int(1000L, 25L))
	{
		n <- 50000L + sample.int(64L, 1L) - 1L
		v <- sample.int(255L, n, replace=TRUE)
		v[sample.int(n, 25000L)] <- 0L
		v <- as.raw(v)

		n1 <- SeqArray:::.cfunction2("test_byte_count")(v, st)
		n2 <- sum(v[st:length(v)] != 0L)
		checkEquals(n1, n2, paste0("byte_count (start=", st, ")"))
	}

	invisible()
}


test_int8_replace <- function()
{
	set.seed(5000)
	for (st in sample.int(1000L, 25L))
	{
		n <- 50000L + sample.int(64L, 1L) - 1L
		v1 <- sample.int(127L, n, replace=TRUE)
		fd <- sample(v1, 1L)
		sub <- sample(v1, 1L)

		v2 <- SeqArray:::.cfunction4("test_int8_replace")(as.raw(v1), st, fd, sub)
		a <- v1[st:length(v1)]
		a[a == fd] <- sub
		v1[st:length(v1)] <- a
		v1 <- as.raw(v1)
		checkEquals(v1, v2, paste0("int8_replace (start=", st, ")"))
	}

	invisible()
}


test_int_count <- function()
{
	set.seed(5000)
	for (st in sample.int(1000L, 25L))
	{
		n <- 50000L + sample.int(64L, 1L) - 1L
		v <- sample.int(255L, n, replace=TRUE)
		fd <- sample(v, 1L)

		n1 <- SeqArray:::.cfunction3("test_int32_count")(v, st, fd)
		n2 <- sum(v[st:length(v)] == fd)
		checkEquals(n1, n2, paste0("int_count (start=", st, ")"))
	}

	invisible()
}


test_i8_count <- function()
{
	set.seed(5000)
	for (st in sample.int(1000L, 25L))
	{
		n <- 50000L + sample.int(64L, 1L) - 1L
		v <- as.raw(sample.int(255L, n, replace=TRUE))
		fd <- sample(v, 1L)

		n1 <- SeqArray:::.cfunction3("test_i8_count")(v, st, fd)
		n2 <- sum(v[st:length(v)] == fd)
		checkEquals(n1, n2, paste0("i8_count (start=", st, ")"))
	}

	invisible()
}


test_int_count2 <- function()
{
	set.seed(5000)
	for (st in sample.int(1000L, 25L))
	{
		n <- 50000L + sample.int(64L, 1L) - 1L
		v <- sample.int(255L, n, replace=TRUE)
		fd1 <- sample(v, 1L)
		fd2 <- sample(v, 1L)

		n1 <- SeqArray:::.cfunction4("test_int32_count2")(v, st, fd1, fd2)
		n2 <- c(sum(v[st:length(v)] == fd1), sum(v[st:length(v)] == fd2))
		checkEquals(n1, n2, paste0("int_count2 (start=", st, ")"))
	}

	invisible()
}


test_i8_count2 <- function()
{
	set.seed(5000)
	for (st in sample.int(1000L, 25L))
	{
		n <- 50000L + sample.int(64L, 1L) - 1L
		v <- as.raw(sample.int(255L, n, replace=TRUE))
		fd1 <- sample(v, 1L)
		fd2 <- sample(v, 1L)

		n1 <- SeqArray:::.cfunction4("test_int8_count2")(v, st, fd1, fd2)
		n2 <- c(sum(v[st:length(v)] == fd1), sum(v[st:length(v)] == fd2))
		checkEquals(n1, n2, paste0("i8_count2 (start=", st, ")"))
	}

	invisible()
}


test_int_count3 <- function()
{
	set.seed(5000)
	for (st in sample.int(1000L, 25L))
	{
		n <- 50000L + sample.int(64L, 1L) - 1L
		v <- sample.int(255L, n, replace=TRUE)
		fd1 <- sample(v, 1L)
		fd2 <- sample(v, 1L)
		fd3 <- sample(v, 1L)

		n1 <- SeqArray:::.cfunction5("test_int32_count3")(v, st, fd1, fd2, fd3)
		v <- v[st:length(v)]
		n2 <- c(sum(v==fd1), sum(v==fd2), sum(v==fd3))
		checkEquals(n1, n2, paste0("int_count3 (start=", st, ")"))
	}

	invisible()
}


test_i8_count3 <- function()
{
	set.seed(5000)
	for (st in sample.int(1000L, 25L))
	{
		n <- 50000L + sample.int(64L, 1L) - 1L
		v <- as.raw(sample.int(255L, n, replace=TRUE))
		fd1 <- sample(v, 1L)
		fd2 <- sample(v, 1L)
		fd3 <- sample(v, 1L)

		n1 <- SeqArray:::.cfunction5("test_int8_count3")(v, st, fd1, fd2, fd3)
		v <- v[st:length(v)]
		n2 <- c(sum(v==fd1), sum(v==fd2), sum(v==fd3))
		checkEquals(n1, n2, paste0("i8_count3 (start=", st, ")"))
	}

	invisible()
}


test_int_replace <- function()
{
	set.seed(5000)
	for (st in sample.int(1000L, 25L))
	{
		n <- 50000L + sample.int(64L, 1L) - 1L
		v1 <- sample.int(255L, n, replace=TRUE)
		fd <- sample(v1, 1L)
		sub <- sample(v1, 1L)

		v2 <- SeqArray:::.cfunction4("test_int32_replace")(v1, st, fd, sub)
		a <- v1[st:length(v1)]
		a[a == fd] <- sub
		v1[st:length(v1)] <- a
		checkEquals(v1, v2, paste0("int_replace (start=", st, ")"))
	}

	invisible()
}


test_position_index <- function()
{
	set.seed(1000)

	for (k in 1:25)
	{
		len <- sample.int(2L, 50000L, replace=TRUE)

		f <- createfn.gds("test.gds")
		n <- add.gdsn(f, "new", len)

		ii <- sample.int(length(len), 100L)
		c.val <- SeqArray:::.cfunction2("test_position_index")(n, ii)

		s <- c(); v <- c()
		for (i in ii)
		{
			s <- c(s, ifelse(i > 1L, sum(len[1:(i-1L)]), 0L))
			v <- c(v, len[i])
		}
		checkEquals(c.val[[1L]], s, "test_position_index: accumulated sum")
		checkEquals(c.val[[2L]], v, "test_position_index: current value")

		closefn.gds(f)
		unlink("test.gds", force=TRUE)
	}

	invisible()
}
zhengxwen/SeqArray documentation built on Jan. 10, 2025, 9:09 p.m.