Commit 0020240a authored by Feng Jiang's avatar Feng Jiang Committed by Paul Walmsley
Browse files

lib/string_kunit: add performance benchmark for strlen()



Introduce a benchmarking framework to the string_kunit test suite to
measure the execution efficiency of string functions.

The implementation is inspired by crc_benchmark(), measuring throughput
(MB/s) and latency (ns/call) across a range of string lengths. It
includes a warm-up phase, disables preemption during measurement, and
uses a fixed seed for reproducible results.

This framework allows for comparing different implementations (e.g.,
generic C vs. architecture-optimized assembly) within the KUnit
environment.

Initially, provide a benchmark for strlen().

Suggested-by: default avatarAndy Shevchenko <andy@kernel.org>
Suggested-by: default avatarEric Biggers <ebiggers@kernel.org>
Signed-off-by: default avatarFeng Jiang <jiangfeng@kylinos.cn>
Reviewed-by: default avatarKees Cook <kees@kernel.org>
Link: https://patch.msgid.link/20260130025018.172925-5-jiangfeng@kylinos.cn


[pjw@kernel.org: fixed a checkpatch issue]
Signed-off-by: default avatarPaul Walmsley <pjw@kernel.org>
parent 27b2810a
Loading
Loading
Loading
Loading
+11 −0
Original line number Diff line number Diff line
@@ -2518,6 +2518,17 @@ config STRING_HELPERS_KUNIT_TEST
	depends on KUNIT
	default KUNIT_ALL_TESTS

config STRING_KUNIT_BENCH
       bool "Benchmark string functions at runtime"
       depends on STRING_KUNIT_TEST
       help
         Enable performance measurement for string functions.

         This measures the execution efficiency of string functions
         during the KUnit test run.

         If unsure, say N.

config FFS_KUNIT_TEST
	tristate "KUnit test ffs-family functions at runtime" if !KUNIT_ALL_TESTS
	depends on KUNIT
+160 −0
Original line number Diff line number Diff line
@@ -6,11 +6,17 @@
#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt

#include <kunit/test.h>
#include <linux/ktime.h>
#include <linux/math64.h>
#include <linux/minmax.h>
#include <linux/mm.h>
#include <linux/module.h>
#include <linux/prandom.h>
#include <linux/printk.h>
#include <linux/slab.h>
#include <linux/string.h>
#include <linux/time64.h>
#include <linux/units.h>
#include <linux/vmalloc.h>

#define STRCMP_LARGE_BUF_LEN 2048
@@ -22,6 +28,9 @@
#define STRING_TEST_MAX_LEN	128
#define STRING_TEST_MAX_OFFSET	16

#define STRING_BENCH_SEED	888
#define STRING_BENCH_WORKLOAD	(1 * MEGA)

static void string_test_memset16(struct kunit *test)
{
	unsigned i, j, k;
@@ -707,6 +716,156 @@ static void string_test_strends(struct kunit *test)
	KUNIT_EXPECT_TRUE(test, strends("", ""));
}

#if IS_ENABLED(CONFIG_STRING_KUNIT_BENCH)
/* Target string lengths for benchmarking */
static const size_t bench_lens[] = {
	0, 1, 7, 8, 16, 31, 64, 127, 512, 1024, 3173, 4096,
};

/**
 * alloc_max_bench_buffer() - Allocate buffer for the max test case.
 * @test: KUnit context for managed allocation.
 * @lens: Array of lengths used in the benchmark cases.
 * @count: Number of elements in the @lens array.
 * @buf_len: [out] Pointer to store the actually allocated buffer
 * size (including NUL character).
 *
 * Return: Pointer to the allocated memory, or NULL on failure.
 */
static void *alloc_max_bench_buffer(struct kunit *test, const size_t *lens,
				    size_t count, size_t *buf_len)
{
	size_t max_len = 0;
	void *buf;

	for (size_t i = 0; i < count; i++)
		max_len = max(lens[i], max_len);

	/* Add space for NUL character */
	max_len += 1;

	buf = kunit_kzalloc(test, max_len, GFP_KERNEL);
	if (!buf)
		return NULL;

	if (buf_len)
		*buf_len = max_len;

	return buf;
}

/**
 * fill_random_string() - Populate a buffer with a random NUL-terminated string.
 * @buf: Buffer to fill.
 * @len: Length of the buffer in bytes.
 *
 * Fills the buffer with random non-NUL bytes and ensures the string is
 * properly NUL-terminated.
 */
static void fill_random_string(char *buf, size_t len)
{
	struct rnd_state state;

	if (!buf || !len)
		return;

	/* Use a fixed seed to ensure deterministic benchmark results */
	prandom_seed_state(&state, STRING_BENCH_SEED);
	prandom_bytes_state(&state, buf, len);

	/* Replace NUL characters to avoid early string termination */
	for (size_t i = 0; i < len; i++) {
		if (buf[i] == '\0')
			buf[i] = 0x01;
	}

	buf[len - 1] = '\0';
}

/**
 * STRING_BENCH() - Benchmark string functions.
 * @iters: Number of iterations to run.
 * @func: Function to benchmark.
 * @...: Variable arguments passed to @func.
 *
 * Disables preemption and measures the total time in nanoseconds to execute
 * @func(@__VA_ARGS__) for @iters times, including a small warm-up phase.
 *
 * Context: Disables preemption during measurement.
 * Return: Total execution time in nanoseconds (u64).
 */
#define STRING_BENCH(iters, func, ...)					\
({									\
	/* Volatile function pointer prevents dead code elimination */	\
	typeof(func) (* volatile __func) = (func);			\
	size_t __bn_iters = (iters);					\
	size_t __bn_warm_iters;						\
	u64 __bn_t;							\
									\
	/* Use 10% of the given iterations (maximum 50) to warm up */	\
	__bn_warm_iters = max(__bn_iters / 10, 50U);			\
									\
	for (size_t __bn_i = 0; __bn_i < __bn_warm_iters; __bn_i++)	\
		(void)__func(__VA_ARGS__);				\
									\
	preempt_disable();						\
	__bn_t = ktime_get_ns();					\
	for (size_t __bn_i = 0; __bn_i < __bn_iters; __bn_i++)		\
		(void)__func(__VA_ARGS__);				\
	__bn_t = ktime_get_ns() - __bn_t;				\
	preempt_enable();						\
	__bn_t;								\
})

/**
 * STRING_BENCH_BUF() - Benchmark harness for single-buffer functions.
 * @test: KUnit context.
 * @buf_name: Local char * variable name to be defined.
 * @buf_size: Local size_t variable name to be defined.
 * @func: Function to benchmark.
 * @...: Extra arguments for @func.
 *
 * Prepares a randomized, NUL-terminated buffer and iterates through lengths
 * in bench_lens, defining @buf_name and @buf_size in each loop.
 */
#define STRING_BENCH_BUF(test, buf_name, buf_size, func, ...)		\
do {									\
	size_t _bn_i, _bn_iters, _bn_size = 0;				\
	u64 _bn_t, _bn_mbps = 0, _bn_lat = 0;				\
	char *_bn_buf;							\
									\
	_bn_buf = alloc_max_bench_buffer(test, bench_lens,		\
			ARRAY_SIZE(bench_lens), &_bn_size);		\
	KUNIT_ASSERT_NOT_ERR_OR_NULL(test, _bn_buf);			\
									\
	fill_random_string(_bn_buf, _bn_size);				\
									\
	for (_bn_i = 0; _bn_i < ARRAY_SIZE(bench_lens); _bn_i++) {	\
		size_t buf_size = bench_lens[_bn_i];			\
		char *buf_name = _bn_buf + _bn_size - buf_size - 1;	\
		_bn_iters = STRING_BENCH_WORKLOAD / max(buf_size, 1U);	\
									\
		_bn_t = STRING_BENCH(_bn_iters, func, ##__VA_ARGS__);	\
		if (_bn_t > 0) {					\
			_bn_mbps = (u64)(buf_size) * _bn_iters *	\
					(NSEC_PER_SEC / MEGA);		\
			_bn_mbps = div64_u64(_bn_mbps, _bn_t);		\
			_bn_lat = div64_u64(_bn_t, _bn_iters);		\
		}							\
		kunit_info(test, "len=%zu: %llu MB/s (%llu ns/call)\n",	\
				buf_size, _bn_mbps, _bn_lat);		\
	}								\
} while (0)
#else
#define STRING_BENCH_BUF(test, buf_name, buf_size, func, ...)		\
	kunit_skip(test, "not enabled")
#endif /* IS_ENABLED(CONFIG_STRING_KUNIT_BENCH) */

static void string_bench_strlen(struct kunit *test)
{
	STRING_BENCH_BUF(test, buf, len, strlen, buf);
}

static struct kunit_case string_test_cases[] = {
	KUNIT_CASE(string_test_memset16),
	KUNIT_CASE(string_test_memset32),
@@ -732,6 +891,7 @@ static struct kunit_case string_test_cases[] = {
	KUNIT_CASE(string_test_strtomem),
	KUNIT_CASE(string_test_memtostr),
	KUNIT_CASE(string_test_strends),
	KUNIT_CASE(string_bench_strlen),
	{}
};