xref: /f-stack/dpdk/app/test/test_efd_perf.c (revision 2d9fd380)
14418919fSjohnjiang /* SPDX-License-Identifier: BSD-3-Clause
24418919fSjohnjiang  * Copyright(c) 2016-2017 Intel Corporation
34418919fSjohnjiang  */
44418919fSjohnjiang 
54418919fSjohnjiang #include <stdio.h>
64418919fSjohnjiang #include <inttypes.h>
74418919fSjohnjiang 
84418919fSjohnjiang #include <rte_lcore.h>
94418919fSjohnjiang #include <rte_cycles.h>
104418919fSjohnjiang #include <rte_malloc.h>
114418919fSjohnjiang #include <rte_random.h>
124418919fSjohnjiang #include <rte_efd.h>
134418919fSjohnjiang #include <rte_memcpy.h>
144418919fSjohnjiang #include <rte_thash.h>
154418919fSjohnjiang 
164418919fSjohnjiang #include "test.h"
174418919fSjohnjiang 
184418919fSjohnjiang #define NUM_KEYSIZES 10
194418919fSjohnjiang #define NUM_SHUFFLES 10
204418919fSjohnjiang #define MAX_KEYSIZE 64
214418919fSjohnjiang #define MAX_ENTRIES (1 << 19)
224418919fSjohnjiang #define KEYS_TO_ADD (MAX_ENTRIES * 3 / 4) /* 75% table utilization */
234418919fSjohnjiang #define NUM_LOOKUPS (KEYS_TO_ADD * 5) /* Loop among keys added, several times */
244418919fSjohnjiang 
254418919fSjohnjiang #if RTE_EFD_VALUE_NUM_BITS == 32
264418919fSjohnjiang #define VALUE_BITMASK 0xffffffff
274418919fSjohnjiang #else
284418919fSjohnjiang #define VALUE_BITMASK ((1 << RTE_EFD_VALUE_NUM_BITS) - 1)
294418919fSjohnjiang #endif
304418919fSjohnjiang static unsigned int test_socket_id;
314418919fSjohnjiang 
efd_get_all_sockets_bitmask(void)324418919fSjohnjiang static inline uint8_t efd_get_all_sockets_bitmask(void)
334418919fSjohnjiang {
344418919fSjohnjiang 	uint8_t all_cpu_sockets_bitmask = 0;
354418919fSjohnjiang 	unsigned int i;
36*2d9fd380Sjfb8856606 	unsigned int next_lcore = rte_get_main_lcore();
374418919fSjohnjiang 	const int val_true = 1, val_false = 0;
384418919fSjohnjiang 	for (i = 0; i < rte_lcore_count(); i++) {
394418919fSjohnjiang 		all_cpu_sockets_bitmask |= 1 << rte_lcore_to_socket_id(next_lcore);
404418919fSjohnjiang 		next_lcore = rte_get_next_lcore(next_lcore, val_false, val_true);
414418919fSjohnjiang 	}
424418919fSjohnjiang 
434418919fSjohnjiang 	return all_cpu_sockets_bitmask;
444418919fSjohnjiang }
454418919fSjohnjiang 
464418919fSjohnjiang enum operations {
474418919fSjohnjiang 	ADD = 0,
484418919fSjohnjiang 	LOOKUP,
494418919fSjohnjiang 	LOOKUP_MULTI,
504418919fSjohnjiang 	DELETE,
514418919fSjohnjiang 	NUM_OPERATIONS
524418919fSjohnjiang };
534418919fSjohnjiang 
544418919fSjohnjiang struct efd_perf_params {
554418919fSjohnjiang 	struct rte_efd_table *efd_table;
564418919fSjohnjiang 	uint32_t key_size;
574418919fSjohnjiang 	unsigned int cycle;
584418919fSjohnjiang };
594418919fSjohnjiang 
604418919fSjohnjiang static uint32_t hashtest_key_lens[] = {
614418919fSjohnjiang 	/* standard key sizes */
624418919fSjohnjiang 	4, 8, 16, 32, 48, 64,
634418919fSjohnjiang 	/* IPv4 SRC + DST + protocol, unpadded */
644418919fSjohnjiang 	9,
654418919fSjohnjiang 	/* IPv4 5-tuple, unpadded */
664418919fSjohnjiang 	13,
674418919fSjohnjiang 	/* IPv6 5-tuple, unpadded */
684418919fSjohnjiang 	37,
694418919fSjohnjiang 	/* IPv6 5-tuple, padded to 8-byte boundary */
704418919fSjohnjiang 	40
714418919fSjohnjiang };
724418919fSjohnjiang 
734418919fSjohnjiang /* Array to store number of cycles per operation */
744418919fSjohnjiang static uint64_t cycles[NUM_KEYSIZES][NUM_OPERATIONS];
754418919fSjohnjiang 
764418919fSjohnjiang /* Array to store the data */
774418919fSjohnjiang static efd_value_t data[KEYS_TO_ADD];
784418919fSjohnjiang 
794418919fSjohnjiang /* Array to store all input keys */
804418919fSjohnjiang static uint8_t keys[KEYS_TO_ADD][MAX_KEYSIZE];
814418919fSjohnjiang 
824418919fSjohnjiang /* Shuffle the keys that have been added, so lookups will be totally random */
834418919fSjohnjiang static void
shuffle_input_keys(struct efd_perf_params * params)844418919fSjohnjiang shuffle_input_keys(struct efd_perf_params *params)
854418919fSjohnjiang {
864418919fSjohnjiang 	efd_value_t temp_data;
874418919fSjohnjiang 	unsigned int i;
884418919fSjohnjiang 	uint32_t swap_idx;
894418919fSjohnjiang 	uint8_t temp_key[MAX_KEYSIZE];
904418919fSjohnjiang 
914418919fSjohnjiang 	for (i = KEYS_TO_ADD - 1; i > 0; i--) {
924418919fSjohnjiang 		swap_idx = rte_rand() % i;
934418919fSjohnjiang 
944418919fSjohnjiang 		memcpy(temp_key, keys[i], hashtest_key_lens[params->cycle]);
954418919fSjohnjiang 		temp_data = data[i];
964418919fSjohnjiang 
974418919fSjohnjiang 		memcpy(keys[i], keys[swap_idx], hashtest_key_lens[params->cycle]);
984418919fSjohnjiang 		data[i] = data[swap_idx];
994418919fSjohnjiang 
1004418919fSjohnjiang 		memcpy(keys[swap_idx], temp_key, hashtest_key_lens[params->cycle]);
1014418919fSjohnjiang 		data[swap_idx] = temp_data;
1024418919fSjohnjiang 	}
1034418919fSjohnjiang }
1044418919fSjohnjiang 
key_compare(const void * key1,const void * key2)1054418919fSjohnjiang static int key_compare(const void *key1, const void *key2)
1064418919fSjohnjiang {
1074418919fSjohnjiang 	return memcmp(key1, key2, MAX_KEYSIZE);
1084418919fSjohnjiang }
1094418919fSjohnjiang 
1104418919fSjohnjiang /*
1114418919fSjohnjiang  * TODO: we could "error proof" these as done in test_hash_perf.c ln 165:
1124418919fSjohnjiang  *
1134418919fSjohnjiang  * The current setup may give errors if too full in some cases which we check
1144418919fSjohnjiang  * for. However, since EFD allows for ~99% capacity, these errors are rare for
1154418919fSjohnjiang  * #"KEYS_TO_ADD" which is 75% capacity.
1164418919fSjohnjiang  */
1174418919fSjohnjiang static int
setup_keys_and_data(struct efd_perf_params * params,unsigned int cycle)1184418919fSjohnjiang setup_keys_and_data(struct efd_perf_params *params, unsigned int cycle)
1194418919fSjohnjiang {
1204418919fSjohnjiang 	unsigned int i, j;
1214418919fSjohnjiang 	int num_duplicates;
1224418919fSjohnjiang 
1234418919fSjohnjiang 	params->key_size = hashtest_key_lens[cycle];
1244418919fSjohnjiang 	params->cycle = cycle;
1254418919fSjohnjiang 
1264418919fSjohnjiang 	/* Reset all arrays */
1274418919fSjohnjiang 	for (i = 0; i < params->key_size; i++)
1284418919fSjohnjiang 		keys[0][i] = 0;
1294418919fSjohnjiang 
1304418919fSjohnjiang 	/* Generate a list of keys, some of which may be duplicates */
1314418919fSjohnjiang 	for (i = 0; i < KEYS_TO_ADD; i++) {
1324418919fSjohnjiang 		for (j = 0; j < params->key_size; j++)
1334418919fSjohnjiang 			keys[i][j] = rte_rand() & 0xFF;
1344418919fSjohnjiang 
1354418919fSjohnjiang 		data[i] = rte_rand() & VALUE_BITMASK;
1364418919fSjohnjiang 	}
1374418919fSjohnjiang 
1384418919fSjohnjiang 	/* Remove duplicates from the keys array */
1394418919fSjohnjiang 	do {
1404418919fSjohnjiang 		num_duplicates = 0;
1414418919fSjohnjiang 
1424418919fSjohnjiang 		/* Sort the list of keys to make it easier to find duplicates */
1434418919fSjohnjiang 		qsort(keys, KEYS_TO_ADD, MAX_KEYSIZE, key_compare);
1444418919fSjohnjiang 
1454418919fSjohnjiang 		/* Sift through the list of keys and look for duplicates */
1464418919fSjohnjiang 		int num_duplicates = 0;
1474418919fSjohnjiang 		for (i = 0; i < KEYS_TO_ADD - 1; i++) {
1484418919fSjohnjiang 			if (memcmp(keys[i], keys[i + 1], params->key_size) == 0) {
1494418919fSjohnjiang 				/* This key already exists, try again */
1504418919fSjohnjiang 				num_duplicates++;
1514418919fSjohnjiang 				for (j = 0; j < params->key_size; j++)
1524418919fSjohnjiang 					keys[i][j] = rte_rand() & 0xFF;
1534418919fSjohnjiang 			}
1544418919fSjohnjiang 		}
1554418919fSjohnjiang 	} while (num_duplicates != 0);
1564418919fSjohnjiang 
1574418919fSjohnjiang 	/* Shuffle the random values again */
1584418919fSjohnjiang 	shuffle_input_keys(params);
1594418919fSjohnjiang 
1604418919fSjohnjiang 	params->efd_table = rte_efd_create("test_efd_perf",
1614418919fSjohnjiang 			MAX_ENTRIES, params->key_size,
1624418919fSjohnjiang 			efd_get_all_sockets_bitmask(), test_socket_id);
1634418919fSjohnjiang 	TEST_ASSERT_NOT_NULL(params->efd_table, "Error creating the efd table\n");
1644418919fSjohnjiang 
1654418919fSjohnjiang 	return 0;
1664418919fSjohnjiang }
1674418919fSjohnjiang 
1684418919fSjohnjiang static int
timed_adds(struct efd_perf_params * params)1694418919fSjohnjiang timed_adds(struct efd_perf_params *params)
1704418919fSjohnjiang {
1714418919fSjohnjiang 	const uint64_t start_tsc = rte_rdtsc();
1724418919fSjohnjiang 	unsigned int i, a;
1734418919fSjohnjiang 	int32_t ret;
1744418919fSjohnjiang 
1754418919fSjohnjiang 	for (i = 0; i < KEYS_TO_ADD; i++) {
1764418919fSjohnjiang 		ret = rte_efd_update(params->efd_table, test_socket_id, keys[i],
1774418919fSjohnjiang 				data[i]);
1784418919fSjohnjiang 		if (ret != 0) {
1794418919fSjohnjiang 			printf("Error %d in rte_efd_update - key=0x", ret);
1804418919fSjohnjiang 			for (a = 0; a < params->key_size; a++)
1814418919fSjohnjiang 				printf("%02x", keys[i][a]);
1824418919fSjohnjiang 			printf(" value=%d\n", data[i]);
1834418919fSjohnjiang 
1844418919fSjohnjiang 			return -1;
1854418919fSjohnjiang 		}
1864418919fSjohnjiang 	}
1874418919fSjohnjiang 
1884418919fSjohnjiang 	const uint64_t end_tsc = rte_rdtsc();
1894418919fSjohnjiang 	const uint64_t time_taken = end_tsc - start_tsc;
1904418919fSjohnjiang 
1914418919fSjohnjiang 	cycles[params->cycle][ADD] = time_taken / KEYS_TO_ADD;
1924418919fSjohnjiang 	return 0;
1934418919fSjohnjiang }
1944418919fSjohnjiang 
1954418919fSjohnjiang static int
timed_lookups(struct efd_perf_params * params)1964418919fSjohnjiang timed_lookups(struct efd_perf_params *params)
1974418919fSjohnjiang {
1984418919fSjohnjiang 	unsigned int i, j, a;
1994418919fSjohnjiang 	const uint64_t start_tsc = rte_rdtsc();
2004418919fSjohnjiang 	efd_value_t ret_data;
2014418919fSjohnjiang 
2024418919fSjohnjiang 	for (i = 0; i < NUM_LOOKUPS / KEYS_TO_ADD; i++) {
2034418919fSjohnjiang 		for (j = 0; j < KEYS_TO_ADD; j++) {
2044418919fSjohnjiang 			ret_data = rte_efd_lookup(params->efd_table,
2054418919fSjohnjiang 					test_socket_id, keys[j]);
2064418919fSjohnjiang 			if (ret_data != data[j]) {
2074418919fSjohnjiang 				printf("Value mismatch using rte_efd_lookup: "
2084418919fSjohnjiang 						"key #%d (0x", i);
2094418919fSjohnjiang 				for (a = 0; a < params->key_size; a++)
2104418919fSjohnjiang 					printf("%02x", keys[i][a]);
2114418919fSjohnjiang 				printf(")\n");
2124418919fSjohnjiang 				printf("  Expected %d, got %d\n", data[i],
2134418919fSjohnjiang 						ret_data);
2144418919fSjohnjiang 
2154418919fSjohnjiang 				return -1;
2164418919fSjohnjiang 			}
2174418919fSjohnjiang 
2184418919fSjohnjiang 		}
2194418919fSjohnjiang 	}
2204418919fSjohnjiang 
2214418919fSjohnjiang 	const uint64_t end_tsc = rte_rdtsc();
2224418919fSjohnjiang 	const uint64_t time_taken = end_tsc - start_tsc;
2234418919fSjohnjiang 
2244418919fSjohnjiang 	cycles[params->cycle][LOOKUP] = time_taken / NUM_LOOKUPS;
2254418919fSjohnjiang 
2264418919fSjohnjiang 	return 0;
2274418919fSjohnjiang }
2284418919fSjohnjiang 
2294418919fSjohnjiang static int
timed_lookups_multi(struct efd_perf_params * params)2304418919fSjohnjiang timed_lookups_multi(struct efd_perf_params *params)
2314418919fSjohnjiang {
2324418919fSjohnjiang 	unsigned int i, j, k, a;
2334418919fSjohnjiang 	efd_value_t result[RTE_EFD_BURST_MAX] = {0};
2344418919fSjohnjiang 	const void *keys_burst[RTE_EFD_BURST_MAX];
2354418919fSjohnjiang 	const uint64_t start_tsc = rte_rdtsc();
2364418919fSjohnjiang 
2374418919fSjohnjiang 	for (i = 0; i < NUM_LOOKUPS / KEYS_TO_ADD; i++) {
2384418919fSjohnjiang 		for (j = 0; j < KEYS_TO_ADD / RTE_EFD_BURST_MAX; j++) {
2394418919fSjohnjiang 			for (k = 0; k < RTE_EFD_BURST_MAX; k++)
2404418919fSjohnjiang 				keys_burst[k] = keys[j * RTE_EFD_BURST_MAX + k];
2414418919fSjohnjiang 
2424418919fSjohnjiang 			rte_efd_lookup_bulk(params->efd_table, test_socket_id,
2434418919fSjohnjiang 					RTE_EFD_BURST_MAX,
2444418919fSjohnjiang 					keys_burst, result);
2454418919fSjohnjiang 
2464418919fSjohnjiang 			for (k = 0; k < RTE_EFD_BURST_MAX; k++) {
2474418919fSjohnjiang 				uint32_t data_idx = j * RTE_EFD_BURST_MAX + k;
2484418919fSjohnjiang 				if (result[k] != data[data_idx]) {
2494418919fSjohnjiang 					printf("Value mismatch using "
2504418919fSjohnjiang 						"rte_efd_lookup_bulk: key #%d "
2514418919fSjohnjiang 						"(0x", i);
2524418919fSjohnjiang 					for (a = 0; a < params->key_size; a++)
2534418919fSjohnjiang 						printf("%02x",
2544418919fSjohnjiang 							keys[data_idx][a]);
2554418919fSjohnjiang 					printf(")\n");
2564418919fSjohnjiang 					printf("  Expected %d, got %d\n",
2574418919fSjohnjiang 						data[data_idx], result[k]);
2584418919fSjohnjiang 
2594418919fSjohnjiang 					return -1;
2604418919fSjohnjiang 				}
2614418919fSjohnjiang 			}
2624418919fSjohnjiang 		}
2634418919fSjohnjiang 	}
2644418919fSjohnjiang 
2654418919fSjohnjiang 	const uint64_t end_tsc = rte_rdtsc();
2664418919fSjohnjiang 	const uint64_t time_taken = end_tsc - start_tsc;
2674418919fSjohnjiang 
2684418919fSjohnjiang 	cycles[params->cycle][LOOKUP_MULTI] = time_taken / NUM_LOOKUPS;
2694418919fSjohnjiang 
2704418919fSjohnjiang 	return 0;
2714418919fSjohnjiang }
2724418919fSjohnjiang 
2734418919fSjohnjiang static int
timed_deletes(struct efd_perf_params * params)2744418919fSjohnjiang timed_deletes(struct efd_perf_params *params)
2754418919fSjohnjiang {
2764418919fSjohnjiang 	unsigned int i, a;
2774418919fSjohnjiang 	const uint64_t start_tsc = rte_rdtsc();
2784418919fSjohnjiang 	int32_t ret;
2794418919fSjohnjiang 
2804418919fSjohnjiang 	for (i = 0; i < KEYS_TO_ADD; i++) {
2814418919fSjohnjiang 		ret = rte_efd_delete(params->efd_table, test_socket_id, keys[i],
2824418919fSjohnjiang 				NULL);
2834418919fSjohnjiang 
2844418919fSjohnjiang 		if (ret != 0) {
2854418919fSjohnjiang 			printf("Error %d in rte_efd_delete - key=0x", ret);
2864418919fSjohnjiang 			for (a = 0; a < params->key_size; a++)
2874418919fSjohnjiang 				printf("%02x", keys[i][a]);
2884418919fSjohnjiang 			printf("\n");
2894418919fSjohnjiang 
2904418919fSjohnjiang 			return -1;
2914418919fSjohnjiang 		}
2924418919fSjohnjiang 	}
2934418919fSjohnjiang 
2944418919fSjohnjiang 	const uint64_t end_tsc = rte_rdtsc();
2954418919fSjohnjiang 	const uint64_t time_taken = end_tsc - start_tsc;
2964418919fSjohnjiang 
2974418919fSjohnjiang 	cycles[params->cycle][DELETE] = time_taken / KEYS_TO_ADD;
2984418919fSjohnjiang 
2994418919fSjohnjiang 	return 0;
3004418919fSjohnjiang }
3014418919fSjohnjiang 
3024418919fSjohnjiang static void
perform_frees(struct efd_perf_params * params)3034418919fSjohnjiang perform_frees(struct efd_perf_params *params)
3044418919fSjohnjiang {
3054418919fSjohnjiang 	if (params->efd_table != NULL) {
3064418919fSjohnjiang 		rte_efd_free(params->efd_table);
3074418919fSjohnjiang 		params->efd_table = NULL;
3084418919fSjohnjiang 	}
3094418919fSjohnjiang }
3104418919fSjohnjiang 
3114418919fSjohnjiang static int
exit_with_fail(const char * testname,struct efd_perf_params * params,unsigned int i)3124418919fSjohnjiang exit_with_fail(const char *testname, struct efd_perf_params *params,
3134418919fSjohnjiang 		unsigned int i)
3144418919fSjohnjiang {
3154418919fSjohnjiang 
3164418919fSjohnjiang 	printf("<<<<<Test %s failed at keysize %d iteration %d >>>>>\n",
3174418919fSjohnjiang 			testname, hashtest_key_lens[params->cycle], i);
3184418919fSjohnjiang 	perform_frees(params);
3194418919fSjohnjiang 	return -1;
3204418919fSjohnjiang }
3214418919fSjohnjiang 
3224418919fSjohnjiang static int
run_all_tbl_perf_tests(void)3234418919fSjohnjiang run_all_tbl_perf_tests(void)
3244418919fSjohnjiang {
3254418919fSjohnjiang 	unsigned int i, j;
3264418919fSjohnjiang 	struct efd_perf_params params;
3274418919fSjohnjiang 
3284418919fSjohnjiang 	printf("Measuring performance, please wait\n");
3294418919fSjohnjiang 	fflush(stdout);
3304418919fSjohnjiang 
3314418919fSjohnjiang 	test_socket_id = rte_socket_id();
3324418919fSjohnjiang 
3334418919fSjohnjiang 	for (i = 0; i < NUM_KEYSIZES; i++) {
3344418919fSjohnjiang 
3354418919fSjohnjiang 		if (setup_keys_and_data(&params, i) < 0) {
3364418919fSjohnjiang 			printf("Could not create keys/data/table\n");
3374418919fSjohnjiang 			return -1;
3384418919fSjohnjiang 		}
3394418919fSjohnjiang 
3404418919fSjohnjiang 		if (timed_adds(&params) < 0)
3414418919fSjohnjiang 			return exit_with_fail("timed_adds", &params, i);
3424418919fSjohnjiang 
3434418919fSjohnjiang 		for (j = 0; j < NUM_SHUFFLES; j++)
3444418919fSjohnjiang 			shuffle_input_keys(&params);
3454418919fSjohnjiang 
3464418919fSjohnjiang 		if (timed_lookups(&params) < 0)
3474418919fSjohnjiang 			return exit_with_fail("timed_lookups", &params, i);
3484418919fSjohnjiang 
3494418919fSjohnjiang 		if (timed_lookups_multi(&params) < 0)
3504418919fSjohnjiang 			return exit_with_fail("timed_lookups_multi", &params, i);
3514418919fSjohnjiang 
3524418919fSjohnjiang 		if (timed_deletes(&params) < 0)
3534418919fSjohnjiang 			return exit_with_fail("timed_deletes", &params, i);
3544418919fSjohnjiang 
3554418919fSjohnjiang 		/* Print a dot to show progress on operations */
3564418919fSjohnjiang 		printf(".");
3574418919fSjohnjiang 		fflush(stdout);
3584418919fSjohnjiang 
3594418919fSjohnjiang 		perform_frees(&params);
3604418919fSjohnjiang 	}
3614418919fSjohnjiang 
3624418919fSjohnjiang 	printf("\nResults (in CPU cycles/operation)\n");
3634418919fSjohnjiang 	printf("-----------------------------------\n");
3644418919fSjohnjiang 	printf("\n%-18s%-18s%-18s%-18s%-18s\n",
3654418919fSjohnjiang 			"Keysize", "Add", "Lookup", "Lookup_bulk", "Delete");
3664418919fSjohnjiang 	for (i = 0; i < NUM_KEYSIZES; i++) {
3674418919fSjohnjiang 		printf("%-18d", hashtest_key_lens[i]);
3684418919fSjohnjiang 		for (j = 0; j < NUM_OPERATIONS; j++)
3694418919fSjohnjiang 			printf("%-18"PRIu64, cycles[i][j]);
3704418919fSjohnjiang 		printf("\n");
3714418919fSjohnjiang 	}
3724418919fSjohnjiang 	return 0;
3734418919fSjohnjiang }
3744418919fSjohnjiang 
3754418919fSjohnjiang static int
test_efd_perf(void)3764418919fSjohnjiang test_efd_perf(void)
3774418919fSjohnjiang {
3784418919fSjohnjiang 
3794418919fSjohnjiang 	if (run_all_tbl_perf_tests() < 0)
3804418919fSjohnjiang 		return -1;
3814418919fSjohnjiang 
3824418919fSjohnjiang 	return 0;
3834418919fSjohnjiang }
3844418919fSjohnjiang 
3854418919fSjohnjiang REGISTER_TEST_COMMAND(efd_perf_autotest, test_efd_perf);
386