From mboxrd@z Thu Jan 1 00:00:00 1970 Return-Path: Received: from mails.dpdk.org (mails.dpdk.org [217.70.189.124]) by inbox.dpdk.org (Postfix) with ESMTP id 2CD5BA0C4B; Tue, 2 Nov 2021 19:38:57 +0100 (CET) Received: from [217.70.189.124] (localhost [127.0.0.1]) by mails.dpdk.org (Postfix) with ESMTP id EEE7B41137; Tue, 2 Nov 2021 19:38:39 +0100 (CET) Received: from mga12.intel.com (mga12.intel.com [192.55.52.136]) by mails.dpdk.org (Postfix) with ESMTP id C69CF4111F for ; Tue, 2 Nov 2021 19:38:37 +0100 (CET) X-IronPort-AV: E=McAfee;i="6200,9189,10156"; a="211397038" X-IronPort-AV: E=Sophos;i="5.87,203,1631602800"; d="scan'208";a="211397038" Received: from orsmga007.jf.intel.com ([10.7.209.58]) by fmsmga106.fm.intel.com with ESMTP/TLS/ECDHE-RSA-AES256-GCM-SHA384; 02 Nov 2021 11:38:37 -0700 X-ExtLoop1: 1 X-IronPort-AV: E=Sophos;i="5.87,203,1631602800"; d="scan'208";a="489227713" Received: from silpixa00400072.ir.intel.com ([10.237.222.213]) by orsmga007.jf.intel.com with ESMTP; 02 Nov 2021 11:38:35 -0700 From: Vladimir Medvedkin To: dev@dpdk.org Cc: yipeng1.wang@intel.com, sameh.gobriel@intel.com, bruce.richardson@intel.com, konstantin.ananyev@intel.com, stephen@networkplumber.org, thomas@monjalon.net Date: Tue, 2 Nov 2021 18:38:25 +0000 Message-Id: <1635878305-102888-5-git-send-email-vladimir.medvedkin@intel.com> X-Mailer: git-send-email 2.7.4 In-Reply-To: <1635878305-102888-1-git-send-email-vladimir.medvedkin@intel.com> References: <1635878305-102888-1-git-send-email-vladimir.medvedkin@intel.com> In-Reply-To: <1630944239-363648-1-git-send-email-vladimir.medvedkin@intel.com> References: <1630944239-363648-1-git-send-email-vladimir.medvedkin@intel.com> Subject: [dpdk-dev] [PATCH v8 4/4] test/thash: add performance tests for the Toeplitz hash X-BeenThere: dev@dpdk.org X-Mailman-Version: 2.1.29 Precedence: list List-Id: DPDK patches and discussions List-Unsubscribe: , List-Archive: List-Post: List-Help: List-Subscribe: , Errors-To: dev-bounces@dpdk.org Sender: "dev" 
This patch adds performance tests for the following Toeplitz hash
function implementations:

Scalar:
 - rte_softrss()
 - rte_softrss_be()
Vector using gfni:
 - rte_thash_gfni()
 - rte_thash_gfni_bulk()

Signed-off-by: Vladimir Medvedkin
---
 app/test/meson.build       |   2 +
 app/test/test_thash_perf.c | 199 +++++++++++++++++++++++++++++++++++++++++++++
 2 files changed, 201 insertions(+)
 create mode 100644 app/test/test_thash_perf.c

diff --git a/app/test/meson.build b/app/test/meson.build
index 20f36a1..913e8f6 100644
--- a/app/test/meson.build
+++ b/app/test/meson.build
@@ -144,6 +144,7 @@ test_sources = files(
         'test_table_tables.c',
         'test_tailq.c',
         'test_thash.c',
+        'test_thash_perf.c',
         'test_timer.c',
         'test_timer_perf.c',
         'test_timer_racecond.c',
@@ -322,6 +323,7 @@ perf_test_names = [
         'hash_readwrite_lf_perf_autotest',
         'trace_perf_autotest',
         'ipsec_perf_autotest',
+        'thash_perf_autotest',
 ]
 
 driver_test_names = [
diff --git a/app/test/test_thash_perf.c b/app/test/test_thash_perf.c
new file mode 100644
index 0000000..7aa9360
--- /dev/null
+++ b/app/test/test_thash_perf.c
@@ -0,0 +1,199 @@
+/* SPDX-License-Identifier: BSD-3-Clause
+ * Copyright(c) 2021 Intel Corporation
+ */
+
+#include <stdio.h>
+#include <stdint.h>
+#include <stdlib.h>
+#include <math.h>
+
+#include <rte_cycles.h>
+#include <rte_malloc.h>
+#include <rte_random.h>
+#include <rte_thash.h>
+
+#include "test.h"
+
+#define ITERATIONS	(1 << 15)
+#define BATCH_SZ	(1 << 10)
+
+#define IPV4_2_TUPLE_LEN	(8)
+#define IPV4_4_TUPLE_LEN	(12)
+#define IPV6_2_TUPLE_LEN	(32)
+#define IPV6_4_TUPLE_LEN	(36)
+
+/* RSS key used for every measurement in this file */
+static const uint8_t default_rss_key[] = {
+	0x6d, 0x5a, 0x56, 0xda, 0x25, 0x5b, 0x0e, 0xc2,
+	0x41, 0x67, 0x25, 0x3d, 0x43, 0xa3, 0x8f, 0xb0,
+	0xd0, 0xca, 0x2b, 0xcb, 0xae, 0x7b, 0x30, 0xb4,
+	0x77, 0xcb, 0x2d, 0xa3, 0x80, 0x30, 0xf2, 0x0c,
+	0x6a, 0x42, 0xb7, 0x3b, 0xbe, 0xac, 0x01, 0xfa,
+};
+
+/* Selects the single-tuple hash routine measured by run_rss_calc() */
+enum test_rss_type {
+	TEST_SOFTRSS,
+	TEST_SOFTRSS_BE,
+	TEST_RSS_GFNI
+};
+
+/*
+ * Hash each of the BATCH_SZ tuples ITERATIONS times with the routine chosen
+ * by type and return the number of TSC cycles the whole run took.
+ *
+ * len is the tuple length in bytes; rte_softrss() and rte_softrss_be() are
+ * given it as a count of 32-bit words. key is handed to the hash routine as
+ * is: the caller passes the raw RSS key for the scalar types and the matrices
+ * filled in by rte_thash_complete_matrix() for TEST_RSS_GFNI.
+ */
+static inline uint64_t
+run_rss_calc(uint32_t *tuples[BATCH_SZ], enum test_rss_type type, int len,
+	const void *key)
+{
+	int i, j;
+	uint64_t start_tsc, end_tsc;
+	/* volatile sink so the compiler cannot drop the hash computations */
+	volatile uint32_t hash = 0;
+
+	start_tsc = rte_rdtsc_precise();
+	for (i = 0; i < ITERATIONS; i++) {
+		for (j = 0; j < BATCH_SZ; j++) {
+			if (type == TEST_SOFTRSS)
+				hash ^= rte_softrss(tuples[j], len /
+					sizeof(uint32_t), (const uint8_t *)key);
+			else if (type == TEST_SOFTRSS_BE)
+				hash ^= rte_softrss_be(tuples[j], len /
+					sizeof(uint32_t), (const uint8_t *)key);
+			else
+				hash ^= rte_thash_gfni((const uint64_t *)key,
+					(uint8_t *)tuples[j], len);
+		}
+	}
+	end_tsc = rte_rdtsc_precise();
+
+	return end_tsc - start_tsc;
+}
+
+/*
+ * Run rte_thash_gfni_bulk() over the whole batch ITERATIONS times and return
+ * the number of TSC cycles the run took. len is the tuple length in bytes;
+ * the caller passes the rte_thash_complete_matrix() output as key.
+ */
+static inline uint64_t
+run_rss_calc_bulk(uint32_t *tuples[BATCH_SZ], int len, const void *key)
+{
+	int i;
+	uint64_t start_tsc, end_tsc;
+	uint32_t bulk_hash[BATCH_SZ] = { 0 };
+
+	start_tsc = rte_rdtsc_precise();
+	for (i = 0; i < ITERATIONS; i++)
+		rte_thash_gfni_bulk((const uint64_t *)key, len,
+			(uint8_t **)tuples, bulk_hash, BATCH_SZ);
+
+	end_tsc = rte_rdtsc_precise();
+
+	return end_tsc - start_tsc;
+}
+
+/* Convert the cycles of one full run into the average cost of one hash */
+static inline double
+cycles_per_hash(uint64_t tsc_diff)
+{
+	return (double)tsc_diff / (double)(ITERATIONS * BATCH_SZ);
+}
+
+/* Free the first nb tuple buffers allocated by run_thash_test() */
+static void
+free_tuples(uint32_t *tuples[BATCH_SZ], unsigned int nb)
+{
+	unsigned int i;
+
+	for (i = 0; i < nb; i++)
+		rte_free(tuples[i]);
+}
+
+/*
+ * Fill BATCH_SZ tuples of tuple_len bytes (rounded up to a multiple of 4)
+ * with random data, then measure and print the average cost of each hash
+ * routine on them. The GFNI routines are measured only when
+ * rte_thash_gfni_supported() reports support.
+ *
+ * Returns 0 on success, -1 if a tuple buffer cannot be allocated. Every
+ * tuple buffer is released before returning.
+ */
+static int
+run_thash_test(unsigned int tuple_len)
+{
+	uint32_t *tuples[BATCH_SZ];
+	uint64_t rss_key_matrixes[RTE_DIM(default_rss_key)];
+	unsigned int i, j;
+	uint32_t len = RTE_ALIGN_CEIL(tuple_len, sizeof(uint32_t));
+	uint64_t tsc_diff;
+
+	for (i = 0; i < BATCH_SZ; i++) {
+		tuples[i] = rte_zmalloc(NULL, len, 0);
+		if (tuples[i] == NULL) {
+			printf("Failed to allocate a %u byte tuple\n", len);
+			free_tuples(tuples, i);
+			return -1;
+		}
+		for (j = 0; j < len / sizeof(uint32_t); j++)
+			tuples[i][j] = rte_rand();
+	}
+
+	tsc_diff = run_rss_calc(tuples, TEST_SOFTRSS, len, default_rss_key);
+	printf("Average rte_softrss() takes \t\t%.1f cycles for key len %u\n",
+		cycles_per_hash(tsc_diff), len);
+
+	tsc_diff = run_rss_calc(tuples, TEST_SOFTRSS_BE, len,
+		default_rss_key);
+	printf("Average rte_softrss_be() takes \t\t%.1f cycles for key len %u\n",
+		cycles_per_hash(tsc_diff), len);
+
+	if (!rte_thash_gfni_supported())
+		goto out;
+
+	rte_thash_complete_matrix(rss_key_matrixes, default_rss_key,
+		RTE_DIM(default_rss_key));
+
+	tsc_diff = run_rss_calc(tuples, TEST_RSS_GFNI, len,
+		rss_key_matrixes);
+	printf("Average rte_thash_gfni takes \t\t%.1f cycles for key len %u\n",
+		cycles_per_hash(tsc_diff), len);
+
+	tsc_diff = run_rss_calc_bulk(tuples, len, rss_key_matrixes);
+	printf("Average rte_thash_gfni_bulk takes \t%.1f cycles for key len %u\n",
+		cycles_per_hash(tsc_diff), len);
+
+out:
+	free_tuples(tuples, BATCH_SZ);
+
+	return 0;
+}
+
+/*
+ * Entry point of thash_perf_autotest: run the measurements for each tuple
+ * length. Returns 0 on success, -1 as soon as one run fails.
+ */
+static int
+test_thash_perf(void)
+{
+	static const unsigned int tuple_lens[] = {
+		IPV4_2_TUPLE_LEN,
+		IPV4_4_TUPLE_LEN,
+		IPV6_2_TUPLE_LEN,
+		IPV6_4_TUPLE_LEN,
+	};
+	unsigned int i;
+
+	for (i = 0; i < RTE_DIM(tuple_lens); i++) {
+		if (run_thash_test(tuple_lens[i]) != 0)
+			return -1;
+	}
+
+	return 0;
+}
+
+REGISTER_TEST_COMMAND(thash_perf_autotest, test_thash_perf);
-- 
2.7.4