From mboxrd@z Thu Jan 1 00:00:00 1970 Return-Path: Received: from dpdk.org (dpdk.org [92.243.14.124]) by inbox.dpdk.org (Postfix) with ESMTP id ED5E5A0527; Mon, 20 Jul 2020 18:01:48 +0200 (CEST) Received: from [92.243.14.124] (localhost [127.0.0.1]) by dpdk.org (Postfix) with ESMTP id E746A1BFBC; Mon, 20 Jul 2020 18:01:47 +0200 (CEST) Received: from mga11.intel.com (mga11.intel.com [192.55.52.93]) by dpdk.org (Postfix) with ESMTP id 38B681023 for ; Mon, 20 Jul 2020 18:01:45 +0200 (CEST) IronPort-SDR: XCxDF7sEpjvzRA1g5Q2S13KNqTzO7od7/uMvKRp2694U+PYNhxSr4ytou5QIMPcUBCdyZUXF36 uoSYh0UXPErQ== X-IronPort-AV: E=McAfee;i="6000,8403,9688"; a="147895653" X-IronPort-AV: E=Sophos;i="5.75,375,1589266800"; d="scan'208";a="147895653" X-Amp-Result: SKIPPED(no attachment in message) X-Amp-File-Uploaded: False Received: from orsmga007.jf.intel.com ([10.7.209.58]) by fmsmga102.fm.intel.com with ESMTP/TLS/ECDHE-RSA-AES256-GCM-SHA384; 20 Jul 2020 09:01:44 -0700 IronPort-SDR: 4/poHqaX88qzYrDEFYjDfJDdrNjtoSKQ49CRMo0SxUMc/epqqyLRnl//uMqVJK+Jngh3N52lMm MG8NznEtCZRg== X-ExtLoop1: 1 X-IronPort-AV: E=Sophos;i="5.75,375,1589266800"; d="scan'208";a="327574130" Received: from silpixa00399912.ir.intel.com (HELO silpixa00399912.ger.corp.intel.com) ([10.237.223.64]) by orsmga007.jf.intel.com with ESMTP; 20 Jul 2020 09:01:42 -0700 From: David Coyle To: fiona.trahe@intel.com, akhil.goyal@nxp.com Cc: dev@dpdk.org, brendan.ryan@intel.com, mairtin.oloingsigh@intel.com, declan.doherty@intel.com, pablo.de.lara.guarch@intel.com, David Coyle Date: Mon, 20 Jul 2020 16:37:07 +0100 Message-Id: <20200720153707.18210-1-david.coyle@intel.com> X-Mailer: git-send-email 2.17.1 Subject: [dpdk-dev] [PATCH v1] crypto/qat: add DOCSIS performance optimization X-BeenThere: dev@dpdk.org X-Mailman-Version: 2.1.15 Precedence: list List-Id: DPDK patches and discussions List-Unsubscribe: , List-Archive: List-Post: List-Help: List-Subscribe: , Errors-To: dev-bounces@dpdk.org Sender: "dev" DOCSIS protocol performance in the downlink direction can be improved significantly in the QAT SYM PMD, especially for larger packets, by pre-processing all CRC generations in a batch before building and enqueuing any requests to the HW. This patch adds this optimization. Fixes: 6f0ef237404b ("crypto/qat: support DOCSIS protocol") Signed-off-by: David Coyle --- drivers/common/qat/qat_qp.c | 2 + drivers/crypto/qat/qat_sym.c | 75 ++++++++---------------------------- drivers/crypto/qat/qat_sym.h | 57 +++++++++++++++++++++++++++ 3 files changed, 76 insertions(+), 58 deletions(-) diff --git a/drivers/common/qat/qat_qp.c b/drivers/common/qat/qat_qp.c index aacd4ab21..6fd836fdb 100644 --- a/drivers/common/qat/qat_qp.c +++ b/drivers/common/qat/qat_qp.c @@ -627,6 +627,8 @@ qat_enqueue_op_burst(void *qp, void **ops, uint16_t nb_ops) } } + if (tmp_qp->service_type == QAT_SERVICE_SYMMETRIC) + qat_sym_preprocess_requests(ops, nb_ops_possible); while (nb_ops_sent != nb_ops_possible) { if (tmp_qp->service_type == QAT_SERVICE_SYMMETRIC) { diff --git a/drivers/crypto/qat/qat_sym.c b/drivers/crypto/qat/qat_sym.c index e6bf11523..e3f98a76b 100644 --- a/drivers/crypto/qat/qat_sym.c +++ b/drivers/crypto/qat/qat_sym.c @@ -9,9 +9,6 @@ #include #include #include -#ifdef RTE_LIBRTE_SECURITY -#include -#endif #include "qat_sym.h" @@ -102,29 +99,6 @@ qat_bpicipher_preprocess(struct qat_sym_session *ctx, return sym_op->cipher.data.length - last_block_len; } -#ifdef RTE_LIBRTE_SECURITY -static inline void -qat_crc_generate(struct qat_sym_session *ctx, - struct rte_crypto_op *op) -{ - struct rte_crypto_sym_op *sym_op = op->sym; - uint32_t *crc, crc_data_len; - uint8_t *crc_data; - - if (ctx->qat_dir == ICP_QAT_HW_CIPHER_ENCRYPT && - sym_op->auth.data.length != 0) { - - crc_data_len = sym_op->auth.data.length; - crc_data = rte_pktmbuf_mtod_offset(sym_op->m_src, uint8_t *, - sym_op->auth.data.offset); - crc = (uint32_t *)(crc_data + crc_data_len); - - *crc = rte_net_crc_calc(crc_data, crc_data_len, - RTE_NET_CRC32_ETH); - } -} -#endif - static inline void set_cipher_iv(uint16_t iv_length, uint16_t iv_offset, struct icp_qat_fw_la_cipher_req_params *cipher_param, @@ -187,7 +161,6 @@ qat_sym_build_request(void *in_op, uint8_t *out_msg, uint64_t auth_data_end = 0; uint8_t do_sgl = 0; uint8_t in_place = 1; - uint8_t is_docsis_sec = 0; int alignment_adjustment = 0; struct rte_crypto_op *op = (struct rte_crypto_op *)in_op; struct qat_sym_op_cookie *cookie = @@ -211,13 +184,23 @@ qat_sym_build_request(void *in_op, uint8_t *out_msg, } else { ctx = (struct qat_sym_session *)get_sec_session_private_data( op->sym->sec_session); - if (ctx && ctx->bpi_ctx == NULL) { - QAT_DP_LOG(ERR, "QAT PMD only supports security" - " operation requests for DOCSIS, op" - " (%p) is not for DOCSIS.", op); - return -EINVAL; + if (likely(ctx)) { + if (unlikely(ctx->bpi_ctx == NULL)) { + QAT_DP_LOG(ERR, "QAT PMD only supports security" + " operation requests for" + " DOCSIS, op (%p) is not for" + " DOCSIS.", op); + return -EINVAL; + } else if (unlikely(((op->sym->m_dst != NULL) && + (op->sym->m_dst != op->sym->m_src)) || + op->sym->m_src->nb_segs > 1)) { + QAT_DP_LOG(ERR, "OOP and/or multi-segment" + " buffers not supported for" + " DOCSIS security."); + op->status = RTE_CRYPTO_OP_STATUS_INVALID_ARGS; + return -EINVAL; + } } - is_docsis_sec = 1; #endif } @@ -281,31 +264,7 @@ qat_sym_build_request(void *in_op, uint8_t *out_msg, cipher_ofs = op->sym->cipher.data.offset >> 3; } else if (ctx->bpi_ctx) { - /* DOCSIS processing */ -#ifdef RTE_LIBRTE_SECURITY - if (is_docsis_sec) { - /* Check for OOP or multi-segment buffers */ - if (unlikely(((op->sym->m_dst != NULL) && - (op->sym->m_dst != - op->sym->m_src)) || - op->sym->m_src->nb_segs > 1)) { - QAT_DP_LOG(ERR, - "OOP and/or multi-segment " - "buffers are not supported for " - "DOCSIS security"); - op->status = - RTE_CRYPTO_OP_STATUS_INVALID_ARGS; - return -EINVAL; - } - - /* Calculate CRC */ - qat_crc_generate(ctx, op); - } -#else - RTE_SET_USED(is_docsis_sec); -#endif - - /* Only send complete blocks to device. + /* DOCSIS - only send complete blocks to device. * Process any partial block using CFB mode. * Even if 0 complete blocks, still send this to device * to get into rx queue for post-process and dequeuing diff --git a/drivers/crypto/qat/qat_sym.h b/drivers/crypto/qat/qat_sym.h index 7934dd478..1a9748849 100644 --- a/drivers/crypto/qat/qat_sym.h +++ b/drivers/crypto/qat/qat_sym.h @@ -158,6 +158,57 @@ qat_crc_verify(struct qat_sym_session *ctx, struct rte_crypto_op *op) op->status = RTE_CRYPTO_OP_STATUS_AUTH_FAILED; } } + +static inline void +qat_crc_generate(struct qat_sym_session *ctx, + struct rte_crypto_op *op) +{ + struct rte_crypto_sym_op *sym_op = op->sym; + uint32_t *crc, crc_data_len; + uint8_t *crc_data; + + if (ctx->qat_dir == ICP_QAT_HW_CIPHER_ENCRYPT && + sym_op->auth.data.length != 0 && + sym_op->m_src->nb_segs == 1) { + + crc_data_len = sym_op->auth.data.length; + crc_data = rte_pktmbuf_mtod_offset(sym_op->m_src, uint8_t *, + sym_op->auth.data.offset); + crc = (uint32_t *)(crc_data + crc_data_len); + *crc = rte_net_crc_calc(crc_data, crc_data_len, + RTE_NET_CRC32_ETH); + } +} + +static inline void +qat_sym_preprocess_requests(void **ops, uint16_t nb_ops) +{ + struct rte_crypto_op *op; + struct qat_sym_session *ctx; + uint16_t i; + + for (i = 0; i < nb_ops; i++) { + op = (struct rte_crypto_op *)ops[i]; + + if (op->sess_type == RTE_CRYPTO_OP_SECURITY_SESSION) { + ctx = (struct qat_sym_session *) + get_sec_session_private_data( + op->sym->sec_session); + + if (ctx == NULL || ctx->bpi_ctx == NULL) + continue; + + qat_crc_generate(ctx, op); + } + } +} +#else + +static inline void +qat_sym_preprocess_requests(void **ops __rte_unused, + uint16_t nb_ops __rte_unused) +{ +} #endif static inline void @@ -215,6 +266,12 @@ qat_sym_process_response(void **op, uint8_t *resp) } #else +static inline void +qat_sym_preprocess_requests(void **ops __rte_unused, + uint16_t nb_ops __rte_unused) +{ +} + static inline void qat_sym_process_response(void **op __rte_unused, uint8_t *resp __rte_unused) { -- 2.17.1