* [dpdk-dev] [PATCH v6 1/3] eal: introduce integer divide through reciprocal
@ 2017-09-06 10:21 Pavan Nikhilesh
2017-09-06 10:21 ` [dpdk-dev] [PATCH v6 2/3] eal: add u64 bit variant for reciprocal Pavan Nikhilesh
` (2 more replies)
0 siblings, 3 replies; 11+ messages in thread
From: Pavan Nikhilesh @ 2017-09-06 10:21 UTC (permalink / raw)
To: cristian.dumitrescu, stephen; +Cc: dev, Pavan Bhagavatula
From: Pavan Bhagavatula <pbhagavatula@caviumnetworks.com>
In some use cases of integer division, denominator remains constant and
numerator varies. It is possible to optimize division for such specific
scenarios.
The librte_sched uses rte_reciprocal to optimize division so, moving it to
eal/common would allow other libraries and applications to use it.
Signed-off-by: Pavan Nikhilesh <pbhagavatula@caviumnetworks.com>
Reviewed-by: Anatoly Burakov <anatoly.burakov@intel.com>
---
v6 changes:
- remove cache alignment from rte_reciprocal_u{32/64}structures as they would
be embedded in other structures.
v5 changes:
- fix test print strings
v4 changes:
- minor fix for test cases
- fix u32 divisor generation
v3 changes:
- fix x86_32 compilation issue
- fix improper licence in test
v2 changes:
- fix compilation issues with .map files
- add test cases for correctness and performance
- remove extra licence inclusion
- fix coding style issues
lib/librte_eal/bsdapp/eal/Makefile | 1 +
lib/librte_eal/bsdapp/eal/rte_eal_version.map | 7 +++++++
lib/librte_eal/common/Makefile | 1 +
lib/{librte_sched => librte_eal/common/include}/rte_reciprocal.h | 6 ++++--
lib/{librte_sched => librte_eal/common}/rte_reciprocal.c | 6 ++++--
lib/librte_eal/linuxapp/eal/Makefile | 1 +
lib/librte_eal/linuxapp/eal/rte_eal_version.map | 7 +++++++
lib/librte_sched/Makefile | 2 --
lib/librte_sched/rte_sched.c | 2 +-
9 files changed, 26 insertions(+), 7 deletions(-)
rename lib/{librte_sched => librte_eal/common/include}/rte_reciprocal.h (87%)
rename lib/{librte_sched => librte_eal/common}/rte_reciprocal.c (96%)
diff --git a/lib/librte_eal/bsdapp/eal/Makefile b/lib/librte_eal/bsdapp/eal/Makefile
index 005019e..56f9804 100644
--- a/lib/librte_eal/bsdapp/eal/Makefile
+++ b/lib/librte_eal/bsdapp/eal/Makefile
@@ -88,6 +88,7 @@ SRCS-$(CONFIG_RTE_EXEC_ENV_BSDAPP) += malloc_elem.c
SRCS-$(CONFIG_RTE_EXEC_ENV_BSDAPP) += malloc_heap.c
SRCS-$(CONFIG_RTE_EXEC_ENV_BSDAPP) += rte_keepalive.c
SRCS-$(CONFIG_RTE_EXEC_ENV_BSDAPP) += rte_service.c
+SRCS-$(CONFIG_RTE_EXEC_ENV_BSDAPP) += rte_reciprocal.c
# from arch dir
SRCS-$(CONFIG_RTE_EXEC_ENV_BSDAPP) += rte_cpuflags.c
diff --git a/lib/librte_eal/bsdapp/eal/rte_eal_version.map b/lib/librte_eal/bsdapp/eal/rte_eal_version.map
index aac6fd7..90d7258 100644
--- a/lib/librte_eal/bsdapp/eal/rte_eal_version.map
+++ b/lib/librte_eal/bsdapp/eal/rte_eal_version.map
@@ -237,3 +237,10 @@ EXPERIMENTAL {
rte_service_unregister;
} DPDK_17.08;
+
+DPDK_17.11 {
+ global:
+
+ rte_reciprocal_value;
+
+} DPDK_17.08;
diff --git a/lib/librte_eal/common/Makefile b/lib/librte_eal/common/Makefile
index e8fd67a..a680b2d 100644
--- a/lib/librte_eal/common/Makefile
+++ b/lib/librte_eal/common/Makefile
@@ -42,6 +42,7 @@ INC += rte_hexdump.h rte_devargs.h rte_bus.h rte_dev.h rte_vdev.h
INC += rte_pci_dev_feature_defs.h rte_pci_dev_features.h
INC += rte_malloc.h rte_keepalive.h rte_time.h
INC += rte_service.h rte_service_component.h
+INC += rte_reciprocal.h
GENERIC_INC := rte_atomic.h rte_byteorder.h rte_cycles.h rte_prefetch.h
GENERIC_INC += rte_spinlock.h rte_memcpy.h rte_cpuflags.h rte_rwlock.h
diff --git a/lib/librte_sched/rte_reciprocal.h b/lib/librte_eal/common/include/rte_reciprocal.h
similarity index 87%
rename from lib/librte_sched/rte_reciprocal.h
rename to lib/librte_eal/common/include/rte_reciprocal.h
index 5e21f09..b6d752f 100644
--- a/lib/librte_sched/rte_reciprocal.h
+++ b/lib/librte_eal/common/include/rte_reciprocal.h
@@ -29,13 +29,15 @@ struct rte_reciprocal {
uint8_t sh1, sh2;
};
-static inline uint32_t rte_reciprocal_divide(uint32_t a, struct rte_reciprocal R)
+static inline uint32_t
+rte_reciprocal_divide(uint32_t a, struct rte_reciprocal R)
{
uint32_t t = (uint32_t)(((uint64_t)a * R.m) >> 32);
return (t + ((a - t) >> R.sh1)) >> R.sh2;
}
-struct rte_reciprocal rte_reciprocal_value(uint32_t d);
+struct rte_reciprocal
+rte_reciprocal_value(uint32_t d);
#endif /* _RTE_RECIPROCAL_H_ */
diff --git a/lib/librte_sched/rte_reciprocal.c b/lib/librte_eal/common/rte_reciprocal.c
similarity index 96%
rename from lib/librte_sched/rte_reciprocal.c
rename to lib/librte_eal/common/rte_reciprocal.c
index 652f023..7ab99b4 100644
--- a/lib/librte_sched/rte_reciprocal.c
+++ b/lib/librte_eal/common/rte_reciprocal.c
@@ -41,7 +41,8 @@
/* find largest set bit.
* portable and slow but does not matter for this usage.
*/
-static inline int fls(uint32_t x)
+static inline int
+fls(uint32_t x)
{
int b;
@@ -53,7 +54,8 @@ static inline int fls(uint32_t x)
return 0;
}
-struct rte_reciprocal rte_reciprocal_value(uint32_t d)
+struct rte_reciprocal
+rte_reciprocal_value(uint32_t d)
{
struct rte_reciprocal R;
uint64_t m;
diff --git a/lib/librte_eal/linuxapp/eal/Makefile b/lib/librte_eal/linuxapp/eal/Makefile
index 90bca4d..98f3b8e 100644
--- a/lib/librte_eal/linuxapp/eal/Makefile
+++ b/lib/librte_eal/linuxapp/eal/Makefile
@@ -100,6 +100,7 @@ SRCS-$(CONFIG_RTE_EXEC_ENV_LINUXAPP) += malloc_elem.c
SRCS-$(CONFIG_RTE_EXEC_ENV_LINUXAPP) += malloc_heap.c
SRCS-$(CONFIG_RTE_EXEC_ENV_LINUXAPP) += rte_keepalive.c
SRCS-$(CONFIG_RTE_EXEC_ENV_LINUXAPP) += rte_service.c
+SRCS-$(CONFIG_RTE_EXEC_ENV_LINUXAPP) += rte_reciprocal.c
# from arch dir
SRCS-$(CONFIG_RTE_EXEC_ENV_LINUXAPP) += rte_cpuflags.c
diff --git a/lib/librte_eal/linuxapp/eal/rte_eal_version.map b/lib/librte_eal/linuxapp/eal/rte_eal_version.map
index 3a8f154..2070cba 100644
--- a/lib/librte_eal/linuxapp/eal/rte_eal_version.map
+++ b/lib/librte_eal/linuxapp/eal/rte_eal_version.map
@@ -242,3 +242,10 @@ EXPERIMENTAL {
rte_service_unregister;
} DPDK_17.08;
+
+DPDK_17.11 {
+ global:
+
+ rte_reciprocal_value;
+
+} DPDK_17.08;
diff --git a/lib/librte_sched/Makefile b/lib/librte_sched/Makefile
index 18274e7..569656b 100644
--- a/lib/librte_sched/Makefile
+++ b/lib/librte_sched/Makefile
@@ -52,10 +52,8 @@ LIBABIVER := 1
# all source are stored in SRCS-y
#
SRCS-$(CONFIG_RTE_LIBRTE_SCHED) += rte_sched.c rte_red.c rte_approx.c
-SRCS-$(CONFIG_RTE_LIBRTE_SCHED) += rte_reciprocal.c
# install includes
SYMLINK-$(CONFIG_RTE_LIBRTE_SCHED)-include := rte_sched.h rte_bitmap.h rte_sched_common.h rte_red.h rte_approx.h
-SYMLINK-$(CONFIG_RTE_LIBRTE_SCHED)-include += rte_reciprocal.h
include $(RTE_SDK)/mk/rte.lib.mk
diff --git a/lib/librte_sched/rte_sched.c b/lib/librte_sched/rte_sched.c
index b7cba11..3b8ccaa 100644
--- a/lib/librte_sched/rte_sched.c
+++ b/lib/librte_sched/rte_sched.c
@@ -42,12 +42,12 @@
#include <rte_prefetch.h>
#include <rte_branch_prediction.h>
#include <rte_mbuf.h>
+#include <rte_reciprocal.h>
#include "rte_sched.h"
#include "rte_bitmap.h"
#include "rte_sched_common.h"
#include "rte_approx.h"
-#include "rte_reciprocal.h"
#ifdef __INTEL_COMPILER
#pragma warning(disable:2259) /* conversion may lose significant bits */
--
2.7.4
^ permalink raw reply [flat|nested] 11+ messages in thread
* [dpdk-dev] [PATCH v6 2/3] eal: add u64 bit variant for reciprocal
2017-09-06 10:21 [dpdk-dev] [PATCH v6 1/3] eal: introduce integer divide through reciprocal Pavan Nikhilesh
@ 2017-09-06 10:21 ` Pavan Nikhilesh
2017-09-06 12:28 ` Kevin Traynor
2017-09-20 13:15 ` Dumitrescu, Cristian
2017-09-06 10:21 ` [dpdk-dev] [PATCH v6 3/3] test: add tests for reciprocal based division Pavan Nikhilesh
2017-09-20 13:10 ` [dpdk-dev] [PATCH v6 1/3] eal: introduce integer divide through reciprocal Dumitrescu, Cristian
2 siblings, 2 replies; 11+ messages in thread
From: Pavan Nikhilesh @ 2017-09-06 10:21 UTC (permalink / raw)
To: cristian.dumitrescu, stephen; +Cc: dev, Pavan Bhagavatula
From: Pavan Bhagavatula <pbhagavatula@caviumnetworks.com>
Currently, rte_reciprocal only supports unsigned 32bit divisors. This
commit adds support for unsigned 64bit divisors.
Rename unsigned 32bit specific functions appropriately and update
librte_sched accordingly.
Signed-off-by: Pavan Nikhilesh <pbhagavatula@caviumnetworks.com>
---
lib/librte_eal/bsdapp/eal/rte_eal_version.map | 3 +-
lib/librte_eal/common/include/rte_reciprocal.h | 109 ++++++++++++++++++++--
lib/librte_eal/common/rte_reciprocal.c | 116 +++++++++++++++++++++---
lib/librte_eal/linuxapp/eal/rte_eal_version.map | 3 +-
lib/librte_sched/Makefile | 4 +-
lib/librte_sched/rte_sched.c | 9 +-
6 files changed, 219 insertions(+), 25 deletions(-)
diff --git a/lib/librte_eal/bsdapp/eal/rte_eal_version.map b/lib/librte_eal/bsdapp/eal/rte_eal_version.map
index 90d7258..59a85bb 100644
--- a/lib/librte_eal/bsdapp/eal/rte_eal_version.map
+++ b/lib/librte_eal/bsdapp/eal/rte_eal_version.map
@@ -241,6 +241,7 @@ EXPERIMENTAL {
DPDK_17.11 {
global:
- rte_reciprocal_value;
+ rte_reciprocal_value_u32;
+ rte_reciprocal_value_u64;
} DPDK_17.08;
diff --git a/lib/librte_eal/common/include/rte_reciprocal.h b/lib/librte_eal/common/include/rte_reciprocal.h
index b6d752f..85599e6 100644
--- a/lib/librte_eal/common/include/rte_reciprocal.h
+++ b/lib/librte_eal/common/include/rte_reciprocal.h
@@ -22,22 +22,117 @@
#ifndef _RTE_RECIPROCAL_H_
#define _RTE_RECIPROCAL_H_
-#include <stdint.h>
+#include <rte_memory.h>
-struct rte_reciprocal {
+/**
+ * Unsigned 32-bit divisor structure.
+ */
+struct rte_reciprocal_u32 {
uint32_t m;
uint8_t sh1, sh2;
};
+/**
+ * Unsigned 64-bit divisor structure.
+ */
+struct rte_reciprocal_u64 {
+ uint64_t m;
+ uint8_t sh1;
+};
+
+/**
+ * Divide given unsigned 32-bit integer with pre calculated divisor.
+ *
+ * @param a
+ * The 32-bit dividend.
+ * @param R
+ * The pointer to pre calculated divisor reciprocal structure.
+ *
+ * @return
+ * The result of the division
+ */
static inline uint32_t
-rte_reciprocal_divide(uint32_t a, struct rte_reciprocal R)
+rte_reciprocal_divide_u32(uint32_t a, struct rte_reciprocal_u32 *R)
{
- uint32_t t = (uint32_t)(((uint64_t)a * R.m) >> 32);
+ uint32_t t = (((uint64_t)a * R->m) >> 32);
- return (t + ((a - t) >> R.sh1)) >> R.sh2;
+ return (t + ((a - t) >> R->sh1)) >> R->sh2;
}
-struct rte_reciprocal
-rte_reciprocal_value(uint32_t d);
+static inline uint64_t
+mullhi_u64(uint64_t x, uint64_t y)
+{
+#ifdef __SIZEOF_INT128__
+ __uint128_t xl = x;
+ __uint128_t rl = xl * y;
+
+ return (rl >> 64);
+#else
+ uint64_t u0, u1, v0, v1, k, t;
+ uint64_t w1, w2;
+ uint64_t whi;
+
+ u1 = x >> 32; u0 = x & 0xFFFFFFFF;
+ v1 = y >> 32; v0 = y & 0xFFFFFFFF;
+
+ t = u0*v0;
+ k = t >> 32;
+
+ t = u1*v0 + k;
+ w1 = t & 0xFFFFFFFF;
+ w2 = t >> 32;
+
+ t = u0*v1 + w1;
+ k = t >> 32;
+
+ whi = u1*v1 + w2 + k;
+
+ return whi;
+#endif
+}
+
+/**
+ * Divide given unsigned 64-bit integer with pre calculated divisor.
+ *
+ * @param a
+ * The 64-bit dividend.
+ * @param R
+ * The pointer to pre calculated divisor reciprocal structure.
+ *
+ * @return
+ * The result of the division
+ */
+static inline uint64_t
+rte_reciprocal_divide_u64(uint64_t a, struct rte_reciprocal_u64 *R)
+{
+ uint64_t q = mullhi_u64(R->m, a);
+ uint64_t t = ((a - q) >> 1) + q;
+
+ return t >> R->sh1;
+}
+
+/**
+ * Generate pre calculated divisor structure.
+ *
+ * @param d
+ * The unsigned 32-bit divisor.
+ *
+ * @return
+ * Divisor structure.
+ */
+struct rte_reciprocal_u32
+rte_reciprocal_value_u32(uint32_t d);
+
+/**
+ * Generate pre calculated divisor structure.
+ *
+ * @param d
+ * The unsigned 64-bit divisor.
+ *
+ * @return
+ * Divisor structure.
+ */
+struct rte_reciprocal_u64
+rte_reciprocal_value_u64(uint64_t d);
#endif /* _RTE_RECIPROCAL_H_ */
diff --git a/lib/librte_eal/common/rte_reciprocal.c b/lib/librte_eal/common/rte_reciprocal.c
index 7ab99b4..2024e62 100644
--- a/lib/librte_eal/common/rte_reciprocal.c
+++ b/lib/librte_eal/common/rte_reciprocal.c
@@ -31,18 +31,13 @@
* OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*/
-#include <stdio.h>
-#include <stdint.h>
-
-#include <rte_common.h>
-
-#include "rte_reciprocal.h"
+#include <rte_reciprocal.h>
/* find largest set bit.
* portable and slow but does not matter for this usage.
*/
static inline int
-fls(uint32_t x)
+fls_u32(uint32_t x)
{
int b;
@@ -54,14 +49,14 @@ fls(uint32_t x)
return 0;
}
-struct rte_reciprocal
-rte_reciprocal_value(uint32_t d)
+struct rte_reciprocal_u32
+rte_reciprocal_value_u32(uint32_t d)
{
- struct rte_reciprocal R;
+ struct rte_reciprocal_u32 R;
uint64_t m;
int l;
- l = fls(d - 1);
+ l = fls_u32(d - 1);
m = ((1ULL << 32) * ((1ULL << l) - d));
m /= d;
@@ -72,3 +67,102 @@ rte_reciprocal_value(uint32_t d)
return R;
}
+
+/* Code taken from Hacker's Delight:
+ * http://www.hackersdelight.org/HDcode/divlu.c.
+ * License permits inclusion here per:
+ * http://www.hackersdelight.org/permissions.htm
+ */
+static inline uint64_t
+divide_128_div_64_to_64(uint64_t u1, uint64_t u0, uint64_t v, uint64_t *r)
+{
+ const uint64_t b = (1ULL << 32); /* Number base (16 bits). */
+ uint64_t un1, un0, /* Norm. dividend LSD's. */
+ vn1, vn0, /* Norm. divisor digits. */
+ q1, q0, /* Quotient digits. */
+ un64, un21, un10, /* Dividend digit pairs. */
+ rhat; /* A remainder. */
+ int s; /* Shift amount for norm. */
+
+ /* If overflow, set rem. to an impossible value. */
+ if (u1 >= v) {
+ if (r != NULL)
+ *r = (uint64_t) -1;
+ return (uint64_t) -1;
+ }
+
+ /* Count leading zeros. */
+ s = __builtin_clzll(v);
+ if (s > 0) {
+ v = v << s;
+ un64 = (u1 << s) | ((u0 >> (64 - s)) & (-s >> 31));
+ un10 = u0 << s;
+ } else {
+
+ un64 = u1 | u0;
+ un10 = u0;
+ }
+
+ vn1 = v >> 32;
+ vn0 = v & 0xFFFFFFFF;
+
+ un1 = un10 >> 32;
+ un0 = un10 & 0xFFFFFFFF;
+
+ q1 = un64/vn1;
+ rhat = un64 - q1*vn1;
+again1:
+ if (q1 >= b || q1*vn0 > b*rhat + un1) {
+ q1 = q1 - 1;
+ rhat = rhat + vn1;
+ if (rhat < b)
+ goto again1;
+ }
+
+ un21 = un64*b + un1 - q1*v;
+
+ q0 = un21/vn1;
+ rhat = un21 - q0*vn1;
+again2:
+ if (q0 >= b || q0*vn0 > b*rhat + un0) {
+ q0 = q0 - 1;
+ rhat = rhat + vn1;
+ if (rhat < b)
+ goto again2;
+ }
+
+ if (r != NULL)
+ *r = (un21*b + un0 - q0*v) >> s;
+ return q1*b + q0;
+}
+
+struct rte_reciprocal_u64
+rte_reciprocal_value_u64(uint64_t d)
+{
+ struct rte_reciprocal_u64 R;
+
+ const uint32_t fld = 63 - __builtin_clzll(d);
+
+ if ((d & (d - 1)) == 0) {
+ R.m = 0;
+ R.sh1 = (fld - 1) | 0x40;
+ } else {
+ uint64_t rem;
+ uint64_t multiplier;
+ uint8_t more;
+
+ multiplier = divide_128_div_64_to_64(1ULL << fld, 0, d, &rem);
+ multiplier += multiplier;
+
+ const uint64_t twice_rem = rem + rem;
+ if (twice_rem >= d || twice_rem < rem)
+ multiplier += 1;
+ more = fld;
+ R.m = 1 + multiplier;
+ R.sh1 = more | 0x40;
+ }
+
+ R.sh1 &= 0x3F;
+
+ return R;
+}
diff --git a/lib/librte_eal/linuxapp/eal/rte_eal_version.map b/lib/librte_eal/linuxapp/eal/rte_eal_version.map
index 2070cba..2671627 100644
--- a/lib/librte_eal/linuxapp/eal/rte_eal_version.map
+++ b/lib/librte_eal/linuxapp/eal/rte_eal_version.map
@@ -246,6 +246,7 @@ EXPERIMENTAL {
DPDK_17.11 {
global:
- rte_reciprocal_value;
+ rte_reciprocal_value_u32;
+ rte_reciprocal_value_u64;
} DPDK_17.08;
diff --git a/lib/librte_sched/Makefile b/lib/librte_sched/Makefile
index 569656b..a2fd6f3 100644
--- a/lib/librte_sched/Makefile
+++ b/lib/librte_sched/Makefile
@@ -54,6 +54,8 @@ LIBABIVER := 1
SRCS-$(CONFIG_RTE_LIBRTE_SCHED) += rte_sched.c rte_red.c rte_approx.c
# install includes
-SYMLINK-$(CONFIG_RTE_LIBRTE_SCHED)-include := rte_sched.h rte_bitmap.h rte_sched_common.h rte_red.h rte_approx.h
+SYMLINK-$(CONFIG_RTE_LIBRTE_SCHED)-include := rte_sched.h rte_bitmap.h
+SYMLINK-$(CONFIG_RTE_LIBRTE_SCHED)-include += rte_sched_common.h rte_red.h
+SYMLINK-$(CONFIG_RTE_LIBRTE_SCHED)-include += rte_approx.h
include $(RTE_SDK)/mk/rte.lib.mk
diff --git a/lib/librte_sched/rte_sched.c b/lib/librte_sched/rte_sched.c
index 3b8ccaa..7bb6d51 100644
--- a/lib/librte_sched/rte_sched.c
+++ b/lib/librte_sched/rte_sched.c
@@ -228,7 +228,7 @@ struct rte_sched_port {
uint64_t time_cpu_cycles; /* Current CPU time measured in CPU cyles */
uint64_t time_cpu_bytes; /* Current CPU time measured in bytes */
uint64_t time; /* Current NIC TX time measured in bytes */
- struct rte_reciprocal inv_cycles_per_byte; /* CPU cycles per byte */
+ struct rte_reciprocal_u32 inv_cycles_per_byte; /* CPU cycles per byte */
/* Scheduling loop detection */
uint32_t pipe_loop;
@@ -677,7 +677,7 @@ rte_sched_port_config(struct rte_sched_port_params *params)
cycles_per_byte = (rte_get_tsc_hz() << RTE_SCHED_TIME_SHIFT)
/ params->rate;
- port->inv_cycles_per_byte = rte_reciprocal_value(cycles_per_byte);
+ port->inv_cycles_per_byte = rte_reciprocal_value_u32(cycles_per_byte);
/* Scheduling loop detection */
port->pipe_loop = RTE_SCHED_PIPE_INVALID;
@@ -2147,8 +2147,9 @@ rte_sched_port_time_resync(struct rte_sched_port *port)
uint64_t bytes_diff;
/* Compute elapsed time in bytes */
- bytes_diff = rte_reciprocal_divide(cycles_diff << RTE_SCHED_TIME_SHIFT,
- port->inv_cycles_per_byte);
+ bytes_diff = rte_reciprocal_divide_u32(
+ cycles_diff << RTE_SCHED_TIME_SHIFT,
+ &port->inv_cycles_per_byte);
/* Advance port time */
port->time_cpu_cycles = cycles;
--
2.7.4
^ permalink raw reply [flat|nested] 11+ messages in thread
* [dpdk-dev] [PATCH v6 3/3] test: add tests for reciprocal based division
2017-09-06 10:21 [dpdk-dev] [PATCH v6 1/3] eal: introduce integer divide through reciprocal Pavan Nikhilesh
2017-09-06 10:21 ` [dpdk-dev] [PATCH v6 2/3] eal: add u64 bit variant for reciprocal Pavan Nikhilesh
@ 2017-09-06 10:21 ` Pavan Nikhilesh
2017-09-20 13:10 ` [dpdk-dev] [PATCH v6 1/3] eal: introduce integer divide through reciprocal Dumitrescu, Cristian
2 siblings, 0 replies; 11+ messages in thread
From: Pavan Nikhilesh @ 2017-09-06 10:21 UTC (permalink / raw)
To: cristian.dumitrescu, stephen; +Cc: dev, Pavan Bhagavatula
From: Pavan Bhagavatula <pbhagavatula@caviumnetworks.com>
This commit provides a set of tests for verifying the correctness and
performance of both unsigned 32 and 64bit reciprocal based division.
Signed-off-by: Pavan Nikhilesh <pbhagavatula@caviumnetworks.com>
---
test/test/Makefile | 2 +
test/test/test_reciprocal_division.c | 109 +++++++++++++++++
test/test/test_reciprocal_division_perf.c | 193 ++++++++++++++++++++++++++++++
3 files changed, 304 insertions(+)
create mode 100644 test/test/test_reciprocal_division.c
create mode 100644 test/test/test_reciprocal_division_perf.c
diff --git a/test/test/Makefile b/test/test/Makefile
index 42d9a49..6017862 100644
--- a/test/test/Makefile
+++ b/test/test/Makefile
@@ -94,6 +94,8 @@ SRCS-y += test_cycles.c
SRCS-y += test_spinlock.c
SRCS-y += test_memory.c
SRCS-y += test_memzone.c
+SRCS-y += test_reciprocal_division.c
+SRCS-y += test_reciprocal_division_perf.c
SRCS-y += test_ring.c
SRCS-y += test_ring_perf.c
diff --git a/test/test/test_reciprocal_division.c b/test/test/test_reciprocal_division.c
new file mode 100644
index 0000000..771ea64
--- /dev/null
+++ b/test/test/test_reciprocal_division.c
@@ -0,0 +1,109 @@
+/*
+ * BSD LICENSE
+ *
+ * Copyright (C) Cavium, Inc. 2017.
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ *
+ * * Redistributions of source code must retain the above copyright
+ * notice, this list of conditions and the following disclaimer.
+ * * Redistributions in binary form must reproduce the above copyright
+ * notice, this list of conditions and the following disclaimer in
+ * the documentation and/or other materials provided with the
+ * distribution.
+ * * Neither the name of Cavium, Inc nor the names of its
+ * contributors may be used to endorse or promote products derived
+ * from this software without specific prior written permission.
+ *
+ * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
+ * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
+ * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
+ * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
+ * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
+ * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
+ * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
+ * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
+ * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+ * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
+ * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+ */
+
+#include "test.h"
+
+#include <stdio.h>
+#include <unistd.h>
+#include <inttypes.h>
+
+#include <rte_common.h>
+#include <rte_cycles.h>
+#include <rte_random.h>
+#include <rte_reciprocal.h>
+
+#define MAX_ITERATIONS 1000000
+#define DIVIDE_ITER 100
+
+static int
+test_reciprocal_division(void)
+{
+ int i;
+ int result = 0;
+ uint32_t divisor_u32 = 0;
+ uint32_t dividend_u32;
+ uint32_t nresult_u32;
+ uint32_t rresult_u32;
+ uint64_t divisor_u64 = 0;
+ uint64_t dividend_u64;
+ uint64_t nresult_u64;
+ uint64_t rresult_u64;
+ struct rte_reciprocal_u32 reci_u32;
+ struct rte_reciprocal_u64 reci_u64;
+
+ rte_srand(rte_rdtsc());
+ printf("Validating unsigned 32bit division.\n");
+ for (i = 0; i < MAX_ITERATIONS; i++) {
+ /* Change divisor every DIVIDE_ITER iterations. */
+ if (i % DIVIDE_ITER == 0) {
+ divisor_u32 = rte_rand();
+ reci_u32 = rte_reciprocal_value_u32(divisor_u32);
+ }
+
+ dividend_u32 = rte_rand();
+ nresult_u32 = dividend_u32 / divisor_u32;
+ rresult_u32 = rte_reciprocal_divide_u32(dividend_u32,
+ &reci_u32);
+ if (nresult_u32 != rresult_u32) {
+ printf("Division failed, expected %"PRIu32" "
+ "result %"PRIu32"",
+ nresult_u32, rresult_u32);
+ result = 1;
+ break;
+ }
+ }
+
+ printf("Validating unsigned 64bit division.\n");
+ for (i = 0; i < MAX_ITERATIONS; i++) {
+ /* Change divisor every DIVIDE_ITER iterations. */
+ if (i % DIVIDE_ITER == 0) {
+ divisor_u64 = rte_rand();
+ reci_u64 = rte_reciprocal_value_u64(divisor_u64);
+ }
+
+ dividend_u64 = rte_rand();
+ nresult_u64 = dividend_u64 / divisor_u64;
+ rresult_u64 = rte_reciprocal_divide_u64(dividend_u64,
+ &reci_u64);
+ if (nresult_u64 != rresult_u64) {
+ printf("Division failed, expected %"PRIu64" "
+ "result %"PRIu64"",
+ nresult_u64, rresult_u64);
+ result = 1;
+ break;
+ }
+ }
+
+ return result;
+}
+
+REGISTER_TEST_COMMAND(reciprocal_division, test_reciprocal_division);
diff --git a/test/test/test_reciprocal_division_perf.c b/test/test/test_reciprocal_division_perf.c
new file mode 100644
index 0000000..3eaf575
--- /dev/null
+++ b/test/test/test_reciprocal_division_perf.c
@@ -0,0 +1,193 @@
+/*
+ * BSD LICENSE
+ *
+ * Copyright (C) Cavium, Inc. 2017.
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ *
+ * * Redistributions of source code must retain the above copyright
+ * notice, this list of conditions and the following disclaimer.
+ * * Redistributions in binary form must reproduce the above copyright
+ * notice, this list of conditions and the following disclaimer in
+ * the documentation and/or other materials provided with the
+ * distribution.
+ * * Neither the name of Cavium, Inc nor the names of its
+ * contributors may be used to endorse or promote products derived
+ * from this software without specific prior written permission.
+ *
+ * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
+ * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
+ * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
+ * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
+ * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
+ * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
+ * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
+ * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
+ * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+ * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
+ * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+ */
+
+#include "test.h"
+
+#include <stdio.h>
+#include <unistd.h>
+#include <inttypes.h>
+
+#include <rte_common.h>
+#include <rte_cycles.h>
+#include <rte_random.h>
+#include <rte_reciprocal.h>
+
+#define MAX_ITERATIONS 1000000
+#define DIVIDE_ITER 100
+
+static int
+test_reciprocal_division_perf(void)
+{
+ int result = 0;
+ uint32_t divisor_u32 = 0;
+ volatile uint32_t dividend_u32;
+ uint32_t nresult_u32;
+ uint32_t rresult_u32;
+ uint64_t divisor_u64 = 0;
+ volatile uint64_t dividend_u64;
+ uint64_t nresult_u64;
+ uint64_t rresult_u64;
+ uint64_t start_cyc;
+ uint64_t split_cyc;
+ uint64_t end_cyc;
+ uint64_t tot_cyc_n = 0;
+ uint64_t tot_cyc_r = 0;
+ uint64_t i;
+ struct rte_reciprocal_u32 reci_u32 = {0};
+ struct rte_reciprocal_u64 reci_u64 = {0};
+
+ rte_srand(rte_rdtsc());
+
+ printf("Validating unsigned 32bit division.\n");
+
+ for (i = 0; i < MAX_ITERATIONS; i++) {
+ /* Change divisor every DIVIDE_ITER iterations. */
+ if (i % DIVIDE_ITER == 0) {
+ divisor_u32 = rte_rand();
+ reci_u32 = rte_reciprocal_value_u32(divisor_u32);
+ }
+
+ dividend_u32 = rte_rand();
+
+ start_cyc = rte_rdtsc();
+ nresult_u32 = dividend_u32 / divisor_u32;
+ split_cyc = rte_rdtsc();
+ rresult_u32 = rte_reciprocal_divide_u32(dividend_u32,
+ &reci_u32);
+ end_cyc = rte_rdtsc();
+
+ tot_cyc_n += split_cyc - start_cyc;
+ tot_cyc_r += end_cyc - split_cyc;
+ if (nresult_u32 != rresult_u32) {
+ printf("Division failed, expected %"PRIu32" "
+ "result %"PRIu32"",
+ nresult_u32, rresult_u32);
+ result = 1;
+ break;
+ }
+ }
+ printf("32bit Division results:\n");
+ printf("Total number of cycles normal division : %"PRIu64"\n",
+ tot_cyc_n);
+ printf("Total number of cycles reciprocal division : %"PRIu64"\n",
+ tot_cyc_r);
+ printf("Cycles per division(normal) : %3.2f\n",
+ ((double)tot_cyc_n)/i);
+ printf("Cycles per division(reciprocal) : %3.2f\n\n",
+ ((double)tot_cyc_r)/i);
+
+ tot_cyc_n = 0;
+ tot_cyc_r = 0;
+
+ printf("Validating unsigned 64bit division.\n");
+
+ for (i = 0; i < MAX_ITERATIONS; i++) {
+ /* Change divisor every DIVIDE_ITER iterations. */
+ if (i % DIVIDE_ITER == 0) {
+ divisor_u64 = rte_rand();
+ reci_u64 = rte_reciprocal_value_u64(divisor_u64);
+ }
+
+ dividend_u64 = rte_rand();
+
+ start_cyc = rte_rdtsc();
+ nresult_u64 = dividend_u64 / divisor_u64;
+ split_cyc = rte_rdtsc();
+ rresult_u64 = rte_reciprocal_divide_u64(dividend_u64,
+ &reci_u64);
+ end_cyc = rte_rdtsc();
+
+ tot_cyc_n += split_cyc - start_cyc;
+ tot_cyc_r += end_cyc - split_cyc;
+ if (nresult_u64 != rresult_u64) {
+ printf("Division failed, expected %"PRIu64" "
+ "result %"PRIu64"",
+ nresult_u64, rresult_u64);
+ result = 1;
+ break;
+ }
+ }
+ printf("64bit Division results:\n");
+ printf("Total number of cycles normal division : %"PRIu64"\n",
+ tot_cyc_n);
+ printf("Total number of cycles reciprocal division : %"PRIu64"\n",
+ tot_cyc_r);
+ printf("Cycles per division(normal) : %3.2f\n",
+ ((double)tot_cyc_n)/i);
+ printf("Cycles per division(reciprocal) : %3.2f\n\n",
+ ((double)tot_cyc_r)/i);
+
+ tot_cyc_n = 0;
+ tot_cyc_r = 0;
+
+ printf("Validating unsigned 64bit division with 32bit divisor.\n");
+
+ for (i = 0; i < MAX_ITERATIONS; i++) {
+ /* Change divisor every DIVIDE_ITER iterations. */
+ if (i % DIVIDE_ITER == 0) {
+ divisor_u64 = rte_rand() >> 32;
+ reci_u64 = rte_reciprocal_value_u64(divisor_u64);
+ }
+
+ dividend_u64 = rte_rand();
+
+ start_cyc = rte_rdtsc();
+ nresult_u64 = dividend_u64 / divisor_u64;
+ split_cyc = rte_rdtsc();
+ rresult_u64 = rte_reciprocal_divide_u64(dividend_u64,
+ &reci_u64);
+ end_cyc = rte_rdtsc();
+
+ tot_cyc_n += split_cyc - start_cyc;
+ tot_cyc_r += end_cyc - split_cyc;
+ if (nresult_u64 != rresult_u64) {
+ printf("Division failed, expected %"PRIu64" "
+ "result %"PRIu64"",
+ nresult_u64, rresult_u64);
+ result = 1;
+ break;
+ }
+ }
+ printf("64bit Division results:\n");
+ printf("Total number of cycles normal division : %"PRIu64"\n",
+ tot_cyc_n);
+ printf("Total number of cycles reciprocal division : %"PRIu64"\n",
+ tot_cyc_r);
+ printf("Cycles per division(normal) : %3.2f\n",
+ ((double)tot_cyc_n)/i);
+ printf("Cycles per division(reciprocal) : %3.2f\n",
+ ((double)tot_cyc_r)/i);
+
+ return result;
+}
+
+REGISTER_TEST_COMMAND(reciprocal_division_perf, test_reciprocal_division_perf);
--
2.7.4
^ permalink raw reply [flat|nested] 11+ messages in thread
* Re: [dpdk-dev] [PATCH v6 2/3] eal: add u64 bit variant for reciprocal
2017-09-06 10:21 ` [dpdk-dev] [PATCH v6 2/3] eal: add u64 bit variant for reciprocal Pavan Nikhilesh
@ 2017-09-06 12:28 ` Kevin Traynor
2017-09-06 14:41 ` Pavan Nikhilesh Bhagavatula
2017-09-20 13:15 ` Dumitrescu, Cristian
1 sibling, 1 reply; 11+ messages in thread
From: Kevin Traynor @ 2017-09-06 12:28 UTC (permalink / raw)
To: Pavan Nikhilesh, cristian.dumitrescu, stephen; +Cc: dev
On 09/06/2017 11:21 AM, Pavan Nikhilesh wrote:
> From: Pavan Bhagavatula <pbhagavatula@caviumnetworks.com>
>
> Currently, rte_reciprocal only supports unsigned 32bit divisors. This
> commit adds support for unsigned 64bit divisors.
>
> Rename unsigned 32bit specific functions appropriately and update
> librte_sched accordingly.
>
> Signed-off-by: Pavan Nikhilesh <pbhagavatula@caviumnetworks.com>
> ---
> lib/librte_eal/bsdapp/eal/rte_eal_version.map | 3 +-
> lib/librte_eal/common/include/rte_reciprocal.h | 109 ++++++++++++++++++++--
> lib/librte_eal/common/rte_reciprocal.c | 116 +++++++++++++++++++++---
> lib/librte_eal/linuxapp/eal/rte_eal_version.map | 3 +-
> lib/librte_sched/Makefile | 4 +-
> lib/librte_sched/rte_sched.c | 9 +-
> 6 files changed, 219 insertions(+), 25 deletions(-)
>
> diff --git a/lib/librte_eal/bsdapp/eal/rte_eal_version.map b/lib/librte_eal/bsdapp/eal/rte_eal_version.map
> index 90d7258..59a85bb 100644
> --- a/lib/librte_eal/bsdapp/eal/rte_eal_version.map
> +++ b/lib/librte_eal/bsdapp/eal/rte_eal_version.map
> @@ -241,6 +241,7 @@ EXPERIMENTAL {
> DPDK_17.11 {
> global:
>
> - rte_reciprocal_value;
> + rte_reciprocal_value_u32;
> + rte_reciprocal_value_u64;
>
> } DPDK_17.08;
> diff --git a/lib/librte_eal/common/include/rte_reciprocal.h b/lib/librte_eal/common/include/rte_reciprocal.h
> index b6d752f..85599e6 100644
> --- a/lib/librte_eal/common/include/rte_reciprocal.h
> +++ b/lib/librte_eal/common/include/rte_reciprocal.h
Hi Pavan, sorry for commenting late but the license in v1 of this file
states it cannot be removed. It is not included in later versions - can
you explain why?
+/*
+ * libdivide
+ * Copyright (C) 2010 ridiculous_fish
+ * This software is provided 'as-is', without any express or implied
+ * warranty. In no event will the authors be held liable for any damages
+ * arising from the use of this software.
+ * Permission is granted to anyone to use this software for any purpose,
+ * including commercial applications, and to alter it and redistribute it
+ * freely, subject to the following restrictions:
+ *
+ * 1. The origin of this software must not be misrepresented; you must not
+ * claim that you wrote the original software. If you use this software
+ * in a product, an acknowledgment in the product documentation would be
+ * appreciated but is not required.
+ *
+ * 2. Altered source versions must be plainly marked as such, and must
not be
+ * misrepresented as being the original software.
+ *
+ * 3. This notice may not be removed or altered from any source
distribution.
+ *
+ * libdivide@ridiculousfish.com
+ *
+ */
+
> @@ -22,22 +22,117 @@
> #ifndef _RTE_RECIPROCAL_H_
> #define _RTE_RECIPROCAL_H_
>
> -#include <stdint.h>
> +#include <rte_memory.h>
>
> -struct rte_reciprocal {
> +/**
> + * Unsigned 32-bit divisor structure.
> + */
> +struct rte_reciprocal_u32 {
> uint32_t m;
> uint8_t sh1, sh2;
> };
>
> +/**
> + * Unsigned 64-bit divisor structure.
> + */
> +struct rte_reciprocal_u64 {
> + uint64_t m;
> + uint8_t sh1;
> +};
> +
> +/**
> + * Divide given unsigned 32-bit integer with pre calculated divisor.
> + *
> + * @param a
> + * The 32-bit dividend.
> + * @param R
> + * The pointer to pre calculated divisor reciprocal structure.
> + *
> + * @return
> + * The result of the division
> + */
> static inline uint32_t
> -rte_reciprocal_divide(uint32_t a, struct rte_reciprocal R)
> +rte_reciprocal_divide_u32(uint32_t a, struct rte_reciprocal_u32 *R)
> {
> - uint32_t t = (uint32_t)(((uint64_t)a * R.m) >> 32);
> + uint32_t t = (((uint64_t)a * R->m) >> 32);
>
> - return (t + ((a - t) >> R.sh1)) >> R.sh2;
> + return (t + ((a - t) >> R->sh1)) >> R->sh2;
> }
>
> -struct rte_reciprocal
> -rte_reciprocal_value(uint32_t d);
> +static inline uint64_t
> +mullhi_u64(uint64_t x, uint64_t y)
> +{
> +#ifdef __SIZEOF_INT128__
> + __uint128_t xl = x;
> + __uint128_t rl = xl * y;
> +
> + return (rl >> 64);
> +#else
> + uint64_t u0, u1, v0, v1, k, t;
> + uint64_t w1, w2;
> + uint64_t whi;
> +
> + u1 = x >> 32; u0 = x & 0xFFFFFFFF;
> + v1 = y >> 32; v0 = y & 0xFFFFFFFF;
> +
> + t = u0*v0;
> + k = t >> 32;
> +
> + t = u1*v0 + k;
> + w1 = t & 0xFFFFFFFF;
> + w2 = t >> 32;
> +
> + t = u0*v1 + w1;
> + k = t >> 32;
> +
> + whi = u1*v1 + w2 + k;
> +
> + return whi;
> +#endif
> +}
> +
> +/**
> + * Divide given unsigned 64-bit integer with pre calculated divisor.
> + *
> + * @param a
> + * The 64-bit dividend.
> + * @param R
> + * The pointer to pre calculated divisor reciprocal structure.
> + *
> + * @return
> + * The result of the division
> + */
> +static inline uint64_t
> +rte_reciprocal_divide_u64(uint64_t a, struct rte_reciprocal_u64 *R)
> +{
> + uint64_t q = mullhi_u64(R->m, a);
> + uint64_t t = ((a - q) >> 1) + q;
> +
> + return t >> R->sh1;
> +}
> +
> +/**
> + * Generate pre calculated divisor structure.
> + *
> + * @param d
> + * The unsigned 32-bit divisor.
> + *
> + * @return
> + * Divisor structure.
> + */
> +struct rte_reciprocal_u32
> +rte_reciprocal_value_u32(uint32_t d);
> +
> +/**
> + * Generate pre calculated divisor structure.
> + *
> + * @param d
> + * The unsigned 64-bit divisor.
> + *
> + * @return
> + * Divisor structure.
> + */
> +struct rte_reciprocal_u64
> +rte_reciprocal_value_u64(uint64_t d);
>
> #endif /* _RTE_RECIPROCAL_H_ */
> diff --git a/lib/librte_eal/common/rte_reciprocal.c b/lib/librte_eal/common/rte_reciprocal.c
> index 7ab99b4..2024e62 100644
> --- a/lib/librte_eal/common/rte_reciprocal.c
> +++ b/lib/librte_eal/common/rte_reciprocal.c
> @@ -31,18 +31,13 @@
> * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
> */
>
> -#include <stdio.h>
> -#include <stdint.h>
> -
> -#include <rte_common.h>
> -
> -#include "rte_reciprocal.h"
> +#include <rte_reciprocal.h>
>
> /* find largest set bit.
> * portable and slow but does not matter for this usage.
> */
> static inline int
> -fls(uint32_t x)
> +fls_u32(uint32_t x)
> {
> int b;
>
> @@ -54,14 +49,14 @@ fls(uint32_t x)
> return 0;
> }
>
> -struct rte_reciprocal
> -rte_reciprocal_value(uint32_t d)
> +struct rte_reciprocal_u32
> +rte_reciprocal_value_u32(uint32_t d)
> {
> - struct rte_reciprocal R;
> + struct rte_reciprocal_u32 R;
> uint64_t m;
> int l;
>
> - l = fls(d - 1);
> + l = fls_u32(d - 1);
> m = ((1ULL << 32) * ((1ULL << l) - d));
> m /= d;
>
> @@ -72,3 +67,102 @@ rte_reciprocal_value(uint32_t d)
>
> return R;
> }
> +
> +/* Code taken from Hacker's Delight:
> + * http://www.hackersdelight.org/HDcode/divlu.c.
> + * License permits inclusion here per:
> + * http://www.hackersdelight.org/permissions.htm
> + */
> +static inline uint64_t
> +divide_128_div_64_to_64(uint64_t u1, uint64_t u0, uint64_t v, uint64_t *r)
> +{
> + const uint64_t b = (1ULL << 32); /* Number base (16 bits). */
> + uint64_t un1, un0, /* Norm. dividend LSD's. */
> + vn1, vn0, /* Norm. divisor digits. */
> + q1, q0, /* Quotient digits. */
> + un64, un21, un10, /* Dividend digit pairs. */
> + rhat; /* A remainder. */
> + int s; /* Shift amount for norm. */
> +
> + /* If overflow, set rem. to an impossible value. */
> + if (u1 >= v) {
> + if (r != NULL)
> + *r = (uint64_t) -1;
> + return (uint64_t) -1;
> + }
> +
> + /* Count leading zeros. */
> + s = __builtin_clzll(v);
> + if (s > 0) {
> + v = v << s;
> + un64 = (u1 << s) | ((u0 >> (64 - s)) & (-s >> 31));
> + un10 = u0 << s;
> + } else {
> +
> + un64 = u1 | u0;
> + un10 = u0;
> + }
> +
> + vn1 = v >> 32;
> + vn0 = v & 0xFFFFFFFF;
> +
> + un1 = un10 >> 32;
> + un0 = un10 & 0xFFFFFFFF;
> +
> + q1 = un64/vn1;
> + rhat = un64 - q1*vn1;
> +again1:
> + if (q1 >= b || q1*vn0 > b*rhat + un1) {
> + q1 = q1 - 1;
> + rhat = rhat + vn1;
> + if (rhat < b)
> + goto again1;
> + }
> +
> + un21 = un64*b + un1 - q1*v;
> +
> + q0 = un21/vn1;
> + rhat = un21 - q0*vn1;
> +again2:
> + if (q0 >= b || q0*vn0 > b*rhat + un0) {
> + q0 = q0 - 1;
> + rhat = rhat + vn1;
> + if (rhat < b)
> + goto again2;
> + }
> +
> + if (r != NULL)
> + *r = (un21*b + un0 - q0*v) >> s;
> + return q1*b + q0;
> +}
> +
> +struct rte_reciprocal_u64
> +rte_reciprocal_value_u64(uint64_t d)
> +{
> + struct rte_reciprocal_u64 R;
> +
> + const uint32_t fld = 63 - __builtin_clzll(d);
> +
> + if ((d & (d - 1)) == 0) {
> + R.m = 0;
> + R.sh1 = (fld - 1) | 0x40;
> + } else {
> + uint64_t rem;
> + uint64_t multiplier;
> + uint8_t more;
> +
> + multiplier = divide_128_div_64_to_64(1ULL << fld, 0, d, &rem);
> + multiplier += multiplier;
> +
> + const uint64_t twice_rem = rem + rem;
> + if (twice_rem >= d || twice_rem < rem)
> + multiplier += 1;
> + more = fld;
> + R.m = 1 + multiplier;
> + R.sh1 = more | 0x40;
> + }
> +
> + R.sh1 &= 0x3F;
> +
> + return R;
> +}
> diff --git a/lib/librte_eal/linuxapp/eal/rte_eal_version.map b/lib/librte_eal/linuxapp/eal/rte_eal_version.map
> index 2070cba..2671627 100644
> --- a/lib/librte_eal/linuxapp/eal/rte_eal_version.map
> +++ b/lib/librte_eal/linuxapp/eal/rte_eal_version.map
> @@ -246,6 +246,7 @@ EXPERIMENTAL {
> DPDK_17.11 {
> global:
>
> - rte_reciprocal_value;
> + rte_reciprocal_value_u32;
> + rte_reciprocal_value_u64;
>
> } DPDK_17.08;
> diff --git a/lib/librte_sched/Makefile b/lib/librte_sched/Makefile
> index 569656b..a2fd6f3 100644
> --- a/lib/librte_sched/Makefile
> +++ b/lib/librte_sched/Makefile
> @@ -54,6 +54,8 @@ LIBABIVER := 1
> SRCS-$(CONFIG_RTE_LIBRTE_SCHED) += rte_sched.c rte_red.c rte_approx.c
>
> # install includes
> -SYMLINK-$(CONFIG_RTE_LIBRTE_SCHED)-include := rte_sched.h rte_bitmap.h rte_sched_common.h rte_red.h rte_approx.h
> +SYMLINK-$(CONFIG_RTE_LIBRTE_SCHED)-include := rte_sched.h rte_bitmap.h
> +SYMLINK-$(CONFIG_RTE_LIBRTE_SCHED)-include += rte_sched_common.h rte_red.h
> +SYMLINK-$(CONFIG_RTE_LIBRTE_SCHED)-include += rte_approx.h
>
> include $(RTE_SDK)/mk/rte.lib.mk
> diff --git a/lib/librte_sched/rte_sched.c b/lib/librte_sched/rte_sched.c
> index 3b8ccaa..7bb6d51 100644
> --- a/lib/librte_sched/rte_sched.c
> +++ b/lib/librte_sched/rte_sched.c
> @@ -228,7 +228,7 @@ struct rte_sched_port {
> uint64_t time_cpu_cycles; /* Current CPU time measured in CPU cyles */
> uint64_t time_cpu_bytes; /* Current CPU time measured in bytes */
> uint64_t time; /* Current NIC TX time measured in bytes */
> - struct rte_reciprocal inv_cycles_per_byte; /* CPU cycles per byte */
> + struct rte_reciprocal_u32 inv_cycles_per_byte; /* CPU cycles per byte */
>
> /* Scheduling loop detection */
> uint32_t pipe_loop;
> @@ -677,7 +677,7 @@ rte_sched_port_config(struct rte_sched_port_params *params)
>
> cycles_per_byte = (rte_get_tsc_hz() << RTE_SCHED_TIME_SHIFT)
> / params->rate;
> - port->inv_cycles_per_byte = rte_reciprocal_value(cycles_per_byte);
> + port->inv_cycles_per_byte = rte_reciprocal_value_u32(cycles_per_byte);
>
> /* Scheduling loop detection */
> port->pipe_loop = RTE_SCHED_PIPE_INVALID;
> @@ -2147,8 +2147,9 @@ rte_sched_port_time_resync(struct rte_sched_port *port)
> uint64_t bytes_diff;
>
> /* Compute elapsed time in bytes */
> - bytes_diff = rte_reciprocal_divide(cycles_diff << RTE_SCHED_TIME_SHIFT,
> - port->inv_cycles_per_byte);
> + bytes_diff = rte_reciprocal_divide_u32(
> + cycles_diff << RTE_SCHED_TIME_SHIFT,
> + &port->inv_cycles_per_byte);
>
> /* Advance port time */
> port->time_cpu_cycles = cycles;
>
^ permalink raw reply [flat|nested] 11+ messages in thread
* Re: [dpdk-dev] [PATCH v6 2/3] eal: add u64 bit variant for reciprocal
2017-09-06 12:28 ` Kevin Traynor
@ 2017-09-06 14:41 ` Pavan Nikhilesh Bhagavatula
2017-09-06 15:35 ` Kevin Traynor
2017-09-06 15:37 ` Stephen Hemminger
0 siblings, 2 replies; 11+ messages in thread
From: Pavan Nikhilesh Bhagavatula @ 2017-09-06 14:41 UTC (permalink / raw)
To: Kevin Traynor, stephen, cristian.dumitrescu; +Cc: dev
On Wed, Sep 06, 2017 at 01:28:24PM +0100, Kevin Traynor wrote:
> On 09/06/2017 11:21 AM, Pavan Nikhilesh wrote:
> > From: Pavan Bhagavatula <pbhagavatula@caviumnetworks.com>
> >
> > Currently, rte_reciprocal only supports unsigned 32bit divisors. This
> > commit adds support for unsigned 64bit divisors.
> >
> > Rename unsigned 32bit specific functions appropriately and update
> > librte_sched accordingly.
> >
> > Signed-off-by: Pavan Nikhilesh <pbhagavatula@caviumnetworks.com>
> > ---
> > lib/librte_eal/bsdapp/eal/rte_eal_version.map | 3 +-
> > lib/librte_eal/common/include/rte_reciprocal.h | 109 ++++++++++++++++++++--
> > lib/librte_eal/common/rte_reciprocal.c | 116 +++++++++++++++++++++---
> > lib/librte_eal/linuxapp/eal/rte_eal_version.map | 3 +-
> > lib/librte_sched/Makefile | 4 +-
> > lib/librte_sched/rte_sched.c | 9 +-
> > 6 files changed, 219 insertions(+), 25 deletions(-)
> >
> > diff --git a/lib/librte_eal/bsdapp/eal/rte_eal_version.map b/lib/librte_eal/bsdapp/eal/rte_eal_version.map
> > index 90d7258..59a85bb 100644
> > --- a/lib/librte_eal/bsdapp/eal/rte_eal_version.map
> > +++ b/lib/librte_eal/bsdapp/eal/rte_eal_version.map
> > @@ -241,6 +241,7 @@ EXPERIMENTAL {
> > DPDK_17.11 {
> > global:
> >
> > - rte_reciprocal_value;
> > + rte_reciprocal_value_u32;
> > + rte_reciprocal_value_u64;
> >
> > } DPDK_17.08;
> > diff --git a/lib/librte_eal/common/include/rte_reciprocal.h b/lib/librte_eal/common/include/rte_reciprocal.h
> > index b6d752f..85599e6 100644
> > --- a/lib/librte_eal/common/include/rte_reciprocal.h
> > +++ b/lib/librte_eal/common/include/rte_reciprocal.h
>
> Hi Pavan, sorry for commenting late but the license in v1 of this file
> states it cannot be removed. It is not included in later versions - can
> you explain why?
>
Hi Kevin,
I have misinterpreted this mail
http://dpdk.org/ml/archives/dev/2017-August/073781.html,
any suggestion on how to proceed on this further?
Thanks,
Pavan
> +/*
> + * libdivide
> + * Copyright (C) 2010 ridiculous_fish
> + * This software is provided 'as-is', without any express or implied
> + * warranty. In no event will the authors be held liable for any damages
> + * arising from the use of this software.
> + * Permission is granted to anyone to use this software for any purpose,
> + * including commercial applications, and to alter it and redistribute it
> + * freely, subject to the following restrictions:
> + *
> + * 1. The origin of this software must not be misrepresented; you must not
> + * claim that you wrote the original software. If you use this software
> + * in a product, an acknowledgment in the product documentation would be
> + * appreciated but is not required.
> + *
> + * 2. Altered source versions must be plainly marked as such, and must
> not be
> + * misrepresented as being the original software.
> + *
> + * 3. This notice may not be removed or altered from any source
> distribution.
> + *
> + * libdivide@ridiculousfish.com
> + *
> + */
> +
>
>
>
> > @@ -22,22 +22,117 @@
> > #ifndef _RTE_RECIPROCAL_H_
> > #define _RTE_RECIPROCAL_H_
> >
> > -#include <stdint.h>
> > +#include <rte_memory.h>
> >
> > -struct rte_reciprocal {
> > +/**
> > + * Unsigned 32-bit divisor structure.
> > + */
> > +struct rte_reciprocal_u32 {
> > uint32_t m;
> > uint8_t sh1, sh2;
> > };
> >
> > +/**
> > + * Unsigned 64-bit divisor structure.
> > + */
> > +struct rte_reciprocal_u64 {
> > + uint64_t m;
> > + uint8_t sh1;
> > +};
> > +
> > +/**
> > + * Divide given unsigned 32-bit integer with pre calculated divisor.
> > + *
> > + * @param a
> > + * The 32-bit dividend.
> > + * @param R
> > + * The pointer to pre calculated divisor reciprocal structure.
> > + *
> > + * @return
> > + * The result of the division
> > + */
> > static inline uint32_t
> > -rte_reciprocal_divide(uint32_t a, struct rte_reciprocal R)
> > +rte_reciprocal_divide_u32(uint32_t a, struct rte_reciprocal_u32 *R)
> > {
> > - uint32_t t = (uint32_t)(((uint64_t)a * R.m) >> 32);
> > + uint32_t t = (((uint64_t)a * R->m) >> 32);
> >
> > - return (t + ((a - t) >> R.sh1)) >> R.sh2;
> > + return (t + ((a - t) >> R->sh1)) >> R->sh2;
> > }
> >
> > -struct rte_reciprocal
> > -rte_reciprocal_value(uint32_t d);
> > +static inline uint64_t
> > +mullhi_u64(uint64_t x, uint64_t y)
> > +{
> > +#ifdef __SIZEOF_INT128__
> > + __uint128_t xl = x;
> > + __uint128_t rl = xl * y;
> > +
> > + return (rl >> 64);
> > +#else
> > + uint64_t u0, u1, v0, v1, k, t;
> > + uint64_t w1, w2;
> > + uint64_t whi;
> > +
> > + u1 = x >> 32; u0 = x & 0xFFFFFFFF;
> > + v1 = y >> 32; v0 = y & 0xFFFFFFFF;
> > +
> > + t = u0*v0;
> > + k = t >> 32;
> > +
> > + t = u1*v0 + k;
> > + w1 = t & 0xFFFFFFFF;
> > + w2 = t >> 32;
> > +
> > + t = u0*v1 + w1;
> > + k = t >> 32;
> > +
> > + whi = u1*v1 + w2 + k;
> > +
> > + return whi;
> > +#endif
> > +}
> > +
> > +/**
> > + * Divide given unsigned 64-bit integer with pre calculated divisor.
> > + *
> > + * @param a
> > + * The 64-bit dividend.
> > + * @param R
> > + * The pointer to pre calculated divisor reciprocal structure.
> > + *
> > + * @return
> > + * The result of the division
> > + */
> > +static inline uint64_t
> > +rte_reciprocal_divide_u64(uint64_t a, struct rte_reciprocal_u64 *R)
> > +{
> > + uint64_t q = mullhi_u64(R->m, a);
> > + uint64_t t = ((a - q) >> 1) + q;
> > +
> > + return t >> R->sh1;
> > +}
> > +
> > +/**
> > + * Generate pre calculated divisor structure.
> > + *
> > + * @param d
> > + * The unsigned 32-bit divisor.
> > + *
> > + * @return
> > + * Divisor structure.
> > + */
> > +struct rte_reciprocal_u32
> > +rte_reciprocal_value_u32(uint32_t d);
> > +
> > +/**
> > + * Generate pre calculated divisor structure.
> > + *
> > + * @param d
> > + * The unsigned 64-bit divisor.
> > + *
> > + * @return
> > + * Divisor structure.
> > + */
> > +struct rte_reciprocal_u64
> > +rte_reciprocal_value_u64(uint64_t d);
> >
> > #endif /* _RTE_RECIPROCAL_H_ */
> > diff --git a/lib/librte_eal/common/rte_reciprocal.c b/lib/librte_eal/common/rte_reciprocal.c
> > index 7ab99b4..2024e62 100644
> > --- a/lib/librte_eal/common/rte_reciprocal.c
> > +++ b/lib/librte_eal/common/rte_reciprocal.c
> > @@ -31,18 +31,13 @@
> > * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
> > */
> >
> > -#include <stdio.h>
> > -#include <stdint.h>
> > -
> > -#include <rte_common.h>
> > -
> > -#include "rte_reciprocal.h"
> > +#include <rte_reciprocal.h>
> >
> > /* find largest set bit.
> > * portable and slow but does not matter for this usage.
> > */
> > static inline int
> > -fls(uint32_t x)
> > +fls_u32(uint32_t x)
> > {
> > int b;
> >
> > @@ -54,14 +49,14 @@ fls(uint32_t x)
> > return 0;
> > }
> >
> > -struct rte_reciprocal
> > -rte_reciprocal_value(uint32_t d)
> > +struct rte_reciprocal_u32
> > +rte_reciprocal_value_u32(uint32_t d)
> > {
> > - struct rte_reciprocal R;
> > + struct rte_reciprocal_u32 R;
> > uint64_t m;
> > int l;
> >
> > - l = fls(d - 1);
> > + l = fls_u32(d - 1);
> > m = ((1ULL << 32) * ((1ULL << l) - d));
> > m /= d;
> >
> > @@ -72,3 +67,102 @@ rte_reciprocal_value(uint32_t d)
> >
> > return R;
> > }
> > +
> > +/* Code taken from Hacker's Delight:
> > + * http://www.hackersdelight.org/HDcode/divlu.c.
> > + * License permits inclusion here per:
> > + * http://www.hackersdelight.org/permissions.htm
> > + */
> > +static inline uint64_t
> > +divide_128_div_64_to_64(uint64_t u1, uint64_t u0, uint64_t v, uint64_t *r)
> > +{
> > + const uint64_t b = (1ULL << 32); /* Number base (16 bits). */
> > + uint64_t un1, un0, /* Norm. dividend LSD's. */
> > + vn1, vn0, /* Norm. divisor digits. */
> > + q1, q0, /* Quotient digits. */
> > + un64, un21, un10, /* Dividend digit pairs. */
> > + rhat; /* A remainder. */
> > + int s; /* Shift amount for norm. */
> > +
> > + /* If overflow, set rem. to an impossible value. */
> > + if (u1 >= v) {
> > + if (r != NULL)
> > + *r = (uint64_t) -1;
> > + return (uint64_t) -1;
> > + }
> > +
> > + /* Count leading zeros. */
> > + s = __builtin_clzll(v);
> > + if (s > 0) {
> > + v = v << s;
> > + un64 = (u1 << s) | ((u0 >> (64 - s)) & (-s >> 31));
> > + un10 = u0 << s;
> > + } else {
> > +
> > + un64 = u1 | u0;
> > + un10 = u0;
> > + }
> > +
> > + vn1 = v >> 32;
> > + vn0 = v & 0xFFFFFFFF;
> > +
> > + un1 = un10 >> 32;
> > + un0 = un10 & 0xFFFFFFFF;
> > +
> > + q1 = un64/vn1;
> > + rhat = un64 - q1*vn1;
> > +again1:
> > + if (q1 >= b || q1*vn0 > b*rhat + un1) {
> > + q1 = q1 - 1;
> > + rhat = rhat + vn1;
> > + if (rhat < b)
> > + goto again1;
> > + }
> > +
> > + un21 = un64*b + un1 - q1*v;
> > +
> > + q0 = un21/vn1;
> > + rhat = un21 - q0*vn1;
> > +again2:
> > + if (q0 >= b || q0*vn0 > b*rhat + un0) {
> > + q0 = q0 - 1;
> > + rhat = rhat + vn1;
> > + if (rhat < b)
> > + goto again2;
> > + }
> > +
> > + if (r != NULL)
> > + *r = (un21*b + un0 - q0*v) >> s;
> > + return q1*b + q0;
> > +}
> > +
> > +struct rte_reciprocal_u64
> > +rte_reciprocal_value_u64(uint64_t d)
> > +{
> > + struct rte_reciprocal_u64 R;
> > +
> > + const uint32_t fld = 63 - __builtin_clzll(d);
> > +
> > + if ((d & (d - 1)) == 0) {
> > + R.m = 0;
> > + R.sh1 = (fld - 1) | 0x40;
> > + } else {
> > + uint64_t rem;
> > + uint64_t multiplier;
> > + uint8_t more;
> > +
> > + multiplier = divide_128_div_64_to_64(1ULL << fld, 0, d, &rem);
> > + multiplier += multiplier;
> > +
> > + const uint64_t twice_rem = rem + rem;
> > + if (twice_rem >= d || twice_rem < rem)
> > + multiplier += 1;
> > + more = fld;
> > + R.m = 1 + multiplier;
> > + R.sh1 = more | 0x40;
> > + }
> > +
> > + R.sh1 &= 0x3F;
> > +
> > + return R;
> > +}
> > diff --git a/lib/librte_eal/linuxapp/eal/rte_eal_version.map b/lib/librte_eal/linuxapp/eal/rte_eal_version.map
> > index 2070cba..2671627 100644
> > --- a/lib/librte_eal/linuxapp/eal/rte_eal_version.map
> > +++ b/lib/librte_eal/linuxapp/eal/rte_eal_version.map
> > @@ -246,6 +246,7 @@ EXPERIMENTAL {
> > DPDK_17.11 {
> > global:
> >
> > - rte_reciprocal_value;
> > + rte_reciprocal_value_u32;
> > + rte_reciprocal_value_u64;
> >
> > } DPDK_17.08;
> > diff --git a/lib/librte_sched/Makefile b/lib/librte_sched/Makefile
> > index 569656b..a2fd6f3 100644
> > --- a/lib/librte_sched/Makefile
> > +++ b/lib/librte_sched/Makefile
> > @@ -54,6 +54,8 @@ LIBABIVER := 1
> > SRCS-$(CONFIG_RTE_LIBRTE_SCHED) += rte_sched.c rte_red.c rte_approx.c
> >
> > # install includes
> > -SYMLINK-$(CONFIG_RTE_LIBRTE_SCHED)-include := rte_sched.h rte_bitmap.h rte_sched_common.h rte_red.h rte_approx.h
> > +SYMLINK-$(CONFIG_RTE_LIBRTE_SCHED)-include := rte_sched.h rte_bitmap.h
> > +SYMLINK-$(CONFIG_RTE_LIBRTE_SCHED)-include += rte_sched_common.h rte_red.h
> > +SYMLINK-$(CONFIG_RTE_LIBRTE_SCHED)-include += rte_approx.h
> >
> > include $(RTE_SDK)/mk/rte.lib.mk
> > diff --git a/lib/librte_sched/rte_sched.c b/lib/librte_sched/rte_sched.c
> > index 3b8ccaa..7bb6d51 100644
> > --- a/lib/librte_sched/rte_sched.c
> > +++ b/lib/librte_sched/rte_sched.c
> > @@ -228,7 +228,7 @@ struct rte_sched_port {
> > uint64_t time_cpu_cycles; /* Current CPU time measured in CPU cyles */
> > uint64_t time_cpu_bytes; /* Current CPU time measured in bytes */
> > uint64_t time; /* Current NIC TX time measured in bytes */
> > - struct rte_reciprocal inv_cycles_per_byte; /* CPU cycles per byte */
> > + struct rte_reciprocal_u32 inv_cycles_per_byte; /* CPU cycles per byte */
> >
> > /* Scheduling loop detection */
> > uint32_t pipe_loop;
> > @@ -677,7 +677,7 @@ rte_sched_port_config(struct rte_sched_port_params *params)
> >
> > cycles_per_byte = (rte_get_tsc_hz() << RTE_SCHED_TIME_SHIFT)
> > / params->rate;
> > - port->inv_cycles_per_byte = rte_reciprocal_value(cycles_per_byte);
> > + port->inv_cycles_per_byte = rte_reciprocal_value_u32(cycles_per_byte);
> >
> > /* Scheduling loop detection */
> > port->pipe_loop = RTE_SCHED_PIPE_INVALID;
> > @@ -2147,8 +2147,9 @@ rte_sched_port_time_resync(struct rte_sched_port *port)
> > uint64_t bytes_diff;
> >
> > /* Compute elapsed time in bytes */
> > - bytes_diff = rte_reciprocal_divide(cycles_diff << RTE_SCHED_TIME_SHIFT,
> > - port->inv_cycles_per_byte);
> > + bytes_diff = rte_reciprocal_divide_u32(
> > + cycles_diff << RTE_SCHED_TIME_SHIFT,
> > + &port->inv_cycles_per_byte);
> >
> > /* Advance port time */
> > port->time_cpu_cycles = cycles;
> >
>
^ permalink raw reply [flat|nested] 11+ messages in thread
* Re: [dpdk-dev] [PATCH v6 2/3] eal: add u64 bit variant for reciprocal
2017-09-06 14:41 ` Pavan Nikhilesh Bhagavatula
@ 2017-09-06 15:35 ` Kevin Traynor
2017-09-06 15:37 ` Stephen Hemminger
1 sibling, 0 replies; 11+ messages in thread
From: Kevin Traynor @ 2017-09-06 15:35 UTC (permalink / raw)
To: Pavan Nikhilesh Bhagavatula, stephen, cristian.dumitrescu; +Cc: dev
On 09/06/2017 03:41 PM, Pavan Nikhilesh Bhagavatula wrote:
> On Wed, Sep 06, 2017 at 01:28:24PM +0100, Kevin Traynor wrote:
>> On 09/06/2017 11:21 AM, Pavan Nikhilesh wrote:
>>> From: Pavan Bhagavatula <pbhagavatula@caviumnetworks.com>
>>>
>>> Currently, rte_reciprocal only supports unsigned 32bit divisors. This
>>> commit adds support for unsigned 64bit divisors.
>>>
>>> Rename unsigned 32bit specific functions appropriately and update
>>> librte_sched accordingly.
>>>
>>> Signed-off-by: Pavan Nikhilesh <pbhagavatula@caviumnetworks.com>
>>> ---
>>> lib/librte_eal/bsdapp/eal/rte_eal_version.map | 3 +-
>>> lib/librte_eal/common/include/rte_reciprocal.h | 109 ++++++++++++++++++++--
>>> lib/librte_eal/common/rte_reciprocal.c | 116 +++++++++++++++++++++---
>>> lib/librte_eal/linuxapp/eal/rte_eal_version.map | 3 +-
>>> lib/librte_sched/Makefile | 4 +-
>>> lib/librte_sched/rte_sched.c | 9 +-
>>> 6 files changed, 219 insertions(+), 25 deletions(-)
>>>
>>> diff --git a/lib/librte_eal/bsdapp/eal/rte_eal_version.map b/lib/librte_eal/bsdapp/eal/rte_eal_version.map
>>> index 90d7258..59a85bb 100644
>>> --- a/lib/librte_eal/bsdapp/eal/rte_eal_version.map
>>> +++ b/lib/librte_eal/bsdapp/eal/rte_eal_version.map
>>> @@ -241,6 +241,7 @@ EXPERIMENTAL {
>>> DPDK_17.11 {
>>> global:
>>>
>>> - rte_reciprocal_value;
>>> + rte_reciprocal_value_u32;
>>> + rte_reciprocal_value_u64;
>>>
>>> } DPDK_17.08;
>>> diff --git a/lib/librte_eal/common/include/rte_reciprocal.h b/lib/librte_eal/common/include/rte_reciprocal.h
>>> index b6d752f..85599e6 100644
>>> --- a/lib/librte_eal/common/include/rte_reciprocal.h
>>> +++ b/lib/librte_eal/common/include/rte_reciprocal.h
>>
>> Hi Pavan, sorry for commenting late but the license in v1 of this file
>> states it cannot be removed. It is not included in later versions - can
>> you explain why?
>>
> Hi Kevin,
>
> I have misinterpreted this mail
> http://dpdk.org/ml/archives/dev/2017-August/073781.html,
> any suggestion on how to proceed on this further?
>
> Thanks,
> Pavan
>
no, not really :( maybe someone else has a suggestion.
The DPDK charter [1] (6.IP Policy) lists the incoming licenses that are
accepted. There is a note about getting governing board approval for an
exception, but I don't think it's applicable to a relatively small
optimization like this.
Kevin.
[1] http://dpdk.org/about/charter
>> +/*
>> + * libdivide
>> + * Copyright (C) 2010 ridiculous_fish
>> + * This software is provided 'as-is', without any express or implied
>> + * warranty. In no event will the authors be held liable for any damages
>> + * arising from the use of this software.
>> + * Permission is granted to anyone to use this software for any purpose,
>> + * including commercial applications, and to alter it and redistribute it
>> + * freely, subject to the following restrictions:
>> + *
>> + * 1. The origin of this software must not be misrepresented; you must not
>> + * claim that you wrote the original software. If you use this software
>> + * in a product, an acknowledgment in the product documentation would be
>> + * appreciated but is not required.
>> + *
>> + * 2. Altered source versions must be plainly marked as such, and must
>> not be
>> + * misrepresented as being the original software.
>> + *
>> + * 3. This notice may not be removed or altered from any source
>> distribution.
>> + *
>> + * libdivide@ridiculousfish.com
>> + *
>> + */
>> +
>>
>>
>>
>>> @@ -22,22 +22,117 @@
>>> #ifndef _RTE_RECIPROCAL_H_
>>> #define _RTE_RECIPROCAL_H_
>>>
>>> -#include <stdint.h>
>>> +#include <rte_memory.h>
>>>
>>> -struct rte_reciprocal {
>>> +/**
>>> + * Unsigned 32-bit divisor structure.
>>> + */
>>> +struct rte_reciprocal_u32 {
>>> uint32_t m;
>>> uint8_t sh1, sh2;
>>> };
>>>
>>> +/**
>>> + * Unsigned 64-bit divisor structure.
>>> + */
>>> +struct rte_reciprocal_u64 {
>>> + uint64_t m;
>>> + uint8_t sh1;
>>> +};
>>> +
>>> +/**
>>> + * Divide given unsigned 32-bit integer with pre calculated divisor.
>>> + *
>>> + * @param a
>>> + * The 32-bit dividend.
>>> + * @param R
>>> + * The pointer to pre calculated divisor reciprocal structure.
>>> + *
>>> + * @return
>>> + * The result of the division
>>> + */
>>> static inline uint32_t
>>> -rte_reciprocal_divide(uint32_t a, struct rte_reciprocal R)
>>> +rte_reciprocal_divide_u32(uint32_t a, struct rte_reciprocal_u32 *R)
>>> {
>>> - uint32_t t = (uint32_t)(((uint64_t)a * R.m) >> 32);
>>> + uint32_t t = (((uint64_t)a * R->m) >> 32);
>>>
>>> - return (t + ((a - t) >> R.sh1)) >> R.sh2;
>>> + return (t + ((a - t) >> R->sh1)) >> R->sh2;
>>> }
>>>
>>> -struct rte_reciprocal
>>> -rte_reciprocal_value(uint32_t d);
>>> +static inline uint64_t
>>> +mullhi_u64(uint64_t x, uint64_t y)
>>> +{
>>> +#ifdef __SIZEOF_INT128__
>>> + __uint128_t xl = x;
>>> + __uint128_t rl = xl * y;
>>> +
>>> + return (rl >> 64);
>>> +#else
>>> + uint64_t u0, u1, v0, v1, k, t;
>>> + uint64_t w1, w2;
>>> + uint64_t whi;
>>> +
>>> + u1 = x >> 32; u0 = x & 0xFFFFFFFF;
>>> + v1 = y >> 32; v0 = y & 0xFFFFFFFF;
>>> +
>>> + t = u0*v0;
>>> + k = t >> 32;
>>> +
>>> + t = u1*v0 + k;
>>> + w1 = t & 0xFFFFFFFF;
>>> + w2 = t >> 32;
>>> +
>>> + t = u0*v1 + w1;
>>> + k = t >> 32;
>>> +
>>> + whi = u1*v1 + w2 + k;
>>> +
>>> + return whi;
>>> +#endif
>>> +}
>>> +
>>> +/**
>>> + * Divide given unsigned 64-bit integer with pre calculated divisor.
>>> + *
>>> + * @param a
>>> + * The 64-bit dividend.
>>> + * @param R
>>> + * The pointer to pre calculated divisor reciprocal structure.
>>> + *
>>> + * @return
>>> + * The result of the division
>>> + */
>>> +static inline uint64_t
>>> +rte_reciprocal_divide_u64(uint64_t a, struct rte_reciprocal_u64 *R)
>>> +{
>>> + uint64_t q = mullhi_u64(R->m, a);
>>> + uint64_t t = ((a - q) >> 1) + q;
>>> +
>>> + return t >> R->sh1;
>>> +}
>>> +
>>> +/**
>>> + * Generate pre calculated divisor structure.
>>> + *
>>> + * @param d
>>> + * The unsigned 32-bit divisor.
>>> + *
>>> + * @return
>>> + * Divisor structure.
>>> + */
>>> +struct rte_reciprocal_u32
>>> +rte_reciprocal_value_u32(uint32_t d);
>>> +
>>> +/**
>>> + * Generate pre calculated divisor structure.
>>> + *
>>> + * @param d
>>> + * The unsigned 64-bit divisor.
>>> + *
>>> + * @return
>>> + * Divisor structure.
>>> + */
>>> +struct rte_reciprocal_u64
>>> +rte_reciprocal_value_u64(uint64_t d);
>>>
>>> #endif /* _RTE_RECIPROCAL_H_ */
>>> diff --git a/lib/librte_eal/common/rte_reciprocal.c b/lib/librte_eal/common/rte_reciprocal.c
>>> index 7ab99b4..2024e62 100644
>>> --- a/lib/librte_eal/common/rte_reciprocal.c
>>> +++ b/lib/librte_eal/common/rte_reciprocal.c
>>> @@ -31,18 +31,13 @@
>>> * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
>>> */
>>>
>>> -#include <stdio.h>
>>> -#include <stdint.h>
>>> -
>>> -#include <rte_common.h>
>>> -
>>> -#include "rte_reciprocal.h"
>>> +#include <rte_reciprocal.h>
>>>
>>> /* find largest set bit.
>>> * portable and slow but does not matter for this usage.
>>> */
>>> static inline int
>>> -fls(uint32_t x)
>>> +fls_u32(uint32_t x)
>>> {
>>> int b;
>>>
>>> @@ -54,14 +49,14 @@ fls(uint32_t x)
>>> return 0;
>>> }
>>>
>>> -struct rte_reciprocal
>>> -rte_reciprocal_value(uint32_t d)
>>> +struct rte_reciprocal_u32
>>> +rte_reciprocal_value_u32(uint32_t d)
>>> {
>>> - struct rte_reciprocal R;
>>> + struct rte_reciprocal_u32 R;
>>> uint64_t m;
>>> int l;
>>>
>>> - l = fls(d - 1);
>>> + l = fls_u32(d - 1);
>>> m = ((1ULL << 32) * ((1ULL << l) - d));
>>> m /= d;
>>>
>>> @@ -72,3 +67,102 @@ rte_reciprocal_value(uint32_t d)
>>>
>>> return R;
>>> }
>>> +
>>> +/* Code taken from Hacker's Delight:
>>> + * http://www.hackersdelight.org/HDcode/divlu.c.
>>> + * License permits inclusion here per:
>>> + * http://www.hackersdelight.org/permissions.htm
>>> + */
>>> +static inline uint64_t
>>> +divide_128_div_64_to_64(uint64_t u1, uint64_t u0, uint64_t v, uint64_t *r)
>>> +{
>>> + const uint64_t b = (1ULL << 32); /* Number base (16 bits). */
>>> + uint64_t un1, un0, /* Norm. dividend LSD's. */
>>> + vn1, vn0, /* Norm. divisor digits. */
>>> + q1, q0, /* Quotient digits. */
>>> + un64, un21, un10, /* Dividend digit pairs. */
>>> + rhat; /* A remainder. */
>>> + int s; /* Shift amount for norm. */
>>> +
>>> + /* If overflow, set rem. to an impossible value. */
>>> + if (u1 >= v) {
>>> + if (r != NULL)
>>> + *r = (uint64_t) -1;
>>> + return (uint64_t) -1;
>>> + }
>>> +
>>> + /* Count leading zeros. */
>>> + s = __builtin_clzll(v);
>>> + if (s > 0) {
>>> + v = v << s;
>>> + un64 = (u1 << s) | ((u0 >> (64 - s)) & (-s >> 31));
>>> + un10 = u0 << s;
>>> + } else {
>>> +
>>> + un64 = u1 | u0;
>>> + un10 = u0;
>>> + }
>>> +
>>> + vn1 = v >> 32;
>>> + vn0 = v & 0xFFFFFFFF;
>>> +
>>> + un1 = un10 >> 32;
>>> + un0 = un10 & 0xFFFFFFFF;
>>> +
>>> + q1 = un64/vn1;
>>> + rhat = un64 - q1*vn1;
>>> +again1:
>>> + if (q1 >= b || q1*vn0 > b*rhat + un1) {
>>> + q1 = q1 - 1;
>>> + rhat = rhat + vn1;
>>> + if (rhat < b)
>>> + goto again1;
>>> + }
>>> +
>>> + un21 = un64*b + un1 - q1*v;
>>> +
>>> + q0 = un21/vn1;
>>> + rhat = un21 - q0*vn1;
>>> +again2:
>>> + if (q0 >= b || q0*vn0 > b*rhat + un0) {
>>> + q0 = q0 - 1;
>>> + rhat = rhat + vn1;
>>> + if (rhat < b)
>>> + goto again2;
>>> + }
>>> +
>>> + if (r != NULL)
>>> + *r = (un21*b + un0 - q0*v) >> s;
>>> + return q1*b + q0;
>>> +}
>>> +
>>> +struct rte_reciprocal_u64
>>> +rte_reciprocal_value_u64(uint64_t d)
>>> +{
>>> + struct rte_reciprocal_u64 R;
>>> +
>>> + const uint32_t fld = 63 - __builtin_clzll(d);
>>> +
>>> + if ((d & (d - 1)) == 0) {
>>> + R.m = 0;
>>> + R.sh1 = (fld - 1) | 0x40;
>>> + } else {
>>> + uint64_t rem;
>>> + uint64_t multiplier;
>>> + uint8_t more;
>>> +
>>> + multiplier = divide_128_div_64_to_64(1ULL << fld, 0, d, &rem);
>>> + multiplier += multiplier;
>>> +
>>> + const uint64_t twice_rem = rem + rem;
>>> + if (twice_rem >= d || twice_rem < rem)
>>> + multiplier += 1;
>>> + more = fld;
>>> + R.m = 1 + multiplier;
>>> + R.sh1 = more | 0x40;
>>> + }
>>> +
>>> + R.sh1 &= 0x3F;
>>> +
>>> + return R;
>>> +}
>>> diff --git a/lib/librte_eal/linuxapp/eal/rte_eal_version.map b/lib/librte_eal/linuxapp/eal/rte_eal_version.map
>>> index 2070cba..2671627 100644
>>> --- a/lib/librte_eal/linuxapp/eal/rte_eal_version.map
>>> +++ b/lib/librte_eal/linuxapp/eal/rte_eal_version.map
>>> @@ -246,6 +246,7 @@ EXPERIMENTAL {
>>> DPDK_17.11 {
>>> global:
>>>
>>> - rte_reciprocal_value;
>>> + rte_reciprocal_value_u32;
>>> + rte_reciprocal_value_u64;
>>>
>>> } DPDK_17.08;
>>> diff --git a/lib/librte_sched/Makefile b/lib/librte_sched/Makefile
>>> index 569656b..a2fd6f3 100644
>>> --- a/lib/librte_sched/Makefile
>>> +++ b/lib/librte_sched/Makefile
>>> @@ -54,6 +54,8 @@ LIBABIVER := 1
>>> SRCS-$(CONFIG_RTE_LIBRTE_SCHED) += rte_sched.c rte_red.c rte_approx.c
>>>
>>> # install includes
>>> -SYMLINK-$(CONFIG_RTE_LIBRTE_SCHED)-include := rte_sched.h rte_bitmap.h rte_sched_common.h rte_red.h rte_approx.h
>>> +SYMLINK-$(CONFIG_RTE_LIBRTE_SCHED)-include := rte_sched.h rte_bitmap.h
>>> +SYMLINK-$(CONFIG_RTE_LIBRTE_SCHED)-include += rte_sched_common.h rte_red.h
>>> +SYMLINK-$(CONFIG_RTE_LIBRTE_SCHED)-include += rte_approx.h
>>>
>>> include $(RTE_SDK)/mk/rte.lib.mk
>>> diff --git a/lib/librte_sched/rte_sched.c b/lib/librte_sched/rte_sched.c
>>> index 3b8ccaa..7bb6d51 100644
>>> --- a/lib/librte_sched/rte_sched.c
>>> +++ b/lib/librte_sched/rte_sched.c
>>> @@ -228,7 +228,7 @@ struct rte_sched_port {
>>> uint64_t time_cpu_cycles; /* Current CPU time measured in CPU cyles */
>>> uint64_t time_cpu_bytes; /* Current CPU time measured in bytes */
>>> uint64_t time; /* Current NIC TX time measured in bytes */
>>> - struct rte_reciprocal inv_cycles_per_byte; /* CPU cycles per byte */
>>> + struct rte_reciprocal_u32 inv_cycles_per_byte; /* CPU cycles per byte */
>>>
>>> /* Scheduling loop detection */
>>> uint32_t pipe_loop;
>>> @@ -677,7 +677,7 @@ rte_sched_port_config(struct rte_sched_port_params *params)
>>>
>>> cycles_per_byte = (rte_get_tsc_hz() << RTE_SCHED_TIME_SHIFT)
>>> / params->rate;
>>> - port->inv_cycles_per_byte = rte_reciprocal_value(cycles_per_byte);
>>> + port->inv_cycles_per_byte = rte_reciprocal_value_u32(cycles_per_byte);
>>>
>>> /* Scheduling loop detection */
>>> port->pipe_loop = RTE_SCHED_PIPE_INVALID;
>>> @@ -2147,8 +2147,9 @@ rte_sched_port_time_resync(struct rte_sched_port *port)
>>> uint64_t bytes_diff;
>>>
>>> /* Compute elapsed time in bytes */
>>> - bytes_diff = rte_reciprocal_divide(cycles_diff << RTE_SCHED_TIME_SHIFT,
>>> - port->inv_cycles_per_byte);
>>> + bytes_diff = rte_reciprocal_divide_u32(
>>> + cycles_diff << RTE_SCHED_TIME_SHIFT,
>>> + &port->inv_cycles_per_byte);
>>>
>>> /* Advance port time */
>>> port->time_cpu_cycles = cycles;
>>>
>>
^ permalink raw reply [flat|nested] 11+ messages in thread
* Re: [dpdk-dev] [PATCH v6 2/3] eal: add u64 bit variant for reciprocal
2017-09-06 14:41 ` Pavan Nikhilesh Bhagavatula
2017-09-06 15:35 ` Kevin Traynor
@ 2017-09-06 15:37 ` Stephen Hemminger
2017-09-06 17:05 ` Dumitrescu, Cristian
1 sibling, 1 reply; 11+ messages in thread
From: Stephen Hemminger @ 2017-09-06 15:37 UTC (permalink / raw)
To: Pavan Nikhilesh Bhagavatula; +Cc: Kevin Traynor, cristian.dumitrescu, dev
On Wed, 6 Sep 2017 20:11:34 +0530
Pavan Nikhilesh Bhagavatula <pbhagavatula@caviumnetworks.com> wrote:
> On Wed, Sep 06, 2017 at 01:28:24PM +0100, Kevin Traynor wrote:
> > On 09/06/2017 11:21 AM, Pavan Nikhilesh wrote:
> > > From: Pavan Bhagavatula <pbhagavatula@caviumnetworks.com>
> > >
> > > Currently, rte_reciprocal only supports unsigned 32bit divisors. This
> > > commit adds support for unsigned 64bit divisors.
> > >
> > > Rename unsigned 32bit specific functions appropriately and update
> > > librte_sched accordingly.
> > >
> > > Signed-off-by: Pavan Nikhilesh <pbhagavatula@caviumnetworks.com>
> > > ---
> > > lib/librte_eal/bsdapp/eal/rte_eal_version.map | 3 +-
> > > lib/librte_eal/common/include/rte_reciprocal.h | 109 ++++++++++++++++++++--
> > > lib/librte_eal/common/rte_reciprocal.c | 116 +++++++++++++++++++++---
> > > lib/librte_eal/linuxapp/eal/rte_eal_version.map | 3 +-
> > > lib/librte_sched/Makefile | 4 +-
> > > lib/librte_sched/rte_sched.c | 9 +-
> > > 6 files changed, 219 insertions(+), 25 deletions(-)
> > >
> > > diff --git a/lib/librte_eal/bsdapp/eal/rte_eal_version.map b/lib/librte_eal/bsdapp/eal/rte_eal_version.map
> > > index 90d7258..59a85bb 100644
> > > --- a/lib/librte_eal/bsdapp/eal/rte_eal_version.map
> > > +++ b/lib/librte_eal/bsdapp/eal/rte_eal_version.map
> > > @@ -241,6 +241,7 @@ EXPERIMENTAL {
> > > DPDK_17.11 {
> > > global:
> > >
> > > - rte_reciprocal_value;
> > > + rte_reciprocal_value_u32;
> > > + rte_reciprocal_value_u64;
> > >
> > > } DPDK_17.08;
> > > diff --git a/lib/librte_eal/common/include/rte_reciprocal.h b/lib/librte_eal/common/include/rte_reciprocal.h
> > > index b6d752f..85599e6 100644
> > > --- a/lib/librte_eal/common/include/rte_reciprocal.h
> > > +++ b/lib/librte_eal/common/include/rte_reciprocal.h
> >
> > Hi Pavan, sorry for commenting late but the license in v1 of this file
> > states it cannot be removed. It is not included in later versions - can
> > you explain why?
> >
> Hi Kevin,
>
> I have misinterpreted this mail
> http://dpdk.org/ml/archives/dev/2017-August/073781.html,
> any suggestion on how to proceed on this further?
>
> Thanks,
> Pavan
License issues need legal advice (TAB could ask LF if required).
Sorry, I am a cynic engineer not a lawyer.
Easiest solution is to find equivalent code in FreeBSD or some other project
which does not have the restrictions.
^ permalink raw reply [flat|nested] 11+ messages in thread
* Re: [dpdk-dev] [PATCH v6 2/3] eal: add u64 bit variant for reciprocal
2017-09-06 15:37 ` Stephen Hemminger
@ 2017-09-06 17:05 ` Dumitrescu, Cristian
0 siblings, 0 replies; 11+ messages in thread
From: Dumitrescu, Cristian @ 2017-09-06 17:05 UTC (permalink / raw)
To: Stephen Hemminger, Pavan Nikhilesh Bhagavatula; +Cc: Kevin Traynor, dev
> -----Original Message-----
> From: Stephen Hemminger [mailto:stephen@networkplumber.org]
> Sent: Wednesday, September 6, 2017 4:37 PM
> To: Pavan Nikhilesh Bhagavatula <pbhagavatula@caviumnetworks.com>
> Cc: Kevin Traynor <ktraynor@redhat.com>; Dumitrescu, Cristian
> <cristian.dumitrescu@intel.com>; dev@dpdk.org
> Subject: Re: [dpdk-dev] [PATCH v6 2/3] eal: add u64 bit variant for reciprocal
>
> On Wed, 6 Sep 2017 20:11:34 +0530
> Pavan Nikhilesh Bhagavatula <pbhagavatula@caviumnetworks.com> wrote:
>
> > On Wed, Sep 06, 2017 at 01:28:24PM +0100, Kevin Traynor wrote:
> > > On 09/06/2017 11:21 AM, Pavan Nikhilesh wrote:
> > > > From: Pavan Bhagavatula <pbhagavatula@caviumnetworks.com>
> > > >
> > > > Currently, rte_reciprocal only supports unsigned 32bit divisors. This
> > > > commit adds support for unsigned 64bit divisors.
> > > >
> > > > Rename unsigned 32bit specific functions appropriately and update
> > > > librte_sched accordingly.
> > > >
> > > > Signed-off-by: Pavan Nikhilesh <pbhagavatula@caviumnetworks.com>
> > > > ---
> > > > lib/librte_eal/bsdapp/eal/rte_eal_version.map | 3 +-
> > > > lib/librte_eal/common/include/rte_reciprocal.h | 109
> ++++++++++++++++++++--
> > > > lib/librte_eal/common/rte_reciprocal.c | 116
> +++++++++++++++++++++---
> > > > lib/librte_eal/linuxapp/eal/rte_eal_version.map | 3 +-
> > > > lib/librte_sched/Makefile | 4 +-
> > > > lib/librte_sched/rte_sched.c | 9 +-
> > > > 6 files changed, 219 insertions(+), 25 deletions(-)
> > > >
> > > > diff --git a/lib/librte_eal/bsdapp/eal/rte_eal_version.map
> b/lib/librte_eal/bsdapp/eal/rte_eal_version.map
> > > > index 90d7258..59a85bb 100644
> > > > --- a/lib/librte_eal/bsdapp/eal/rte_eal_version.map
> > > > +++ b/lib/librte_eal/bsdapp/eal/rte_eal_version.map
> > > > @@ -241,6 +241,7 @@ EXPERIMENTAL {
> > > > DPDK_17.11 {
> > > > global:
> > > >
> > > > - rte_reciprocal_value;
> > > > + rte_reciprocal_value_u32;
> > > > + rte_reciprocal_value_u64;
> > > >
> > > > } DPDK_17.08;
> > > > diff --git a/lib/librte_eal/common/include/rte_reciprocal.h
> b/lib/librte_eal/common/include/rte_reciprocal.h
> > > > index b6d752f..85599e6 100644
> > > > --- a/lib/librte_eal/common/include/rte_reciprocal.h
> > > > +++ b/lib/librte_eal/common/include/rte_reciprocal.h
> > >
> > > Hi Pavan, sorry for commenting late but the license in v1 of this file
> > > states it cannot be removed. It is not included in later versions - can
> > > you explain why?
> > >
> > Hi Kevin,
> >
> > I have misinterpreted this mail
> > http://dpdk.org/ml/archives/dev/2017-August/073781.html,
> > any suggestion on how to proceed on this further?
> >
> > Thanks,
> > Pavan
>
> License issues need legal advice (TAB could ask LF if required).
> Sorry, I am a cynic engineer not a lawyer.
>
> Easiest solution is to find equivalent code in FreeBSD or some other project
> which does not have the restrictions.
How about just adding your copyright on the existing BSD license?
^ permalink raw reply [flat|nested] 11+ messages in thread
* Re: [dpdk-dev] [PATCH v6 1/3] eal: introduce integer divide through reciprocal
2017-09-06 10:21 [dpdk-dev] [PATCH v6 1/3] eal: introduce integer divide through reciprocal Pavan Nikhilesh
2017-09-06 10:21 ` [dpdk-dev] [PATCH v6 2/3] eal: add u64 bit variant for reciprocal Pavan Nikhilesh
2017-09-06 10:21 ` [dpdk-dev] [PATCH v6 3/3] test: add tests for reciprocal based division Pavan Nikhilesh
@ 2017-09-20 13:10 ` Dumitrescu, Cristian
2017-09-20 13:27 ` Pavan Nikhilesh Bhagavatula
2 siblings, 1 reply; 11+ messages in thread
From: Dumitrescu, Cristian @ 2017-09-20 13:10 UTC (permalink / raw)
To: Pavan Nikhilesh, stephen; +Cc: dev
Hi Pavan,
I think moving rte_reciprocal.[hc] to a common code area like EAL is a very good idea, so thanks for doing this work!
One ask from my side: please do not change the existing code.
1. Keep the existing name for the 32-bit API functions and data structures (no _u32 name suffix), add the _u64 suffix just for the new API functions that you add.
- If you want, you can create aliases with _32 name suffix for the existing 32-bit API
- The only change to rte_sched.c should be header include line: #include "rte_reciprocal.h" -> #include <rte_reciprocal.h>
2. Do not do any cosmetic changes in existing code in rte_reciprocal.[hc] (such as adding CR+LF), as they result in lots of code churn for no real value
Once these changes are done, the size of your patch set is reduced considerably.
> -----Original Message-----
> From: Pavan Nikhilesh [mailto:pbhagavatula@caviumnetworks.com]
> Sent: Wednesday, September 6, 2017 11:22 AM
> To: Dumitrescu, Cristian <cristian.dumitrescu@intel.com>;
> stephen@networkplumber.org
> Cc: dev@dpdk.org; Pavan Bhagavatula
> <pbhagavatula@caviumnetworks.com>
> Subject: [dpdk-dev] [PATCH v6 1/3] eal: introduce integer divide through
> reciprocal
>
> From: Pavan Bhagavatula <pbhagavatula@caviumnetworks.com>
>
> In some use cases of integer division, denominator remains constant and
> numerator varies. It is possible to optimize division for such specific
> scenarios.
>
> The librte_sched uses rte_reciprocal to optimize division so, moving it to
> eal/common would allow other libraries and applications to use it.
>
> Signed-off-by: Pavan Nikhilesh <pbhagavatula@caviumnetworks.com>
> Reviewed-by: Anatoly Burakov <anatoly.burakov@intel.com>
> ---
>
> v6 changes:
> - remove cache alignment from rte_reciprocal_u{32/64}structures as they
> would
> be embedded in other structures.
>
> v5 changes:
> - fix test print strings
>
> v4 changes:
> - minor fix for test cases
> - fix u32 divisor generation
>
> v3 changes:
> - fix x86_32 compilation issue
> - fix improper licence in test
>
> v2 changes:
> - fix compilation issues with .map files
> - add test cases for correctness and performance
> - remove extra licence inclusion
> - fix coding style issues
>
> lib/librte_eal/bsdapp/eal/Makefile | 1 +
> lib/librte_eal/bsdapp/eal/rte_eal_version.map | 7 +++++++
> lib/librte_eal/common/Makefile | 1 +
> lib/{librte_sched => librte_eal/common/include}/rte_reciprocal.h | 6 ++++--
> lib/{librte_sched => librte_eal/common}/rte_reciprocal.c | 6 ++++--
> lib/librte_eal/linuxapp/eal/Makefile | 1 +
> lib/librte_eal/linuxapp/eal/rte_eal_version.map | 7 +++++++
> lib/librte_sched/Makefile | 2 --
> lib/librte_sched/rte_sched.c | 2 +-
> 9 files changed, 26 insertions(+), 7 deletions(-)
> rename lib/{librte_sched => librte_eal/common/include}/rte_reciprocal.h
> (87%)
> rename lib/{librte_sched => librte_eal/common}/rte_reciprocal.c (96%)
>
> diff --git a/lib/librte_eal/bsdapp/eal/Makefile
> b/lib/librte_eal/bsdapp/eal/Makefile
> index 005019e..56f9804 100644
> --- a/lib/librte_eal/bsdapp/eal/Makefile
> +++ b/lib/librte_eal/bsdapp/eal/Makefile
> @@ -88,6 +88,7 @@ SRCS-$(CONFIG_RTE_EXEC_ENV_BSDAPP) +=
> malloc_elem.c
> SRCS-$(CONFIG_RTE_EXEC_ENV_BSDAPP) += malloc_heap.c
> SRCS-$(CONFIG_RTE_EXEC_ENV_BSDAPP) += rte_keepalive.c
> SRCS-$(CONFIG_RTE_EXEC_ENV_BSDAPP) += rte_service.c
> +SRCS-$(CONFIG_RTE_EXEC_ENV_BSDAPP) += rte_reciprocal.c
>
> # from arch dir
> SRCS-$(CONFIG_RTE_EXEC_ENV_BSDAPP) += rte_cpuflags.c
> diff --git a/lib/librte_eal/bsdapp/eal/rte_eal_version.map
> b/lib/librte_eal/bsdapp/eal/rte_eal_version.map
> index aac6fd7..90d7258 100644
> --- a/lib/librte_eal/bsdapp/eal/rte_eal_version.map
> +++ b/lib/librte_eal/bsdapp/eal/rte_eal_version.map
> @@ -237,3 +237,10 @@ EXPERIMENTAL {
> rte_service_unregister;
>
> } DPDK_17.08;
> +
> +DPDK_17.11 {
> + global:
> +
> + rte_reciprocal_value;
> +
> +} DPDK_17.08;
> diff --git a/lib/librte_eal/common/Makefile
> b/lib/librte_eal/common/Makefile
> index e8fd67a..a680b2d 100644
> --- a/lib/librte_eal/common/Makefile
> +++ b/lib/librte_eal/common/Makefile
> @@ -42,6 +42,7 @@ INC += rte_hexdump.h rte_devargs.h rte_bus.h
> rte_dev.h rte_vdev.h
> INC += rte_pci_dev_feature_defs.h rte_pci_dev_features.h
> INC += rte_malloc.h rte_keepalive.h rte_time.h
> INC += rte_service.h rte_service_component.h
> +INC += rte_reciprocal.h
>
> GENERIC_INC := rte_atomic.h rte_byteorder.h rte_cycles.h rte_prefetch.h
> GENERIC_INC += rte_spinlock.h rte_memcpy.h rte_cpuflags.h rte_rwlock.h
> diff --git a/lib/librte_sched/rte_reciprocal.h
> b/lib/librte_eal/common/include/rte_reciprocal.h
> similarity index 87%
> rename from lib/librte_sched/rte_reciprocal.h
> rename to lib/librte_eal/common/include/rte_reciprocal.h
> index 5e21f09..b6d752f 100644
> --- a/lib/librte_sched/rte_reciprocal.h
> +++ b/lib/librte_eal/common/include/rte_reciprocal.h
> @@ -29,13 +29,15 @@ struct rte_reciprocal {
> uint8_t sh1, sh2;
> };
>
> -static inline uint32_t rte_reciprocal_divide(uint32_t a, struct rte_reciprocal
> R)
> +static inline uint32_t
> +rte_reciprocal_divide(uint32_t a, struct rte_reciprocal R)
> {
> uint32_t t = (uint32_t)(((uint64_t)a * R.m) >> 32);
>
> return (t + ((a - t) >> R.sh1)) >> R.sh2;
> }
>
> -struct rte_reciprocal rte_reciprocal_value(uint32_t d);
> +struct rte_reciprocal
> +rte_reciprocal_value(uint32_t d);
>
Please remove these cosmetic changes that result in code churn for no real value.
> #endif /* _RTE_RECIPROCAL_H_ */
> diff --git a/lib/librte_sched/rte_reciprocal.c
> b/lib/librte_eal/common/rte_reciprocal.c
> similarity index 96%
> rename from lib/librte_sched/rte_reciprocal.c
> rename to lib/librte_eal/common/rte_reciprocal.c
> index 652f023..7ab99b4 100644
> --- a/lib/librte_sched/rte_reciprocal.c
> +++ b/lib/librte_eal/common/rte_reciprocal.c
> @@ -41,7 +41,8 @@
> /* find largest set bit.
> * portable and slow but does not matter for this usage.
> */
> -static inline int fls(uint32_t x)
> +static inline int
> +fls(uint32_t x)
> {
> int b;
>
> @@ -53,7 +54,8 @@ static inline int fls(uint32_t x)
> return 0;
> }
>
> -struct rte_reciprocal rte_reciprocal_value(uint32_t d)
> +struct rte_reciprocal
> +rte_reciprocal_value(uint32_t d)
> {
> struct rte_reciprocal R;
> uint64_t m;
Please remove these cosmetic changes that result in code churn for no real value.
> diff --git a/lib/librte_eal/linuxapp/eal/Makefile
> b/lib/librte_eal/linuxapp/eal/Makefile
> index 90bca4d..98f3b8e 100644
> --- a/lib/librte_eal/linuxapp/eal/Makefile
> +++ b/lib/librte_eal/linuxapp/eal/Makefile
> @@ -100,6 +100,7 @@ SRCS-$(CONFIG_RTE_EXEC_ENV_LINUXAPP) +=
> malloc_elem.c
> SRCS-$(CONFIG_RTE_EXEC_ENV_LINUXAPP) += malloc_heap.c
> SRCS-$(CONFIG_RTE_EXEC_ENV_LINUXAPP) += rte_keepalive.c
> SRCS-$(CONFIG_RTE_EXEC_ENV_LINUXAPP) += rte_service.c
> +SRCS-$(CONFIG_RTE_EXEC_ENV_LINUXAPP) += rte_reciprocal.c
>
> # from arch dir
> SRCS-$(CONFIG_RTE_EXEC_ENV_LINUXAPP) += rte_cpuflags.c
> diff --git a/lib/librte_eal/linuxapp/eal/rte_eal_version.map
> b/lib/librte_eal/linuxapp/eal/rte_eal_version.map
> index 3a8f154..2070cba 100644
> --- a/lib/librte_eal/linuxapp/eal/rte_eal_version.map
> +++ b/lib/librte_eal/linuxapp/eal/rte_eal_version.map
> @@ -242,3 +242,10 @@ EXPERIMENTAL {
> rte_service_unregister;
>
> } DPDK_17.08;
> +
> +DPDK_17.11 {
> + global:
> +
> + rte_reciprocal_value;
> +
> +} DPDK_17.08;
> diff --git a/lib/librte_sched/Makefile b/lib/librte_sched/Makefile
> index 18274e7..569656b 100644
> --- a/lib/librte_sched/Makefile
> +++ b/lib/librte_sched/Makefile
> @@ -52,10 +52,8 @@ LIBABIVER := 1
> # all source are stored in SRCS-y
> #
> SRCS-$(CONFIG_RTE_LIBRTE_SCHED) += rte_sched.c rte_red.c rte_approx.c
> -SRCS-$(CONFIG_RTE_LIBRTE_SCHED) += rte_reciprocal.c
>
> # install includes
> SYMLINK-$(CONFIG_RTE_LIBRTE_SCHED)-include := rte_sched.h
> rte_bitmap.h rte_sched_common.h rte_red.h rte_approx.h
> -SYMLINK-$(CONFIG_RTE_LIBRTE_SCHED)-include += rte_reciprocal.h
>
> include $(RTE_SDK)/mk/rte.lib.mk
> diff --git a/lib/librte_sched/rte_sched.c b/lib/librte_sched/rte_sched.c
> index b7cba11..3b8ccaa 100644
> --- a/lib/librte_sched/rte_sched.c
> +++ b/lib/librte_sched/rte_sched.c
> @@ -42,12 +42,12 @@
> #include <rte_prefetch.h>
> #include <rte_branch_prediction.h>
> #include <rte_mbuf.h>
> +#include <rte_reciprocal.h>
>
> #include "rte_sched.h"
> #include "rte_bitmap.h"
> #include "rte_sched_common.h"
> #include "rte_approx.h"
> -#include "rte_reciprocal.h"
>
> #ifdef __INTEL_COMPILER
> #pragma warning(disable:2259) /* conversion may lose significant bits */
> --
> 2.7.4
Regards,
Cristian
^ permalink raw reply [flat|nested] 11+ messages in thread
* Re: [dpdk-dev] [PATCH v6 2/3] eal: add u64 bit variant for reciprocal
2017-09-06 10:21 ` [dpdk-dev] [PATCH v6 2/3] eal: add u64 bit variant for reciprocal Pavan Nikhilesh
2017-09-06 12:28 ` Kevin Traynor
@ 2017-09-20 13:15 ` Dumitrescu, Cristian
1 sibling, 0 replies; 11+ messages in thread
From: Dumitrescu, Cristian @ 2017-09-20 13:15 UTC (permalink / raw)
To: Pavan Nikhilesh, stephen; +Cc: dev
Hi Pavan,
Same ask as for the first patch:
-Do not change existing code in rte_reciprocal.[hc]: no _u32 suffix, please
-Do not add lots of CR+LF to existing code
> -----Original Message-----
> From: Pavan Nikhilesh [mailto:pbhagavatula@caviumnetworks.com]
> Sent: Wednesday, September 6, 2017 11:22 AM
> To: Dumitrescu, Cristian <cristian.dumitrescu@intel.com>;
> stephen@networkplumber.org
> Cc: dev@dpdk.org; Pavan Bhagavatula
> <pbhagavatula@caviumnetworks.com>
> Subject: [dpdk-dev] [PATCH v6 2/3] eal: add u64 bit variant for reciprocal
>
> From: Pavan Bhagavatula <pbhagavatula@caviumnetworks.com>
>
> Currently, rte_reciprocal only supports unsigned 32bit divisors. This
> commit adds support for unsigned 64bit divisors.
>
> Rename unsigned 32bit specific functions appropriately and update
> librte_sched accordingly.
>
> Signed-off-by: Pavan Nikhilesh <pbhagavatula@caviumnetworks.com>
> ---
> lib/librte_eal/bsdapp/eal/rte_eal_version.map | 3 +-
> lib/librte_eal/common/include/rte_reciprocal.h | 109
> ++++++++++++++++++++--
> lib/librte_eal/common/rte_reciprocal.c | 116
> +++++++++++++++++++++---
> lib/librte_eal/linuxapp/eal/rte_eal_version.map | 3 +-
> lib/librte_sched/Makefile | 4 +-
> lib/librte_sched/rte_sched.c | 9 +-
> 6 files changed, 219 insertions(+), 25 deletions(-)
>
> diff --git a/lib/librte_eal/bsdapp/eal/rte_eal_version.map
> b/lib/librte_eal/bsdapp/eal/rte_eal_version.map
> index 90d7258..59a85bb 100644
> --- a/lib/librte_eal/bsdapp/eal/rte_eal_version.map
> +++ b/lib/librte_eal/bsdapp/eal/rte_eal_version.map
> @@ -241,6 +241,7 @@ EXPERIMENTAL {
> DPDK_17.11 {
> global:
>
> - rte_reciprocal_value;
> + rte_reciprocal_value_u32;
> + rte_reciprocal_value_u64;
>
> } DPDK_17.08;
> diff --git a/lib/librte_eal/common/include/rte_reciprocal.h
> b/lib/librte_eal/common/include/rte_reciprocal.h
> index b6d752f..85599e6 100644
> --- a/lib/librte_eal/common/include/rte_reciprocal.h
> +++ b/lib/librte_eal/common/include/rte_reciprocal.h
> @@ -22,22 +22,117 @@
> #ifndef _RTE_RECIPROCAL_H_
> #define _RTE_RECIPROCAL_H_
>
> -#include <stdint.h>
> +#include <rte_memory.h>
>
> -struct rte_reciprocal {
> +/**
> + * Unsigned 32-bit divisor structure.
> + */
> +struct rte_reciprocal_u32 {
> uint32_t m;
> uint8_t sh1, sh2;
> };
>
Do not add _32 suffix for exiting function, no name change, please.
> +/**
> + * Unsigned 64-bit divisor structure.
> + */
> +struct rte_reciprocal_u64 {
> + uint64_t m;
> + uint8_t sh1;
> +};
> +
I am OK with adding +64 suffix for new API.
> +/**
> + * Divide given unsigned 32-bit integer with pre calculated divisor.
> + *
> + * @param a
> + * The 32-bit dividend.
> + * @param R
> + * The pointer to pre calculated divisor reciprocal structure.
> + *
> + * @return
> + * The result of the division
> + */
> static inline uint32_t
> -rte_reciprocal_divide(uint32_t a, struct rte_reciprocal R)
> +rte_reciprocal_divide_u32(uint32_t a, struct rte_reciprocal_u32 *R)
> {
> - uint32_t t = (uint32_t)(((uint64_t)a * R.m) >> 32);
> + uint32_t t = (((uint64_t)a * R->m) >> 32);
>
> - return (t + ((a - t) >> R.sh1)) >> R.sh2;
> + return (t + ((a - t) >> R->sh1)) >> R->sh2;
> }
Do not add _u32 suffix for existing API.
>
> -struct rte_reciprocal
> -rte_reciprocal_value(uint32_t d);
> +static inline uint64_t
> +mullhi_u64(uint64_t x, uint64_t y)
> +{
> +#ifdef __SIZEOF_INT128__
> + __uint128_t xl = x;
> + __uint128_t rl = xl * y;
> +
> + return (rl >> 64);
> +#else
> + uint64_t u0, u1, v0, v1, k, t;
> + uint64_t w1, w2;
> + uint64_t whi;
> +
> + u1 = x >> 32; u0 = x & 0xFFFFFFFF;
> + v1 = y >> 32; v0 = y & 0xFFFFFFFF;
> +
> + t = u0*v0;
> + k = t >> 32;
> +
> + t = u1*v0 + k;
> + w1 = t & 0xFFFFFFFF;
> + w2 = t >> 32;
> +
> + t = u0*v1 + w1;
> + k = t >> 32;
> +
> + whi = u1*v1 + w2 + k;
> +
> + return whi;
> +#endif
> +}
> +
> +/**
> + * Divide given unsigned 64-bit integer with pre calculated divisor.
> + *
> + * @param a
> + * The 64-bit dividend.
> + * @param R
> + * The pointer to pre calculated divisor reciprocal structure.
> + *
> + * @return
> + * The result of the division
> + */
> +static inline uint64_t
> +rte_reciprocal_divide_u64(uint64_t a, struct rte_reciprocal_u64 *R)
> +{
> + uint64_t q = mullhi_u64(R->m, a);
> + uint64_t t = ((a - q) >> 1) + q;
> +
> + return t >> R->sh1;
> +}
> +
> +/**
> + * Generate pre calculated divisor structure.
> + *
> + * @param d
> + * The unsigned 32-bit divisor.
> + *
> + * @return
> + * Divisor structure.
> + */
> +struct rte_reciprocal_u32
> +rte_reciprocal_value_u32(uint32_t d);
> +
Do not add _u32 suffix for existing API.
> +/**
> + * Generate pre calculated divisor structure.
> + *
> + * @param d
> + * The unsigned 64-bit divisor.
> + *
> + * @return
> + * Divisor structure.
> + */
> +struct rte_reciprocal_u64
> +rte_reciprocal_value_u64(uint64_t d);
>
> #endif /* _RTE_RECIPROCAL_H_ */
> diff --git a/lib/librte_eal/common/rte_reciprocal.c
> b/lib/librte_eal/common/rte_reciprocal.c
> index 7ab99b4..2024e62 100644
> --- a/lib/librte_eal/common/rte_reciprocal.c
> +++ b/lib/librte_eal/common/rte_reciprocal.c
> @@ -31,18 +31,13 @@
> * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH
> DAMAGE.
> */
>
> -#include <stdio.h>
> -#include <stdint.h>
> -
> -#include <rte_common.h>
> -
> -#include "rte_reciprocal.h"
> +#include <rte_reciprocal.h>
>
> /* find largest set bit.
> * portable and slow but does not matter for this usage.
> */
> static inline int
> -fls(uint32_t x)
> +fls_u32(uint32_t x)
> {
> int b;
>
> @@ -54,14 +49,14 @@ fls(uint32_t x)
> return 0;
> }
>
Do not add _u32 suffix for existing API.
> -struct rte_reciprocal
> -rte_reciprocal_value(uint32_t d)
> +struct rte_reciprocal_u32
> +rte_reciprocal_value_u32(uint32_t d)
Do not add _u32 suffix for existing API.
> {
> - struct rte_reciprocal R;
> + struct rte_reciprocal_u32 R;
> uint64_t m;
> int l;
>
> - l = fls(d - 1);
> + l = fls_u32(d - 1);
> m = ((1ULL << 32) * ((1ULL << l) - d));
> m /= d;
>
> @@ -72,3 +67,102 @@ rte_reciprocal_value(uint32_t d)
>
> return R;
> }
> +
> +/* Code taken from Hacker's Delight:
> + * http://www.hackersdelight.org/HDcode/divlu.c.
> + * License permits inclusion here per:
> + * http://www.hackersdelight.org/permissions.htm
> + */
> +static inline uint64_t
> +divide_128_div_64_to_64(uint64_t u1, uint64_t u0, uint64_t v, uint64_t *r)
> +{
> + const uint64_t b = (1ULL << 32); /* Number base (16 bits). */
> + uint64_t un1, un0, /* Norm. dividend LSD's. */
> + vn1, vn0, /* Norm. divisor digits. */
> + q1, q0, /* Quotient digits. */
> + un64, un21, un10, /* Dividend digit pairs. */
> + rhat; /* A remainder. */
> + int s; /* Shift amount for norm. */
> +
> + /* If overflow, set rem. to an impossible value. */
> + if (u1 >= v) {
> + if (r != NULL)
> + *r = (uint64_t) -1;
> + return (uint64_t) -1;
> + }
> +
> + /* Count leading zeros. */
> + s = __builtin_clzll(v);
> + if (s > 0) {
> + v = v << s;
> + un64 = (u1 << s) | ((u0 >> (64 - s)) & (-s >> 31));
> + un10 = u0 << s;
> + } else {
> +
> + un64 = u1 | u0;
> + un10 = u0;
> + }
> +
> + vn1 = v >> 32;
> + vn0 = v & 0xFFFFFFFF;
> +
> + un1 = un10 >> 32;
> + un0 = un10 & 0xFFFFFFFF;
> +
> + q1 = un64/vn1;
> + rhat = un64 - q1*vn1;
> +again1:
> + if (q1 >= b || q1*vn0 > b*rhat + un1) {
> + q1 = q1 - 1;
> + rhat = rhat + vn1;
> + if (rhat < b)
> + goto again1;
> + }
> +
> + un21 = un64*b + un1 - q1*v;
> +
> + q0 = un21/vn1;
> + rhat = un21 - q0*vn1;
> +again2:
> + if (q0 >= b || q0*vn0 > b*rhat + un0) {
> + q0 = q0 - 1;
> + rhat = rhat + vn1;
> + if (rhat < b)
> + goto again2;
> + }
> +
> + if (r != NULL)
> + *r = (un21*b + un0 - q0*v) >> s;
> + return q1*b + q0;
> +}
> +
> +struct rte_reciprocal_u64
> +rte_reciprocal_value_u64(uint64_t d)
> +{
> + struct rte_reciprocal_u64 R;
> +
> + const uint32_t fld = 63 - __builtin_clzll(d);
> +
> + if ((d & (d - 1)) == 0) {
> + R.m = 0;
> + R.sh1 = (fld - 1) | 0x40;
> + } else {
> + uint64_t rem;
> + uint64_t multiplier;
> + uint8_t more;
> +
> + multiplier = divide_128_div_64_to_64(1ULL << fld, 0, d,
> &rem);
> + multiplier += multiplier;
> +
> + const uint64_t twice_rem = rem + rem;
> + if (twice_rem >= d || twice_rem < rem)
> + multiplier += 1;
> + more = fld;
> + R.m = 1 + multiplier;
> + R.sh1 = more | 0x40;
> + }
> +
> + R.sh1 &= 0x3F;
> +
> + return R;
> +}
> diff --git a/lib/librte_eal/linuxapp/eal/rte_eal_version.map
> b/lib/librte_eal/linuxapp/eal/rte_eal_version.map
> index 2070cba..2671627 100644
> --- a/lib/librte_eal/linuxapp/eal/rte_eal_version.map
> +++ b/lib/librte_eal/linuxapp/eal/rte_eal_version.map
> @@ -246,6 +246,7 @@ EXPERIMENTAL {
> DPDK_17.11 {
> global:
>
> - rte_reciprocal_value;
> + rte_reciprocal_value_u32;
Do not add _u32 suffix for existing API.
> + rte_reciprocal_value_u64;
>
> } DPDK_17.08;
> diff --git a/lib/librte_sched/Makefile b/lib/librte_sched/Makefile
> index 569656b..a2fd6f3 100644
> --- a/lib/librte_sched/Makefile
> +++ b/lib/librte_sched/Makefile
> @@ -54,6 +54,8 @@ LIBABIVER := 1
> SRCS-$(CONFIG_RTE_LIBRTE_SCHED) += rte_sched.c rte_red.c rte_approx.c
>
> # install includes
> -SYMLINK-$(CONFIG_RTE_LIBRTE_SCHED)-include := rte_sched.h
> rte_bitmap.h rte_sched_common.h rte_red.h rte_approx.h
> +SYMLINK-$(CONFIG_RTE_LIBRTE_SCHED)-include := rte_sched.h
> rte_bitmap.h
> +SYMLINK-$(CONFIG_RTE_LIBRTE_SCHED)-include += rte_sched_common.h
> rte_red.h
> +SYMLINK-$(CONFIG_RTE_LIBRTE_SCHED)-include += rte_approx.h
>
> include $(RTE_SDK)/mk/rte.lib.mk
> diff --git a/lib/librte_sched/rte_sched.c b/lib/librte_sched/rte_sched.c
> index 3b8ccaa..7bb6d51 100644
> --- a/lib/librte_sched/rte_sched.c
> +++ b/lib/librte_sched/rte_sched.c
> @@ -228,7 +228,7 @@ struct rte_sched_port {
> uint64_t time_cpu_cycles; /* Current CPU time measured in CPU
> cyles */
> uint64_t time_cpu_bytes; /* Current CPU time measured in bytes
> */
> uint64_t time; /* Current NIC TX time measured in bytes */
> - struct rte_reciprocal inv_cycles_per_byte; /* CPU cycles per byte */
> + struct rte_reciprocal_u32 inv_cycles_per_byte; /* CPU cycles per
> byte */
>
> /* Scheduling loop detection */
> uint32_t pipe_loop;
> @@ -677,7 +677,7 @@ rte_sched_port_config(struct
> rte_sched_port_params *params)
>
> cycles_per_byte = (rte_get_tsc_hz() << RTE_SCHED_TIME_SHIFT)
> / params->rate;
> - port->inv_cycles_per_byte = rte_reciprocal_value(cycles_per_byte);
> + port->inv_cycles_per_byte =
> rte_reciprocal_value_u32(cycles_per_byte);
>
Do not add _u32 suffix for existing API.
> /* Scheduling loop detection */
> port->pipe_loop = RTE_SCHED_PIPE_INVALID;
> @@ -2147,8 +2147,9 @@ rte_sched_port_time_resync(struct
> rte_sched_port *port)
> uint64_t bytes_diff;
>
> /* Compute elapsed time in bytes */
> - bytes_diff = rte_reciprocal_divide(cycles_diff <<
> RTE_SCHED_TIME_SHIFT,
> - port->inv_cycles_per_byte);
> + bytes_diff = rte_reciprocal_divide_u32(
Do not add _u32 suffix for existing API.
> + cycles_diff << RTE_SCHED_TIME_SHIFT,
> + &port->inv_cycles_per_byte);
>
> /* Advance port time */
> port->time_cpu_cycles = cycles;
> --
> 2.7.4
^ permalink raw reply [flat|nested] 11+ messages in thread
* Re: [dpdk-dev] [PATCH v6 1/3] eal: introduce integer divide through reciprocal
2017-09-20 13:10 ` [dpdk-dev] [PATCH v6 1/3] eal: introduce integer divide through reciprocal Dumitrescu, Cristian
@ 2017-09-20 13:27 ` Pavan Nikhilesh Bhagavatula
0 siblings, 0 replies; 11+ messages in thread
From: Pavan Nikhilesh Bhagavatula @ 2017-09-20 13:27 UTC (permalink / raw)
To: Dumitrescu, Cristian, stephen; +Cc: dev
On Wed, Sep 20, 2017 at 01:10:53PM +0000, Dumitrescu, Cristian wrote:
> Hi Pavan,
Hi Cristian,
>
> I think moving rte_reciprocal.[hc] to a common code area like EAL is a very good idea, so thanks for doing this work!
>
> One ask from my side: please do not change the existing code.
> 1. Keep the existing name for the 32-bit API functions and data structures (no _u32 name suffix), add the _u64 suffix just for the new API functions that you add.
> - If you want, you can create aliases with _32 name suffix for the existing 32-bit API
> - The only change to rte_sched.c should be header include line: #include "rte_reciprocal.h" -> #include <rte_reciprocal.h>
> 2. Do not do any cosmetic changes in existing code in rte_reciprocal.[hc] (such as adding CR+LF), as they result in lots of code churn for no real value
>
> Once these changes are done, the size of your patch set is reduced considerably.
>
Will do the changes once the licencing issues get sorted out(v7).
-Pavan
>
> > -----Original Message-----
> > From: Pavan Nikhilesh [mailto:pbhagavatula@caviumnetworks.com]
> > Sent: Wednesday, September 6, 2017 11:22 AM
> > To: Dumitrescu, Cristian <cristian.dumitrescu@intel.com>;
> > stephen@networkplumber.org
> > Cc: dev@dpdk.org; Pavan Bhagavatula
> > <pbhagavatula@caviumnetworks.com>
> > Subject: [dpdk-dev] [PATCH v6 1/3] eal: introduce integer divide through
> > reciprocal
> >
> > From: Pavan Bhagavatula <pbhagavatula@caviumnetworks.com>
> >
> > In some use cases of integer division, denominator remains constant and
> > numerator varies. It is possible to optimize division for such specific
> > scenarios.
> >
> > The librte_sched uses rte_reciprocal to optimize division so, moving it to
> > eal/common would allow other libraries and applications to use it.
> >
> > Signed-off-by: Pavan Nikhilesh <pbhagavatula@caviumnetworks.com>
> > Reviewed-by: Anatoly Burakov <anatoly.burakov@intel.com>
> > ---
> >
> > v6 changes:
> > - remove cache alignment from rte_reciprocal_u{32/64}structures as they
> > would
> > be embedded in other structures.
> >
> > v5 changes:
> > - fix test print strings
> >
> > v4 changes:
> > - minor fix for test cases
> > - fix u32 divisor generation
> >
> > v3 changes:
> > - fix x86_32 compilation issue
> > - fix improper licence in test
> >
> > v2 changes:
> > - fix compilation issues with .map files
> > - add test cases for correctness and performance
> > - remove extra licence inclusion
> > - fix coding style issues
> >
> > lib/librte_eal/bsdapp/eal/Makefile | 1 +
> > lib/librte_eal/bsdapp/eal/rte_eal_version.map | 7 +++++++
> > lib/librte_eal/common/Makefile | 1 +
> > lib/{librte_sched => librte_eal/common/include}/rte_reciprocal.h | 6 ++++--
> > lib/{librte_sched => librte_eal/common}/rte_reciprocal.c | 6 ++++--
> > lib/librte_eal/linuxapp/eal/Makefile | 1 +
> > lib/librte_eal/linuxapp/eal/rte_eal_version.map | 7 +++++++
> > lib/librte_sched/Makefile | 2 --
> > lib/librte_sched/rte_sched.c | 2 +-
> > 9 files changed, 26 insertions(+), 7 deletions(-)
> > rename lib/{librte_sched => librte_eal/common/include}/rte_reciprocal.h
> > (87%)
> > rename lib/{librte_sched => librte_eal/common}/rte_reciprocal.c (96%)
> >
> > diff --git a/lib/librte_eal/bsdapp/eal/Makefile
> > b/lib/librte_eal/bsdapp/eal/Makefile
> > index 005019e..56f9804 100644
> > --- a/lib/librte_eal/bsdapp/eal/Makefile
> > +++ b/lib/librte_eal/bsdapp/eal/Makefile
> > @@ -88,6 +88,7 @@ SRCS-$(CONFIG_RTE_EXEC_ENV_BSDAPP) +=
> > malloc_elem.c
> > SRCS-$(CONFIG_RTE_EXEC_ENV_BSDAPP) += malloc_heap.c
> > SRCS-$(CONFIG_RTE_EXEC_ENV_BSDAPP) += rte_keepalive.c
> > SRCS-$(CONFIG_RTE_EXEC_ENV_BSDAPP) += rte_service.c
> > +SRCS-$(CONFIG_RTE_EXEC_ENV_BSDAPP) += rte_reciprocal.c
> >
> > # from arch dir
> > SRCS-$(CONFIG_RTE_EXEC_ENV_BSDAPP) += rte_cpuflags.c
> > diff --git a/lib/librte_eal/bsdapp/eal/rte_eal_version.map
> > b/lib/librte_eal/bsdapp/eal/rte_eal_version.map
> > index aac6fd7..90d7258 100644
> > --- a/lib/librte_eal/bsdapp/eal/rte_eal_version.map
> > +++ b/lib/librte_eal/bsdapp/eal/rte_eal_version.map
> > @@ -237,3 +237,10 @@ EXPERIMENTAL {
> > rte_service_unregister;
> >
> > } DPDK_17.08;
> > +
> > +DPDK_17.11 {
> > + global:
> > +
> > + rte_reciprocal_value;
> > +
> > +} DPDK_17.08;
> > diff --git a/lib/librte_eal/common/Makefile
> > b/lib/librte_eal/common/Makefile
> > index e8fd67a..a680b2d 100644
> > --- a/lib/librte_eal/common/Makefile
> > +++ b/lib/librte_eal/common/Makefile
> > @@ -42,6 +42,7 @@ INC += rte_hexdump.h rte_devargs.h rte_bus.h
> > rte_dev.h rte_vdev.h
> > INC += rte_pci_dev_feature_defs.h rte_pci_dev_features.h
> > INC += rte_malloc.h rte_keepalive.h rte_time.h
> > INC += rte_service.h rte_service_component.h
> > +INC += rte_reciprocal.h
> >
> > GENERIC_INC := rte_atomic.h rte_byteorder.h rte_cycles.h rte_prefetch.h
> > GENERIC_INC += rte_spinlock.h rte_memcpy.h rte_cpuflags.h rte_rwlock.h
> > diff --git a/lib/librte_sched/rte_reciprocal.h
> > b/lib/librte_eal/common/include/rte_reciprocal.h
> > similarity index 87%
> > rename from lib/librte_sched/rte_reciprocal.h
> > rename to lib/librte_eal/common/include/rte_reciprocal.h
> > index 5e21f09..b6d752f 100644
> > --- a/lib/librte_sched/rte_reciprocal.h
> > +++ b/lib/librte_eal/common/include/rte_reciprocal.h
> > @@ -29,13 +29,15 @@ struct rte_reciprocal {
> > uint8_t sh1, sh2;
> > };
> >
> > -static inline uint32_t rte_reciprocal_divide(uint32_t a, struct rte_reciprocal
> > R)
> > +static inline uint32_t
> > +rte_reciprocal_divide(uint32_t a, struct rte_reciprocal R)
> > {
> > uint32_t t = (uint32_t)(((uint64_t)a * R.m) >> 32);
> >
> > return (t + ((a - t) >> R.sh1)) >> R.sh2;
> > }
> >
> > -struct rte_reciprocal rte_reciprocal_value(uint32_t d);
> > +struct rte_reciprocal
> > +rte_reciprocal_value(uint32_t d);
> >
>
> Please remove these cosmetic changes that result in code churn for no real value.
>
> > #endif /* _RTE_RECIPROCAL_H_ */
> > diff --git a/lib/librte_sched/rte_reciprocal.c
> > b/lib/librte_eal/common/rte_reciprocal.c
> > similarity index 96%
> > rename from lib/librte_sched/rte_reciprocal.c
> > rename to lib/librte_eal/common/rte_reciprocal.c
> > index 652f023..7ab99b4 100644
> > --- a/lib/librte_sched/rte_reciprocal.c
> > +++ b/lib/librte_eal/common/rte_reciprocal.c
> > @@ -41,7 +41,8 @@
> > /* find largest set bit.
> > * portable and slow but does not matter for this usage.
> > */
> > -static inline int fls(uint32_t x)
> > +static inline int
> > +fls(uint32_t x)
> > {
> > int b;
> >
> > @@ -53,7 +54,8 @@ static inline int fls(uint32_t x)
> > return 0;
> > }
> >
> > -struct rte_reciprocal rte_reciprocal_value(uint32_t d)
> > +struct rte_reciprocal
> > +rte_reciprocal_value(uint32_t d)
> > {
> > struct rte_reciprocal R;
> > uint64_t m;
>
> Please remove these cosmetic changes that result in code churn for no real value.
>
> > diff --git a/lib/librte_eal/linuxapp/eal/Makefile
> > b/lib/librte_eal/linuxapp/eal/Makefile
> > index 90bca4d..98f3b8e 100644
> > --- a/lib/librte_eal/linuxapp/eal/Makefile
> > +++ b/lib/librte_eal/linuxapp/eal/Makefile
> > @@ -100,6 +100,7 @@ SRCS-$(CONFIG_RTE_EXEC_ENV_LINUXAPP) +=
> > malloc_elem.c
> > SRCS-$(CONFIG_RTE_EXEC_ENV_LINUXAPP) += malloc_heap.c
> > SRCS-$(CONFIG_RTE_EXEC_ENV_LINUXAPP) += rte_keepalive.c
> > SRCS-$(CONFIG_RTE_EXEC_ENV_LINUXAPP) += rte_service.c
> > +SRCS-$(CONFIG_RTE_EXEC_ENV_LINUXAPP) += rte_reciprocal.c
> >
> > # from arch dir
> > SRCS-$(CONFIG_RTE_EXEC_ENV_LINUXAPP) += rte_cpuflags.c
> > diff --git a/lib/librte_eal/linuxapp/eal/rte_eal_version.map
> > b/lib/librte_eal/linuxapp/eal/rte_eal_version.map
> > index 3a8f154..2070cba 100644
> > --- a/lib/librte_eal/linuxapp/eal/rte_eal_version.map
> > +++ b/lib/librte_eal/linuxapp/eal/rte_eal_version.map
> > @@ -242,3 +242,10 @@ EXPERIMENTAL {
> > rte_service_unregister;
> >
> > } DPDK_17.08;
> > +
> > +DPDK_17.11 {
> > + global:
> > +
> > + rte_reciprocal_value;
> > +
> > +} DPDK_17.08;
> > diff --git a/lib/librte_sched/Makefile b/lib/librte_sched/Makefile
> > index 18274e7..569656b 100644
> > --- a/lib/librte_sched/Makefile
> > +++ b/lib/librte_sched/Makefile
> > @@ -52,10 +52,8 @@ LIBABIVER := 1
> > # all source are stored in SRCS-y
> > #
> > SRCS-$(CONFIG_RTE_LIBRTE_SCHED) += rte_sched.c rte_red.c rte_approx.c
> > -SRCS-$(CONFIG_RTE_LIBRTE_SCHED) += rte_reciprocal.c
> >
> > # install includes
> > SYMLINK-$(CONFIG_RTE_LIBRTE_SCHED)-include := rte_sched.h
> > rte_bitmap.h rte_sched_common.h rte_red.h rte_approx.h
> > -SYMLINK-$(CONFIG_RTE_LIBRTE_SCHED)-include += rte_reciprocal.h
> >
> > include $(RTE_SDK)/mk/rte.lib.mk
> > diff --git a/lib/librte_sched/rte_sched.c b/lib/librte_sched/rte_sched.c
> > index b7cba11..3b8ccaa 100644
> > --- a/lib/librte_sched/rte_sched.c
> > +++ b/lib/librte_sched/rte_sched.c
> > @@ -42,12 +42,12 @@
> > #include <rte_prefetch.h>
> > #include <rte_branch_prediction.h>
> > #include <rte_mbuf.h>
> > +#include <rte_reciprocal.h>
> >
> > #include "rte_sched.h"
> > #include "rte_bitmap.h"
> > #include "rte_sched_common.h"
> > #include "rte_approx.h"
> > -#include "rte_reciprocal.h"
> >
> > #ifdef __INTEL_COMPILER
> > #pragma warning(disable:2259) /* conversion may lose significant bits */
> > --
> > 2.7.4
>
> Regards,
> Cristian
>
^ permalink raw reply [flat|nested] 11+ messages in thread
end of thread, other threads:[~2017-09-20 13:28 UTC | newest]
Thread overview: 11+ messages (download: mbox.gz / follow: Atom feed)
-- links below jump to the message on this page --
2017-09-06 10:21 [dpdk-dev] [PATCH v6 1/3] eal: introduce integer divide through reciprocal Pavan Nikhilesh
2017-09-06 10:21 ` [dpdk-dev] [PATCH v6 2/3] eal: add u64 bit variant for reciprocal Pavan Nikhilesh
2017-09-06 12:28 ` Kevin Traynor
2017-09-06 14:41 ` Pavan Nikhilesh Bhagavatula
2017-09-06 15:35 ` Kevin Traynor
2017-09-06 15:37 ` Stephen Hemminger
2017-09-06 17:05 ` Dumitrescu, Cristian
2017-09-20 13:15 ` Dumitrescu, Cristian
2017-09-06 10:21 ` [dpdk-dev] [PATCH v6 3/3] test: add tests for reciprocal based division Pavan Nikhilesh
2017-09-20 13:10 ` [dpdk-dev] [PATCH v6 1/3] eal: introduce integer divide through reciprocal Dumitrescu, Cristian
2017-09-20 13:27 ` Pavan Nikhilesh Bhagavatula
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for NNTP newsgroup(s).