From: David Marchand <david.marchand@6wind.com>
To: Bruce Richardson <bruce.richardson@intel.com>
Cc: "dev@dpdk.org" <dev@dpdk.org>
Subject: Re: [dpdk-dev] [PATCH v3 1/3] eal: enable uio_pci_generic support
Date: Mon, 23 Feb 2015 16:24:31 +0100 [thread overview]
Message-ID: <CALwxeUv6HT-UJu3s9P8CCKkWN77c52fqBJem2XVq-+7pmedu5Q@mail.gmail.com> (raw)
In-Reply-To: <1424451557-27419-2-git-send-email-bruce.richardson@intel.com>
Hello,
Ok this is coming too late, but anyway, my comments.
On Fri, Feb 20, 2015 at 5:59 PM, Bruce Richardson <
bruce.richardson@intel.com> wrote:
[snip]
diff --git a/lib/librte_eal/linuxapp/eal/eal_pci_uio.c
> b/lib/librte_eal/linuxapp/eal/eal_pci_uio.c
> index 54cce08..2b16fcb 100644
> --- a/lib/librte_eal/linuxapp/eal/eal_pci_uio.c
> +++ b/lib/librte_eal/linuxapp/eal/eal_pci_uio.c
> @@ -36,6 +36,7 @@
> #include <dirent.h>
> #include <sys/stat.h>
> #include <sys/mman.h>
> +#include <linux/pci_regs.h>
>
> #include <rte_log.h>
> #include <rte_pci.h>
> @@ -47,71 +48,73 @@
> #include "eal_filesystem.h"
> #include "eal_pci_init.h"
>
> -static int pci_parse_sysfs_value(const char *filename, uint64_t *val);
> -
> void *pci_map_addr = NULL;
>
>
> #define OFF_MAX ((uint64_t)(off_t)-1)
> static int
> -pci_uio_get_mappings(const char *devname, struct pci_map maps[], int
> nb_maps)
> +pci_uio_get_mappings(struct rte_pci_device *dev,
> + struct pci_map maps[], int nb_maps)
> {
> - int i;
> - char dirname[PATH_MAX];
> + struct rte_pci_addr *loc = &dev->addr;
> + int i = 0;
> char filename[PATH_MAX];
> - uint64_t offset, size;
> + unsigned long long start_addr, end_addr, flags;
> + FILE *f;
>
> - for (i = 0; i != nb_maps; i++) {
> + snprintf(filename, sizeof(filename),
> + SYSFS_PCI_DEVICES "/" PCI_PRI_FMT "/resource",
> + loc->domain, loc->bus, loc->devid, loc->function);
>
> - /* check if map directory exists */
> - snprintf(dirname, sizeof(dirname),
> - "%s/maps/map%u", devname, i);
> -
> - if (access(dirname, F_OK) != 0)
> - break;
> + f = fopen(filename, "r");
> + if (f == NULL) {
> + RTE_LOG(ERR, EAL,
> + "%s(): cannot open sysfs %s\n",
> + __func__, filename);
> + return -1;
> + }
>
> - /* get mapping offset */
> - snprintf(filename, sizeof(filename),
> - "%s/offset", dirname);
> - if (pci_parse_sysfs_value(filename, &offset) < 0) {
> - RTE_LOG(ERR, EAL,
> - "%s(): cannot parse offset of %s\n",
> - __func__, dirname);
> - return -1;
> + while (fscanf(f, "%llx %llx %llx", &start_addr,
> + &end_addr, &flags) == 3 && i < nb_maps) {
> + if (flags & IORESOURCE_MEM) {
> + maps[i].offset = 0x0;
> + maps[i].size = end_addr - start_addr + 1;
> + maps[i].phaddr = start_addr;
> + i++;
> }
> + }
> + fclose(f);
>
> - /* get mapping size */
> - snprintf(filename, sizeof(filename),
> - "%s/size", dirname);
> - if (pci_parse_sysfs_value(filename, &size) < 0) {
> - RTE_LOG(ERR, EAL,
> - "%s(): cannot parse size of %s\n",
> - __func__, dirname);
> - return -1;
> - }
> + return i;
> +}
>
> - /* get mapping physical address */
> - snprintf(filename, sizeof(filename),
> - "%s/addr", dirname);
> - if (pci_parse_sysfs_value(filename, &maps[i].phaddr) < 0) {
> - RTE_LOG(ERR, EAL,
> - "%s(): cannot parse addr of %s\n",
> - __func__, dirname);
> - return -1;
> - }
>
This function ends up reinventing the wheel from eal_pci.c plus it adds
some new array with mappings in them but not indexed the same way as
eal_pci.c see comments at the end of this mail.
> +static int
> +pci_uio_set_bus_master(int dev_fd)
> +{
> + uint16_t reg;
> + int ret;
>
> - if ((offset > OFF_MAX) || (size > SIZE_MAX)) {
> - RTE_LOG(ERR, EAL,
> - "%s(): offset/size exceed system max
> value\n",
> - __func__);
> - return -1;
> - }
> + ret = pread(dev_fd, ®, sizeof(reg), PCI_COMMAND);
> + if (ret != sizeof(reg)) {
> + RTE_LOG(ERR, EAL,
> + "Cannot read command from PCI config space!\n");
> + return -1;
> + }
> +
> + /* return if bus mastering is already on */
> + if (reg & PCI_COMMAND_MASTER)
> + return 0;
> +
> + reg |= PCI_COMMAND_MASTER;
>
> - maps[i].offset = offset;
> - maps[i].size = size;
> + ret = pwrite(dev_fd, ®, sizeof(reg), PCI_COMMAND);
> + if (ret != sizeof(reg)) {
> + RTE_LOG(ERR, EAL,
> + "Cannot write command to PCI config space!\n");
> + return -1;
> }
>
> - return i;
> + return 0;
> }
>
It would have been the good time to have a generic api to access pci config
space.
Something like what Stephen proposed.
> static int
> @@ -127,6 +130,10 @@ pci_uio_map_secondary(struct rte_pci_device *dev)
> continue;
>
> for (i = 0; i != uio_res->nb_maps; i++) {
> + /* ignore mappings unused in primary process */
> + if (uio_res->maps[i].addr == NULL)
> + continue;
> +
/*
> * open devname, to mmap it
> */
> @@ -282,6 +289,7 @@ pci_uio_map_resource(struct rte_pci_device *dev)
> {
> int i, j;
> char dirname[PATH_MAX];
> + char cfgname[PATH_MAX];
> char devname[PATH_MAX]; /* contains the /dev/uioX */
> void *mapaddr;
> int uio_num;
> @@ -294,6 +302,7 @@ pci_uio_map_resource(struct rte_pci_device *dev)
> struct pci_map *maps;
>
> dev->intr_handle.fd = -1;
> + dev->intr_handle.uio_cfg_fd = -1;
> dev->intr_handle.type = RTE_INTR_HANDLE_UNKNOWN;
>
> /* secondary processes - use already recorded details */
> @@ -318,6 +327,28 @@ pci_uio_map_resource(struct rte_pci_device *dev)
> }
> dev->intr_handle.type = RTE_INTR_HANDLE_UIO;
>
> + snprintf(cfgname, sizeof(cfgname),
> + "/sys/class/uio/uio%u/device/config", uio_num);
> + dev->intr_handle.uio_cfg_fd = open(cfgname, O_RDWR);
> + if (dev->intr_handle.uio_cfg_fd < 0) {
> + RTE_LOG(ERR, EAL, "Cannot open %s: %s\n",
> + cfgname, strerror(errno));
> + return -1;
> + }
> +
> + /* update devname for mmap */
> + snprintf(devname, sizeof(devname),
> + SYSFS_PCI_DEVICES "/" PCI_PRI_FMT "/resource%d",
> + loc->domain, loc->bus, loc->devid, loc->function, 0);
>
Why bother with a %d if you hardcode 0 ?
More importantly, since you hardcode "devname" to /sys/.../resource0, then
the mmap code will use a fd on this file.
I really am skeptical on the fact that it can work for devices that have no
bar0.
Then, how is this supposed to work ?
You rely on sysfs mmap code for pci resources.
Is this really equivalent to uio mmap operations ?
> +
> + /* set bus master that is not done by uio_pci_generic */
> + if (rte_eal_process_type() == RTE_PROC_PRIMARY) {
> + if (pci_uio_set_bus_master(dev->intr_handle.uio_cfg_fd)) {
> + RTE_LOG(ERR, EAL, "Cannot set up bus
> mastering!\n");
> + return -1;
> + }
> + }
> +
>
You are already running in a primary process, this check is useless.
> /* allocate the mapping details for secondary processes*/
> uio_res = rte_zmalloc("UIO_RES", sizeof(*uio_res), 0);
> if (uio_res == NULL) {
> @@ -330,13 +361,12 @@ pci_uio_map_resource(struct rte_pci_device *dev)
> memcpy(&uio_res->pci_addr, &dev->addr, sizeof(uio_res->pci_addr));
>
> /* collect info about device mappings */
> - nb_maps = pci_uio_get_mappings(dirname, uio_res->maps,
> - RTE_DIM(uio_res->maps));
> + nb_maps = pci_uio_get_mappings(dev, uio_res->maps,
> + RTE_DIM(uio_res->maps));
> if (nb_maps < 0) {
> rte_free(uio_res);
> return nb_maps;
> }
> -
> uio_res->nb_maps = nb_maps;
>
> /* Map all BARs */
>
Ok then after this, we use this temp array uio_res->maps and we loop all
over the pci resources.
Why do we have all these loops ?
I could see no point before, and with this change, it is bothering me again.
Won't it be easier to loop on the pci resources discovered by eal_pci.c
before this function is called ?
eal_pci.c is responsible for discovering pci devices, prepare those devices
(filling mem_resource[] for example), then eal_pci_uio.c / eal_pci_vfio.c
do the "mapping" stuff.
So uio / vfio must not overwrite what has already been set before.
--
David Marchand
next prev parent reply other threads:[~2015-02-23 15:24 UTC|newest]
Thread overview: 13+ messages / expand[flat|nested] mbox.gz Atom feed top
2015-02-19 17:08 [dpdk-dev] [PATCH v2 0/3] Enable " Zhou Danny
2015-02-19 17:08 ` [dpdk-dev] [PATCH v2 1/3] eal: enable " Zhou Danny
2015-02-20 9:01 ` Thomas Monjalon
2015-02-20 10:15 ` Bruce Richardson
2015-02-19 17:08 ` [dpdk-dev] [PATCH v2 2/3] eal: add interrupt enable/disable routines for uio_pci_generic Zhou Danny
2015-02-19 17:08 ` [dpdk-dev] [PATCH v2 3/3] tools: enable binding NIC device to uio_pci_generic Zhou Danny
2015-02-20 16:59 ` [dpdk-dev] [PATCH v3 0/3] enable uio_pci_generic support Bruce Richardson
2015-02-20 16:59 ` [dpdk-dev] [PATCH v3 1/3] eal: " Bruce Richardson
2015-02-23 15:24 ` David Marchand [this message]
2015-02-20 16:59 ` [dpdk-dev] [PATCH v3 2/3] eal: add interrupt enable/disable routines for uio_pci_generic Bruce Richardson
2015-02-20 16:59 ` [dpdk-dev] [PATCH v3 3/3] tools: enable binding NIC device to uio_pci_generic Bruce Richardson
2015-02-20 17:44 ` [dpdk-dev] [PATCH v3 0/3] enable uio_pci_generic support Declan Doherty
2015-02-20 22:35 ` Thomas Monjalon
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=CALwxeUv6HT-UJu3s9P8CCKkWN77c52fqBJem2XVq-+7pmedu5Q@mail.gmail.com \
--to=david.marchand@6wind.com \
--cc=bruce.richardson@intel.com \
--cc=dev@dpdk.org \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for NNTP newsgroup(s).