New upstream version 18.08
[deb_dpdk.git] / drivers / bus / vdev / vdev.c
index e4bc724..6139dd5 100644 (file)
@@ -1,33 +1,5 @@
-/*-
- *   BSD LICENSE
- *
- *   Copyright(c) 2016 RehiveTech. All rights reserved.
- *
- *   Redistribution and use in source and binary forms, with or without
- *   modification, are permitted provided that the following conditions
- *   are met:
- *
- *     * Redistributions of source code must retain the above copyright
- *       notice, this list of conditions and the following disclaimer.
- *     * Redistributions in binary form must reproduce the above copyright
- *       notice, this list of conditions and the following disclaimer in
- *       the documentation and/or other materials provided with the
- *       distribution.
- *     * Neither the name of RehiveTech nor the names of its
- *       contributors may be used to endorse or promote products derived
- *       from this software without specific prior written permission.
- *
- *   THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
- *   "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
- *   LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
- *   A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
- *   OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
- *   SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
- *   LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
- *   DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
- *   THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
- *   (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
- *   OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+/* SPDX-License-Identifier: BSD-3-Clause
+ * Copyright(c) 2016 RehiveTech. All rights reserved.
  */
 
 #include <string.h>
 #include <rte_memory.h>
 #include <rte_tailq.h>
 #include <rte_spinlock.h>
+#include <rte_string_fns.h>
 #include <rte_errno.h>
 
 #include "rte_bus_vdev.h"
 #include "vdev_logs.h"
 
+#define VDEV_MP_KEY    "bus_vdev_mp"
+
 int vdev_logtype_bus;
 
 /* Forward declare to access virtual bus name */
@@ -61,6 +36,10 @@ TAILQ_HEAD(vdev_device_list, rte_vdev_device);
 
 static struct vdev_device_list vdev_device_list =
        TAILQ_HEAD_INITIALIZER(vdev_device_list);
+/* The lock needs to be recursive because a vdev can manage another vdev. */
+static rte_spinlock_recursive_t vdev_device_list_lock =
+       RTE_SPINLOCK_RECURSIVE_INITIALIZER;
+
 struct vdev_driver_list vdev_driver_list =
        TAILQ_HEAD_INITIALIZER(vdev_driver_list);
 
@@ -165,7 +144,7 @@ vdev_probe_all_drivers(struct rte_vdev_device *dev)
 
        name = rte_vdev_device_name(dev);
 
-       VDEV_LOG(DEBUG, "Search driver %s to probe device %s\n", name,
+       VDEV_LOG(DEBUG, "Search driver %s to probe device %s", name,
                rte_vdev_device_name(dev));
 
        if (vdev_parse(name, &driver))
@@ -177,6 +156,7 @@ vdev_probe_all_drivers(struct rte_vdev_device *dev)
        return ret;
 }
 
+/* The caller is responsible for thread safety. */
 static struct rte_vdev_device *
 find_vdev(const char *name)
 {
@@ -188,7 +168,7 @@ find_vdev(const char *name)
        TAILQ_FOREACH(dev, &vdev_device_list, next) {
                const char *devname = rte_vdev_device_name(dev);
 
-               if (!strncmp(devname, name, strlen(name)))
+               if (!strcmp(devname, name))
                        return dev;
        }
 
@@ -221,8 +201,8 @@ alloc_devargs(const char *name, const char *args)
        return devargs;
 }
 
-int
-rte_vdev_init(const char *name, const char *args)
+static int
+insert_vdev(const char *name, const char *args, struct rte_vdev_device **p_dev)
 {
        struct rte_vdev_device *dev;
        struct rte_devargs *devargs;
@@ -231,10 +211,6 @@ rte_vdev_init(const char *name, const char *args)
        if (name == NULL)
                return -EINVAL;
 
-       dev = find_vdev(name);
-       if (dev)
-               return -EEXIST;
-
        devargs = alloc_devargs(name, args);
        if (!devargs)
                return -ENOMEM;
@@ -249,18 +225,18 @@ rte_vdev_init(const char *name, const char *args)
        dev->device.numa_node = SOCKET_ID_ANY;
        dev->device.name = devargs->name;
 
-       ret = vdev_probe_all_drivers(dev);
-       if (ret) {
-               if (ret > 0)
-                       VDEV_LOG(ERR, "no driver found for %s\n", name);
+       if (find_vdev(name)) {
+               ret = -EEXIST;
                goto fail;
        }
 
-       TAILQ_INSERT_TAIL(&devargs_list, devargs, next);
-
        TAILQ_INSERT_TAIL(&vdev_device_list, dev, next);
-       return 0;
+       rte_devargs_insert(devargs);
+
+       if (p_dev)
+               *p_dev = dev;
 
+       return 0;
 fail:
        free(devargs->args);
        free(devargs);
@@ -268,6 +244,31 @@ fail:
        return ret;
 }
 
+int
+rte_vdev_init(const char *name, const char *args)
+{
+       struct rte_vdev_device *dev;
+       struct rte_devargs *devargs;
+       int ret;
+
+       rte_spinlock_recursive_lock(&vdev_device_list_lock);
+       ret = insert_vdev(name, args, &dev);
+       if (ret == 0) {
+               ret = vdev_probe_all_drivers(dev);
+               if (ret) {
+                       if (ret > 0)
+                               VDEV_LOG(ERR, "no driver found for %s", name);
+                       /* If fails, remove it from vdev list */
+                       devargs = dev->device.devargs;
+                       TAILQ_REMOVE(&vdev_device_list, dev, next);
+                       rte_devargs_remove(devargs->bus->name, devargs->name);
+                       free(dev);
+               }
+       }
+       rte_spinlock_recursive_unlock(&vdev_device_list_lock);
+       return ret;
+}
+
 static int
 vdev_remove_driver(struct rte_vdev_device *dev)
 {
@@ -275,7 +276,7 @@ vdev_remove_driver(struct rte_vdev_device *dev)
        const struct rte_vdev_driver *driver;
 
        if (!dev->device.driver) {
-               VDEV_LOG(DEBUG, "no driver attach to device %s\n", name);
+               VDEV_LOG(DEBUG, "no driver attach to device %s", name);
                return 1;
        }
 
@@ -294,23 +295,98 @@ rte_vdev_uninit(const char *name)
        if (name == NULL)
                return -EINVAL;
 
-       dev = find_vdev(name);
-       if (!dev)
-               return -ENOENT;
+       rte_spinlock_recursive_lock(&vdev_device_list_lock);
 
-       devargs = dev->device.devargs;
+       dev = find_vdev(name);
+       if (!dev) {
+               ret = -ENOENT;
+               goto unlock;
+       }
 
        ret = vdev_remove_driver(dev);
        if (ret)
-               return ret;
+               goto unlock;
 
        TAILQ_REMOVE(&vdev_device_list, dev, next);
+       devargs = dev->device.devargs;
+       rte_devargs_remove(devargs->bus->name, devargs->name);
+       free(dev);
 
-       TAILQ_REMOVE(&devargs_list, devargs, next);
+unlock:
+       rte_spinlock_recursive_unlock(&vdev_device_list_lock);
+       return ret;
+}
+
+struct vdev_param {
+#define VDEV_SCAN_REQ  1
+#define VDEV_SCAN_ONE  2
+#define VDEV_SCAN_REP  3
+       int type;
+       int num;
+       char name[RTE_DEV_NAME_MAX_LEN];
+};
+
+static int vdev_plug(struct rte_device *dev);
+
+/**
+ * This function works as the action for both primary and secondary processes
+ * for static vdev discovery when a secondary process is booting.
+ *
+ * step 1, secondary process sends a sync request to ask primary for vdevs;
+ * step 2, primary process receives the request and sends vdevs one by one;
+ * step 3, primary process sends back a reply, which indicates how many vdevs
+ * were sent.
+ */
+static int
+vdev_action(const struct rte_mp_msg *mp_msg, const void *peer)
+{
+       struct rte_vdev_device *dev;
+       struct rte_mp_msg mp_resp;
+       struct vdev_param *ou = (struct vdev_param *)&mp_resp.param;
+       const struct vdev_param *in = (const struct vdev_param *)mp_msg->param;
+       const char *devname;
+       int num;
+
+       strlcpy(mp_resp.name, VDEV_MP_KEY, sizeof(mp_resp.name));
+       mp_resp.len_param = sizeof(*ou);
+       mp_resp.num_fds = 0;
+
+       switch (in->type) {
+       case VDEV_SCAN_REQ:
+               ou->type = VDEV_SCAN_ONE;
+               ou->num = 1;
+               num = 0;
+
+               rte_spinlock_recursive_lock(&vdev_device_list_lock);
+               TAILQ_FOREACH(dev, &vdev_device_list, next) {
+                       devname = rte_vdev_device_name(dev);
+                       if (strlen(devname) == 0) {
+                               VDEV_LOG(INFO, "vdev with no name is not sent");
+                               continue;
+                       }
+                       VDEV_LOG(INFO, "send vdev, %s", devname);
+                       strlcpy(ou->name, devname, RTE_DEV_NAME_MAX_LEN);
+                       if (rte_mp_sendmsg(&mp_resp) < 0)
+                               VDEV_LOG(ERR, "send vdev, %s, failed, %s",
+                                        devname, strerror(rte_errno));
+                       num++;
+               }
+               rte_spinlock_recursive_unlock(&vdev_device_list_lock);
+
+               ou->type = VDEV_SCAN_REP;
+               ou->num = num;
+               if (rte_mp_reply(&mp_resp, peer) < 0)
+                       VDEV_LOG(ERR, "Failed to reply a scan request");
+               break;
+       case VDEV_SCAN_ONE:
+               VDEV_LOG(INFO, "receive vdev, %s", in->name);
+               if (insert_vdev(in->name, NULL, NULL) < 0)
+                       VDEV_LOG(ERR, "failed to add vdev, %s", in->name);
+               break;
+       default:
+               VDEV_LOG(ERR, "vdev cannot recognize this message");
+       }
 
-       free(devargs->args);
-       free(devargs);
-       free(dev);
        return 0;
 }
 
@@ -321,13 +397,41 @@ vdev_scan(void)
        struct rte_devargs *devargs;
        struct vdev_custom_scan *custom_scan;
 
+       if (rte_mp_action_register(VDEV_MP_KEY, vdev_action) < 0 &&
+           rte_errno != EEXIST) {
+               VDEV_LOG(ERR, "Failed to add vdev mp action");
+               return -1;
+       }
+
+       if (rte_eal_process_type() == RTE_PROC_SECONDARY) {
+               struct rte_mp_msg mp_req, *mp_rep;
+               struct rte_mp_reply mp_reply;
+               struct timespec ts = {.tv_sec = 5, .tv_nsec = 0};
+               struct vdev_param *req = (struct vdev_param *)mp_req.param;
+               struct vdev_param *resp;
+
+               strlcpy(mp_req.name, VDEV_MP_KEY, sizeof(mp_req.name));
+               mp_req.len_param = sizeof(*req);
+               mp_req.num_fds = 0;
+               req->type = VDEV_SCAN_REQ;
+               if (rte_mp_request_sync(&mp_req, &mp_reply, &ts) == 0 &&
+                   mp_reply.nb_received == 1) {
+                       mp_rep = &mp_reply.msgs[0];
+                       resp = (struct vdev_param *)mp_rep->param;
+                       VDEV_LOG(INFO, "Received %d vdevs", resp->num);
+               } else
+                       VDEV_LOG(ERR, "Failed to request vdev from primary");
+
+               /* Fall through to allow private vdevs in secondary process */
+       }
+
        /* call custom scan callbacks if any */
        rte_spinlock_lock(&vdev_custom_scan_lock);
        TAILQ_FOREACH(custom_scan, &vdev_custom_scans, next) {
                if (custom_scan->callback != NULL)
                        /*
                         * the callback should update devargs list
-                        * by calling rte_eal_devargs_insert() with
+                        * by calling rte_devargs_insert() with
                         *     devargs.bus = rte_bus_find_by_name("vdev");
                         *     devargs.type = RTE_DEVTYPE_VIRTUAL;
                         *     devargs.policy = RTE_DEV_WHITELISTED;
@@ -337,24 +441,27 @@ vdev_scan(void)
        rte_spinlock_unlock(&vdev_custom_scan_lock);
 
        /* for virtual devices we scan the devargs_list populated via cmdline */
-       TAILQ_FOREACH(devargs, &devargs_list, next) {
-
-               if (devargs->bus != &rte_vdev_bus)
-                       continue;
-
-               dev = find_vdev(devargs->name);
-               if (dev)
-                       continue;
+       RTE_EAL_DEVARGS_FOREACH("vdev", devargs) {
 
                dev = calloc(1, sizeof(*dev));
                if (!dev)
                        return -1;
 
+               rte_spinlock_recursive_lock(&vdev_device_list_lock);
+
+               if (find_vdev(devargs->name)) {
+                       rte_spinlock_recursive_unlock(&vdev_device_list_lock);
+                       free(dev);
+                       continue;
+               }
+
                dev->device.devargs = devargs;
                dev->device.numa_node = SOCKET_ID_ANY;
                dev->device.name = devargs->name;
 
                TAILQ_INSERT_TAIL(&vdev_device_list, dev, next);
+
+               rte_spinlock_recursive_unlock(&vdev_device_list_lock);
        }
 
        return 0;
@@ -368,12 +475,16 @@ vdev_probe(void)
 
        /* call the init function for each virtual device */
        TAILQ_FOREACH(dev, &vdev_device_list, next) {
+               /* we don't use the vdev lock here, as it's only used in DPDK
+                * initialization; and we don't want to hold such a lock when
+                * we call each driver probe.
+                */
 
                if (dev->device.driver)
                        continue;
 
                if (vdev_probe_all_drivers(dev)) {
-                       VDEV_LOG(ERR, "failed to initialize %s device\n",
+                       VDEV_LOG(ERR, "failed to initialize %s device",
                                rte_vdev_device_name(dev));
                        ret = -1;
                }
@@ -386,17 +497,24 @@ static struct rte_device *
 vdev_find_device(const struct rte_device *start, rte_dev_cmp_t cmp,
                 const void *data)
 {
+       const struct rte_vdev_device *vstart;
        struct rte_vdev_device *dev;
 
-       TAILQ_FOREACH(dev, &vdev_device_list, next) {
-               if (start && &dev->device == start) {
-                       start = NULL;
-                       continue;
-               }
+       rte_spinlock_recursive_lock(&vdev_device_list_lock);
+       if (start != NULL) {
+               vstart = RTE_DEV_TO_VDEV_CONST(start);
+               dev = TAILQ_NEXT(vstart, next);
+       } else {
+               dev = TAILQ_FIRST(&vdev_device_list);
+       }
+       while (dev != NULL) {
                if (cmp(&dev->device, data) == 0)
-                       return &dev->device;
+                       break;
+               dev = TAILQ_NEXT(dev, next);
        }
-       return NULL;
+       rte_spinlock_recursive_unlock(&vdev_device_list_lock);
+
+       return dev ? &dev->device : NULL;
 }
 
 static int