/* *------------------------------------------------------------------ * Copyright (c) 2016 Cisco and/or its affiliates. * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at: * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. *------------------------------------------------------------------ */ #define _GNU_SOURCE #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #define MEMIF_DEBUG 1 #if MEMIF_DEBUG == 1 #define DEBUG_LOG(...) clib_warning(__VA_ARGS__) #define DEBUG_UNIX_LOG(...) clib_unix_warning(__VA_ARGS__) #else #define DEBUG_LOG(...) #endif memif_main_t memif_main; static clib_error_t *memif_conn_fd_read_ready (unix_file_t * uf); static clib_error_t *memif_int_fd_read_ready (unix_file_t * uf); static u32 memif_eth_flag_change (vnet_main_t * vnm, vnet_hw_interface_t * hi, u32 flags) { /* nothing for now */ return 0; } static void memif_remove_pending_conn (memif_pending_conn_t * pending_conn) { memif_main_t *mm = &memif_main; unix_file_del (&unix_main, unix_main.file_pool + pending_conn->connection.index); pool_put (mm->pending_conns, pending_conn); } static void memif_connect (vlib_main_t * vm, memif_if_t * mif) { vnet_main_t *vnm = vnet_get_main (); int num_rings = mif->num_s2m_rings + mif->num_m2s_rings; memif_ring_data_t *rd = NULL; vec_validate_aligned (mif->ring_data, num_rings - 1, CLIB_CACHE_LINE_BYTES); vec_foreach (rd, mif->ring_data) { rd->last_head = 0; } mif->flags &= ~MEMIF_IF_FLAG_CONNECTING; mif->flags |= MEMIF_IF_FLAG_CONNECTED; vnet_hw_interface_set_flags (vnm, mif->hw_if_index, VNET_HW_INTERFACE_FLAG_LINK_UP); } static void memif_disconnect_do (vlib_main_t * vm, memif_if_t * mif) { vnet_main_t *vnm = vnet_get_main (); mif->flags &= ~(MEMIF_IF_FLAG_CONNECTED | MEMIF_IF_FLAG_CONNECTING); if (mif->hw_if_index != ~0) vnet_hw_interface_set_flags (vnm, mif->hw_if_index, 0); if (mif->connection.index != ~0) { unix_file_del (&unix_main, unix_main.file_pool + mif->connection.index); mif->connection.index = ~0; mif->connection.fd = -1; /* closed in unix_file_del */ } // TODO: properly munmap + close memif-owned shared memory segments vec_free (mif->regions); } void memif_disconnect (vlib_main_t * vm, memif_if_t * mif) { if (mif->interrupt_line.index != ~0) { unix_file_del (&unix_main, unix_main.file_pool + mif->interrupt_line.index); mif->interrupt_line.index = ~0; mif->interrupt_line.fd = -1; /* closed in unix_file_del */ } memif_disconnect_do (vm, mif); } static clib_error_t * memif_process_connect_req (memif_pending_conn_t * pending_conn, memif_msg_t * req, struct ucred *slave_cr, int shm_fd, int int_fd) { memif_main_t *mm = &memif_main; vlib_main_t *vm = vlib_get_main (); int fd = pending_conn->connection.fd; unix_file_t *uf = 0; memif_if_t *mif = 0; memif_msg_t resp = { 0 }; unix_file_t template = { 0 }; void *shm; uword *p; u8 retval = 0; static clib_error_t *error = 0; if (shm_fd == -1) { DEBUG_LOG ("Connection request is missing shared memory file descriptor"); retval = 1; goto response; } if (int_fd == -1) { DEBUG_LOG ("Connection request is missing interrupt line file descriptor"); retval = 2; goto response; } if (slave_cr == NULL) { DEBUG_LOG ("Connection request is missing slave credentials"); retval = 3; goto response; } p = mhash_get (&mm->if_index_by_key, &req->key); if (!p) { DEBUG_LOG ("Connection request with unmatched key (0x%" PRIx64 ")", req->key); retval = 4; goto response; } mif = vec_elt_at_index (mm->interfaces, *p); if (mif->listener_index != pending_conn->listener_index) { DEBUG_LOG ("Connection request with non-matching listener (%d vs. %d)", pending_conn->listener_index, mif->listener_index); retval = 5; goto response; } if (mif->flags & MEMIF_IF_FLAG_IS_SLAVE) { DEBUG_LOG ("Memif slave does not accept connection requests"); retval = 6; goto response; } if (mif->connection.fd != -1) { DEBUG_LOG ("Memif with key 0x%" PRIx64 " is already connected", mif->key); retval = 7; goto response; } if ((mif->flags & MEMIF_IF_FLAG_ADMIN_UP) == 0) { /* just silently decline the request */ retval = 8; goto response; } if (req->shared_mem_size < sizeof (memif_shm_t)) { DEBUG_LOG ("Unexpectedly small shared memory segment received from slave."); retval = 9; goto response; } if ((shm = mmap (NULL, req->shared_mem_size, PROT_READ | PROT_WRITE, MAP_SHARED, shm_fd, 0)) == MAP_FAILED) { DEBUG_UNIX_LOG ("Failed to map shared memory segment received from slave memif"); error = clib_error_return_unix (0, "mmap fd %d", shm_fd); retval = 10; goto response; } if (((memif_shm_t *) shm)->cookie != 0xdeadbeef) { DEBUG_LOG ("Possibly corrupted shared memory segment received from slave memif"); munmap (shm, req->shared_mem_size); retval = 11; goto response; } mif->log2_ring_size = req->log2_ring_size; mif->num_s2m_rings = req->num_s2m_rings; mif->num_m2s_rings = req->num_m2s_rings; mif->buffer_size = req->buffer_size; mif->remote_pid = slave_cr->pid; mif->remote_uid = slave_cr->uid; vec_add1 (mif->regions, shm); /* register interrupt line */ mif->interrupt_line.fd = int_fd; template.read_function = memif_int_fd_read_ready; template.file_descriptor = int_fd; template.private_data = mif->if_index; mif->interrupt_line.index = unix_file_add (&unix_main, &template); /* change context for future messages */ uf = vec_elt_at_index (unix_main.file_pool, pending_conn->connection.index); uf->private_data = mif->if_index << 1; mif->connection = pending_conn->connection; pool_put (mm->pending_conns, pending_conn); pending_conn = 0; memif_connect (vm, mif); response: resp.version = MEMIF_VERSION; resp.type = MEMIF_MSG_TYPE_CONNECT_RESP; resp.retval = retval; if (send (fd, &resp, sizeof (resp), 0) < 0) { DEBUG_UNIX_LOG ("Failed to send connection response"); error = clib_error_return_unix (0, "send fd %d", fd); if (pending_conn) memif_remove_pending_conn (pending_conn); else memif_disconnect (vm, mif); } if (retval > 0) { if (shm_fd >= 0) close (shm_fd); if (int_fd >= 0) close (int_fd); } return error; } static clib_error_t * memif_process_connect_resp (memif_if_t * mif, memif_msg_t * resp) { vlib_main_t *vm = vlib_get_main (); if ((mif->flags & MEMIF_IF_FLAG_IS_SLAVE) == 0) { DEBUG_LOG ("Memif master does not accept connection responses"); return 0; } if ((mif->flags & MEMIF_IF_FLAG_CONNECTING) == 0) { DEBUG_LOG ("Unexpected connection response"); return 0; } if (resp->retval == 0) memif_connect (vm, mif); else memif_disconnect (vm, mif); return 0; } static clib_error_t * memif_conn_fd_read_ready (unix_file_t * uf) { memif_main_t *mm = &memif_main; vlib_main_t *vm = vlib_get_main (); memif_if_t *mif = 0; memif_pending_conn_t *pending_conn = 0; int fd_array[2] = { -1, -1 }; char ctl[CMSG_SPACE (sizeof (fd_array)) + CMSG_SPACE (sizeof (struct ucred))] = { 0 }; struct msghdr mh = { 0 }; struct iovec iov[1]; struct ucred *cr = 0; memif_msg_t msg = { 0 }; struct cmsghdr *cmsg; ssize_t size; static clib_error_t *error = 0; iov[0].iov_base = (void *) &msg; iov[0].iov_len = sizeof (memif_msg_t); mh.msg_iov = iov; mh.msg_iovlen = 1; mh.msg_control = ctl; mh.msg_controllen = sizeof (ctl); /* grab the appropriate context */ if (uf->private_data & 1) pending_conn = vec_elt_at_index (mm->pending_conns, uf->private_data >> 1); else mif = vec_elt_at_index (mm->interfaces, uf->private_data >> 1); /* receive the incoming message */ size = recvmsg (uf->file_descriptor, &mh, 0); if (size != sizeof (memif_msg_t)) { if (size == 0) { if (pending_conn) memif_remove_pending_conn (pending_conn); else memif_disconnect_do (vm, mif); return error; } DEBUG_UNIX_LOG ("Malformed message received on fd %d", uf->file_descriptor); error = clib_error_return_unix (0, "recvmsg fd %d", uf->file_descriptor); goto disconnect; } /* check version of the sender's memif plugin */ if (msg.version != MEMIF_VERSION) { DEBUG_LOG ("Memif version mismatch"); goto disconnect; } /* process the message based on its type */ switch (msg.type) { case MEMIF_MSG_TYPE_CONNECT_REQ: if (pending_conn == 0) { DEBUG_LOG ("Received unexpected connection request"); return 0; } /* Read anciliary data */ cmsg = CMSG_FIRSTHDR (&mh); while (cmsg) { if (cmsg->cmsg_level == SOL_SOCKET && cmsg->cmsg_type == SCM_CREDENTIALS) { cr = (struct ucred *) CMSG_DATA (cmsg); } else if (cmsg->cmsg_level == SOL_SOCKET && cmsg->cmsg_type == SCM_RIGHTS) { memcpy (fd_array, CMSG_DATA (cmsg), sizeof (fd_array)); } cmsg = CMSG_NXTHDR (&mh, cmsg); } return memif_process_connect_req (pending_conn, &msg, cr, fd_array[0], fd_array[1]); case MEMIF_MSG_TYPE_CONNECT_RESP: if (mif == 0) { DEBUG_LOG ("Received unexpected connection response"); return 0; } return memif_process_connect_resp (mif, &msg); case MEMIF_MSG_TYPE_DISCONNECT: goto disconnect; default: DEBUG_LOG ("Received unknown message type"); goto disconnect; } return 0; disconnect: if (pending_conn) memif_remove_pending_conn (pending_conn); else memif_disconnect (vm, mif); return error; } static clib_error_t * memif_int_fd_read_ready (unix_file_t * uf) { memif_main_t *mm = &memif_main; vnet_main_t *vnm = vnet_get_main (); memif_if_t *mif = vec_elt_at_index (mm->interfaces, uf->private_data); u8 b; ssize_t size; size = read (uf->file_descriptor, &b, sizeof (b)); if (0 == size) { /* interrupt line was disconnected */ unix_file_del (&unix_main, unix_main.file_pool + mif->interrupt_line.index); mif->interrupt_line.index = ~0; mif->interrupt_line.fd = -1; } else vnet_device_input_set_interrupt_pending (vnm, mif->hw_if_index, 0); return 0; } static clib_error_t * memif_conn_fd_accept_ready (unix_file_t * uf) { memif_main_t *mm = &memif_main; memif_listener_t *listener = 0; memif_pending_conn_t *pending_conn = 0; int addr_len; struct sockaddr_un client; int conn_fd; unix_file_t template = { 0 }; listener = pool_elt_at_index (mm->listeners, uf->private_data); addr_len = sizeof (client); conn_fd = accept (uf->file_descriptor, (struct sockaddr *) &client, (socklen_t *) & addr_len); if (conn_fd < 0) return clib_error_return_unix (0, "accept fd %d", uf->file_descriptor); pool_get (mm->pending_conns, pending_conn); pending_conn->index = pending_conn - mm->pending_conns; pending_conn->listener_index = listener->index; pending_conn->connection.fd = conn_fd; template.read_function = memif_conn_fd_read_ready; template.file_descriptor = conn_fd; template.private_data = (pending_conn->index << 1) | 1; pending_conn->connection.index = unix_file_add (&unix_main, &template); return 0; } static void memif_connect_master (vlib_main_t * vm, memif_if_t * mif) { memif_msg_t msg; struct msghdr mh = { 0 }; struct iovec iov[1]; struct cmsghdr *cmsg; int mfd = -1; int rv; int fd_array[2] = { -1, -1 }; char ctl[CMSG_SPACE (sizeof (fd_array))]; memif_ring_t *ring = NULL; int i, j; void *shm = 0; u64 buffer_offset; unix_file_t template = { 0 }; msg.version = MEMIF_VERSION; msg.type = MEMIF_MSG_TYPE_CONNECT_REQ; msg.key = mif->key; msg.log2_ring_size = mif->log2_ring_size; msg.num_s2m_rings = mif->num_s2m_rings; msg.num_m2s_rings = mif->num_m2s_rings; msg.buffer_size = mif->buffer_size; buffer_offset = sizeof (memif_shm_t) + (mif->num_s2m_rings + mif->num_m2s_rings) * (sizeof (memif_ring_t) + sizeof (memif_desc_t) * (1 << mif->log2_ring_size)); msg.shared_mem_size = buffer_offset + mif->buffer_size * (1 << mif->log2_ring_size) * (mif->num_s2m_rings + mif->num_m2s_rings); if ((mfd = memfd_create ("shared mem", MFD_ALLOW_SEALING)) == -1) { DEBUG_LOG ("Failed to create anonymous file"); goto error; } if ((fcntl (mfd, F_ADD_SEALS, F_SEAL_SHRINK)) == -1) { DEBUG_UNIX_LOG ("Failed to seal an anonymous file off from truncating"); goto error; } if ((ftruncate (mfd, msg.shared_mem_size)) == -1) { DEBUG_UNIX_LOG ("Failed to extend the size of an anonymous file"); goto error; } if ((shm = mmap (NULL, msg.shared_mem_size, PROT_READ | PROT_WRITE, MAP_SHARED, mfd, 0)) == MAP_FAILED) { DEBUG_UNIX_LOG ("Failed to map anonymous file into memory"); goto error; } vec_add1 (mif->regions, shm); ((memif_shm_t *) mif->regions[0])->cookie = 0xdeadbeef; for (i = 0; i < mif->num_s2m_rings; i++) { ring = memif_get_ring (mif, MEMIF_RING_S2M, i); ring->head = ring->tail = 0; for (j = 0; j < (1 << mif->log2_ring_size); j++) { u16 slot = i * (1 << mif->log2_ring_size) + j; ring->desc[j].region = 0; ring->desc[j].offset = buffer_offset + (u32) (slot * mif->buffer_size); ring->desc[j].buffer_length = mif->buffer_size; } } for (i = 0; i < mif->num_m2s_rings; i++) { ring = memif_get_ring (mif, MEMIF_RING_M2S, i); ring->head = ring->tail = 0; for (j = 0; j < (1 << mif->log2_ring_size); j++) { u16 slot = (i + mif->num_s2m_rings) * (1 << mif->log2_ring_size) + j; ring->desc[j].region = 0; ring->desc[j].offset = buffer_offset + (u32) (slot * mif->buffer_size); ring->desc[j].buffer_length = mif->buffer_size; } } iov[0].iov_base = (void *) &msg; iov[0].iov_len = sizeof (memif_msg_t); mh.msg_iov = iov; mh.msg_iovlen = 1; /* create interrupt socket */ if (socketpair (AF_UNIX, SOCK_STREAM, 0, fd_array) < 0) { DEBUG_UNIX_LOG ("Failed to create a pair of connected sockets"); goto error; } mif->interrupt_line.fd = fd_array[0]; template.read_function = memif_int_fd_read_ready; template.file_descriptor = mif->interrupt_line.fd; template.private_data = mif->if_index; mif->interrupt_line.index = unix_file_add (&unix_main, &template); memset (&ctl, 0, sizeof (ctl)); mh.msg_control = ctl; mh.msg_controllen = sizeof (ctl); cmsg = CMSG_FIRSTHDR (&mh); cmsg->cmsg_len = CMSG_LEN (sizeof (fd_array)); cmsg->cmsg_level = SOL_SOCKET; cmsg->cmsg_type = SCM_RIGHTS; fd_array[0] = mfd; memcpy (CMSG_DATA (cmsg), fd_array, sizeof (fd_array)); mif->flags |= MEMIF_IF_FLAG_CONNECTING; rv = sendmsg (mif->connection.fd, &mh, 0); if (rv < 0) { DEBUG_UNIX_LOG ("Failed to send memif connection request"); goto error; } /* No need to keep the descriptor open, * mmap creates an extra reference to the underlying file */ close (mfd); mfd = -1; /* This FD is given to peer, so we can close it */ close (fd_array[1]); fd_array[1] = -1; return; error: if (mfd > -1) close (mfd); if (fd_array[1] > -1) close (fd_array[1]); memif_disconnect (vm, mif); } static uword memif_process (vlib_main_t * vm, vlib_node_runtime_t * rt, vlib_frame_t * f) { memif_main_t *mm = &memif_main; memif_if_t *mif; struct sockaddr_un sun; int sockfd; uword *event_data = 0, event_type; unix_file_t template = { 0 }; u8 enabled = 0; f64 start_time, last_run_duration = 0, now; sockfd = socket (AF_UNIX, SOCK_STREAM, 0); if (sockfd < 0) { DEBUG_UNIX_LOG ("socket AF_UNIX"); return 0; } sun.sun_family = AF_UNIX; template.read_function = memif_conn_fd_read_ready; while (1) { if (enabled) vlib_process_wait_for_event_or_clock (vm, (f64) 3 - last_run_duration); else vlib_process_wait_for_event (vm); event_type = vlib_process_get_events (vm, &event_data); vec_reset_length (event_data); switch (event_type) { case ~0: break; case MEMIF_PROCESS_EVENT_START: enabled = 1; break; case MEMIF_PROCESS_EVENT_STOP: enabled = 0; continue; default: ASSERT (0); } last_run_duration = start_time = vlib_time_now (vm); /* *INDENT-OFF* */ pool_foreach (mif, mm->interfaces, ({ /* Allow no more than 10us without a pause */ now = vlib_time_now (vm); if (now > start_time + 10e-6) { vlib_process_suspend (vm, 100e-6); /* suspend for 100 us */ start_time = vlib_time_now (vm); } if ((mif->flags & MEMIF_IF_FLAG_ADMIN_UP) == 0) continue; if (mif->flags & MEMIF_IF_FLAG_CONNECTING) continue; if (mif->flags & MEMIF_IF_FLAG_CONNECTED) continue; if (mif->flags & MEMIF_IF_FLAG_IS_SLAVE) { strncpy (sun.sun_path, (char *) mif->socket_filename, sizeof (sun.sun_path) - 1); if (connect (sockfd, (struct sockaddr *) &sun, sizeof (struct sockaddr_un)) == 0) { mif->connection.fd = sockfd; template.file_descriptor = sockfd; template.private_data = mif->if_index << 1; mif->connection.index = unix_file_add (&unix_main, &template); memif_connect_master (vm, mif); /* grab another fd */ sockfd = socket (AF_UNIX, SOCK_STREAM, 0); if (sockfd < 0) { DEBUG_UNIX_LOG ("socket AF_UNIX"); return 0; } } } })); /* *INDENT-ON* */ last_run_duration = vlib_time_now (vm) - last_run_duration; } return 0; } /* *INDENT-OFF* */ VLIB_REGISTER_NODE (memif_process_node,static) = { .function = memif_process, .type = VLIB_NODE_TYPE_PROCESS, .name = "memif-process", }; /* *INDENT-ON* */ static void memif_close_if (memif_main_t * mm, memif_if_t * mif) { vlib_main_t *vm = vlib_get_main (); memif_listener_t *listener = 0; memif_pending_conn_t *pending_conn = 0; memif_disconnect (vm, mif); if (mif->listener_index != (uword) ~ 0) { listener = pool_elt_at_index (mm->listeners, mif->listener_index); if (--listener->usage_counter == 0) { /* not used anymore -> remove the socket and pending connections */ /* *INDENT-OFF* */ pool_foreach (pending_conn, mm->pending_conns, ({ if (pending_conn->listener_index == mif->listener_index) { memif_remove_pending_conn (pending_conn); } })); /* *INDENT-ON* */ unix_file_del (&unix_main, unix_main.file_pool + listener->socket.index); pool_put (mm->listeners, listener); unlink ((char *) mif->socket_filename); } } clib_spinlock_free (&mif->lockp); mhash_unset (&mm->if_index_by_key, &mif->key, &mif->if_index); vec_free (mif->socket_filename); vec_free (mif->ring_data); memset (mif, 0, sizeof (*mif)); pool_put (mm->interfaces, mif); } int memif_worker_thread_enable () { /* if worker threads are enabled, switch to polling mode */ /* *INDENT-OFF* */ foreach_vlib_main (( { vlib_node_set_state (this_vlib_main, memif_input_node.index, VLIB_NODE_STATE_POLLING); })); /* *INDENT-ON* */ return 0; } int memif_worker_thread_disable () { /* *INDENT-OFF* */ foreach_vlib_main (( { vlib_node_set_state (this_vlib_main, memif_input_node.index, VLIB_NODE_STATE_INTERRUPT); })); /* *INDENT-ON* */ return 0; } int memif_create_if (vlib_main_t * vm, memif_create_if_args_t * args) { memif_main_t *mm = &memif_main; vlib_thread_main_t *tm = vlib_get_thread_main (); vnet_main_t *vnm = vnet_get_main (); memif_if_t *mif = 0; vnet_sw_interface_t *sw; clib_error_t *error = 0; int ret = 0; uword *p; vnet_hw_interface_t *hw; p = mhash_get (&mm->if_index_by_key, &args->key); if (p) return VNET_API_ERROR_SUBIF_ALREADY_EXISTS; pool_get (mm->interfaces, mif); memset (mif, 0, sizeof (*mif)); mif->key = args->key; mif->if_index = mif - mm->interfaces; mif->sw_if_index = mif->hw_if_index = mif->per_interface_next_index = ~0; mif->listener_index = ~0; mif->connection.index = mif->interrupt_line.index = ~0; mif->connection.fd = mif->interrupt_line.fd = -1; if (tm->n_vlib_mains > 1) clib_spinlock_init (&mif->lockp); if (!args->hw_addr_set) { f64 now = vlib_time_now (vm); u32 rnd; rnd = (u32) (now * 1e6); rnd = random_u32 (&rnd); memcpy (args->hw_addr + 2, &rnd, sizeof (rnd)); args->hw_addr[0] = 2; args->hw_addr[1] = 0xfe; } error = ethernet_register_interface (vnm, memif_device_class.index, mif->if_index, args->hw_addr, &mif->hw_if_index, memif_eth_flag_change); if (error) { clib_error_report (error); ret = VNET_API_ERROR_SYSCALL_ERROR_1; goto error; } sw = vnet_get_hw_sw_interface (vnm, mif->hw_if_index); mif->sw_if_index = sw->sw_if_index; mif->log2_ring_size = args->log2_ring_size; mif->buffer_size = args->buffer_size; /* TODO: make configurable */ mif->num_s2m_rings = 1; mif->num_m2s_rings = 1; mhash_set_mem (&mm->if_index_by_key, &args->key, &mif->if_index, 0); if (args->socket_filename != 0) mif->socket_filename = args->socket_filename; else mif->socket_filename = vec_dup (mm->default_socket_filename); args->sw_if_index = mif->sw_if_index; if (args->is_master) { struct sockaddr_un un = { 0 }; struct stat file_stat; int on = 1; memif_listener_t *listener = 0; if (stat ((char *) mif->socket_filename, &file_stat) == 0) { if (!S_ISSOCK (file_stat.st_mode)) { errno = ENOTSOCK; ret = VNET_API_ERROR_SYSCALL_ERROR_2; goto error; } /* *INDENT-OFF* */ pool_foreach (listener, mm->listeners, ({ if (listener->sock_dev == file_stat.st_dev && listener->sock_ino == file_stat.st_ino) { /* attach memif to the existing listener */ mif->listener_index = listener->index; ++listener->usage_counter; goto signal; } })); /* *INDENT-ON* */ unlink ((char *) mif->socket_filename); } pool_get (mm->listeners, listener); memset (listener, 0, sizeof (*listener)); listener->socket.fd = -1; listener->socket.index = ~0; listener->index = listener - mm->listeners; listener->usage_counter = 1; if ((listener->socket.fd = socket (AF_UNIX, SOCK_STREAM, 0)) < 0) { ret = VNET_API_ERROR_SYSCALL_ERROR_3; goto error; } un.sun_family = AF_UNIX; strncpy ((char *) un.sun_path, (char *) mif->socket_filename, sizeof (un.sun_path) - 1); if (setsockopt (listener->socket.fd, SOL_SOCKET, SO_PASSCRED, &on, sizeof (on)) < 0) { ret = VNET_API_ERROR_SYSCALL_ERROR_4; goto error; } if (bind (listener->socket.fd, (struct sockaddr *) &un, sizeof (un)) == -1) { ret = VNET_API_ERROR_SYSCALL_ERROR_5; goto error; } if (listen (listener->socket.fd, 1) == -1) { ret = VNET_API_ERROR_SYSCALL_ERROR_6; goto error; } if (stat ((char *) mif->socket_filename, &file_stat) == -1) { ret = VNET_API_ERROR_SYSCALL_ERROR_7; goto error; } listener->sock_dev = file_stat.st_dev; listener->sock_ino = file_stat.st_ino; unix_file_t template = { 0 }; template.read_function = memif_conn_fd_accept_ready; template.file_descriptor = listener->socket.fd; template.private_data = listener->index; listener->socket.index = unix_file_add (&unix_main, &template); mif->listener_index = listener->index; } else { mif->flags |= MEMIF_IF_FLAG_IS_SLAVE; } hw = vnet_get_hw_interface (vnm, mif->hw_if_index); hw->flags |= VNET_HW_INTERFACE_FLAG_SUPPORTS_INT_MODE; vnet_hw_interface_set_input_node (vnm, mif->hw_if_index, memif_input_node.index); vnet_hw_interface_assign_rx_thread (vnm, mif->hw_if_index, 0, ~0); ret = vnet_hw_interface_set_rx_mode (vnm, mif->hw_if_index, 0, VNET_HW_INTERFACE_RX_MODE_INTERRUPT); if (ret) clib_warning ("Warning: unable to set rx mode for interface %d: " "rc=%d", mif->hw_if_index, ret); #if 0 /* use configured or generate random MAC address */ if (!args->hw_addr_set && tm->n_vlib_mains > 1 && pool_elts (mm->interfaces) == 1) memif_worker_thread_enable (); #endif signal: if (pool_elts (mm->interfaces) == 1) { vlib_process_signal_event (vm, memif_process_node.index, MEMIF_PROCESS_EVENT_START, 0); } return 0; error: if (mif->hw_if_index != ~0) { ethernet_delete_interface (vnm, mif->hw_if_index); mif->hw_if_index = ~0; } memif_close_if (mm, mif); return ret; } int memif_delete_if (vlib_main_t * vm, u64 key) { vnet_main_t *vnm = vnet_get_main (); memif_main_t *mm = &memif_main; memif_if_t *mif; uword *p; int ret; p = mhash_get (&mm->if_index_by_key, &key); if (p == NULL) { clib_warning ("Memory interface with key 0x%" PRIx64 " does not exist", key); return VNET_API_ERROR_SYSCALL_ERROR_1; } mif = pool_elt_at_index (mm->interfaces, p[0]); mif->flags |= MEMIF_IF_FLAG_DELETING; ret = vnet_hw_interface_unassign_rx_thread (vnm, mif->hw_if_index, 0); if (ret) clib_warning ("Warning: unable to unassign interface %d: rc=%d", mif->hw_if_index, ret); /* bring down the interface */ vnet_hw_interface_set_flags (vnm, mif->hw_if_index, 0); vnet_sw_interface_set_flags (vnm, mif->sw_if_index, 0); /* remove the interface */ ethernet_delete_interface (vnm, mif->hw_if_index); mif->hw_if_index = ~0; memif_close_if (mm, mif); if (pool_elts (mm->interfaces) == 0) { vlib_process_signal_event (vm, memif_process_node.index, MEMIF_PROCESS_EVENT_STOP, 0); } #if 0 if (tm->n_vlib_mains > 1 && pool_elts (mm->interfaces) == 0) memif_worker_thread_disable (); #endif return 0; } static clib_error_t * memif_init (vlib_main_t * vm) { memif_main_t *mm = &memif_main; vlib_thread_main_t *tm = vlib_get_thread_main (); vlib_thread_registration_t *tr; uword *p; memset (mm, 0, sizeof (memif_main_t)); mm->input_cpu_first_index = 0; mm->input_cpu_count = 1; /* initialize binary API */ memif_plugin_api_hookup (vm); /* find out which cpus will be used for input */ p = hash_get_mem (tm->thread_registrations_by_name, "workers"); tr = p ? (vlib_thread_registration_t *) p[0] : 0; if (tr && tr->count > 0) { mm->input_cpu_first_index = tr->first_index; mm->input_cpu_count = tr->count; } mhash_init (&mm->if_index_by_key, sizeof (uword), sizeof (u64)); vec_validate_aligned (mm->rx_buffers, tm->n_vlib_mains - 1, CLIB_CACHE_LINE_BYTES); /* set default socket filename */ vec_validate (mm->default_socket_filename, strlen (MEMIF_DEFAULT_SOCKET_FILENAME)); strncpy ((char *) mm->default_socket_filename, MEMIF_DEFAULT_SOCKET_FILENAME, vec_len (mm->default_socket_filename) - 1); return 0; } VLIB_INIT_FUNCTION (memif_init); /* *INDENT-OFF* */ VLIB_PLUGIN_REGISTER () = { .version = VPP_BUILD_VER, .description = "Packet Memory Interface (experimetal)", }; /* *INDENT-ON* */ /* * fd.io coding-style-patch-verification: ON * * Local Variables: * eval: (c-set-style "gnu") * End: */