4 * Copyright(c) 2017 Intel Corporation. All rights reserved.
7 * Redistribution and use in source and binary forms, with or without
8 * modification, are permitted provided that the following conditions
11 * * Redistributions of source code must retain the above copyright
12 * notice, this list of conditions and the following disclaimer.
13 * * Redistributions in binary form must reproduce the above copyright
14 * notice, this list of conditions and the following disclaimer in
15 * the documentation and/or other materials provided with the
17 * * Neither the name of Intel Corporation nor the names of its
18 * contributors may be used to endorse or promote products derived
19 * from this software without specific prior written permission.
21 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
22 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
23 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
24 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
25 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
26 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
27 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
28 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
29 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
30 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
31 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
41 #include <rte_service.h>
42 #include "include/rte_service_component.h"
45 #include <rte_lcore.h>
46 #include <rte_common.h>
47 #include <rte_debug.h>
48 #include <rte_cycles.h>
49 #include <rte_atomic.h>
50 #include <rte_memory.h>
51 #include <rte_malloc.h>
// Upper bound on service slots: used in this file as the length of the
// rte_services array and of the per-core calls_per_service counters.
// NOTE(review): per-core service masks are uint64_t with one bit per
// service ID, so this value presumably must not exceed 64 - confirm.
53 #define RTE_SERVICE_NUM_MAX 64
// Bit flags kept in rte_service_spec_impl.internal_flags:
//   REGISTERED     - slot holds a registered service (see service_valid)
//   STATS_ENABLED  - the runner records cycle and call statistics
//   START_CHECK    - rte_service_runstate_get also requires a mapped lcore
55 #define SERVICE_F_REGISTERED (1 << 0)
56 #define SERVICE_F_STATS_ENABLED (1 << 1)
57 #define SERVICE_F_START_CHECK (1 << 2)
59 /* runstates for services and lcores, denoting if they are active or not */
60 #define RUNSTATE_STOPPED 0
61 #define RUNSTATE_RUNNING 1
// Library-private record for one service slot: the public spec plus the
// bookkeeping used by the runner and the mapping helpers in this file.
63 /* internal representation of a service */
64 struct rte_service_spec_impl {
65 /* public part of the struct */
66 struct rte_service_spec spec;
68 /* atomic lock that when set indicates a service core is currently
69 * running this service callback. When not set, a core may take the
70 * lock and then run the service callback.
72 rte_atomic32_t execute_lock;
74 /* API set/get-able variables */
// Bitwise OR of the SERVICE_F_ flags for this slot.
77 uint8_t internal_flags;
79 /* per service statistics */
// Number of lcores currently counted as mapped to this service; adjusted by
// service_update and temporarily by rte_service_run_iter_on_app_lcore.
80 rte_atomic32_t num_mapped_cores;
// Sum of rte_rdtsc deltas measured around the callback while statistics
// are enabled.
82 uint64_t cycles_spent;
83 } __rte_cache_aligned;
85 /* the internal values of a service core */
// NOTE(review): the opening line of this struct is not visible here; the
// lcore_states declaration suggests the type is struct core_state - confirm.
87 /* map of services IDs are run on this core */
// Bit N set means service ID N is mapped to this core.
88 uint64_t service_mask;
89 uint8_t runstate; /* running or stopped */
90 uint8_t is_service_core; /* set if core is currently a service core */
92 /* extreme statistics */
// Callback invocations made by this core, indexed by service ID; only
// incremented while the service has statistics enabled.
93 uint64_t calls_per_service[RTE_SERVICE_NUM_MAX];
94 } __rte_cache_aligned;
// Value reported by rte_service_get_count; presumably the number of
// currently registered services - confirm against register and unregister.
96 static uint32_t rte_service_count;
// Array of RTE_SERVICE_NUM_MAX service slots, allocated in rte_service_init.
97 static struct rte_service_spec_impl *rte_services;
// Array of RTE_MAX_LCORE per-lcore records, allocated in rte_service_init.
98 static struct core_state *lcore_states;
// Set to 1 at the end of a successful rte_service_init.
99 static uint32_t rte_service_library_initialized;
// Initialize the service library: allocate the service-slot and per-lcore
// state arrays, add every lcore already configured with ROLE_SERVICE as a
// service core, and set the initialized flag.
// When the flag is already set a diagnostic is printed; the value returned
// on that path is not visible here.
// NOTE(review): the flag is uint32_t but is printed with %d.
101 int32_t rte_service_init(void)
103 if (rte_service_library_initialized) {
104 printf("service library init() called, init flag %d\n",
105 rte_service_library_initialized);
// One zero-initialized, cache-line aligned slot per possible service, so
// every slot starts with no flags set.
109 rte_services = rte_calloc("rte_services", RTE_SERVICE_NUM_MAX,
110 sizeof(struct rte_service_spec_impl),
111 RTE_CACHE_LINE_SIZE);
113 printf("error allocating rte services array\n");
// One zero-initialized record per possible lcore.
117 lcore_states = rte_calloc("rte_service_core_states", RTE_MAX_LCORE,
118 sizeof(struct core_state), RTE_CACHE_LINE_SIZE);
120 printf("error allocating core states array\n");
// Pick up the lcores whose role in lcore_config is already ROLE_SERVICE.
126 struct rte_config *cfg = rte_eal_get_configuration();
127 for (i = 0; i < RTE_MAX_LCORE; i++) {
128 if (lcore_config[i].core_role == ROLE_SERVICE) {
// The master lcore is singled out; presumably it is skipped - confirm.
129 if ((unsigned int)i == cfg->master_lcore)
131 rte_service_lcore_add(i);
136 rte_service_library_initialized = 1;
// Both arrays are released here; presumably this is the failure path taken
// after an allocation error - confirm.
140 rte_free(rte_services);
142 rte_free(lcore_states);
// Tests the REGISTERED flag of slot id. The index is not range-checked
// here, so callers must pass id < RTE_SERVICE_NUM_MAX.
146 /* returns 1 if service is registered and has not been unregistered
147 * Returns 0 if service never registered, or has been unregistered
150 service_valid(uint32_t id)
152 return !!(rte_services[id].internal_flags & SERVICE_F_REGISTERED);
155 /* validate ID and retrieve service pointer, or return error value */
// The range check comes first so service_valid never indexes out of bounds.
// On success, service is assigned the address of rte_services[id].
// NOTE(review): id is expanded without parentheses and evaluated more than
// once, so arguments with side effects are unsafe.
156 #define SERVICE_VALID_GET_OR_ERR_RET(id, service, retval) do { \
157 if (id >= RTE_SERVICE_NUM_MAX || !service_valid(id)) \
159 service = &rte_services[id]; \
162 /* returns 1 if statistics should be collected for service
163 * Returns 0 if statistics should not be collected for service
// Reads the STATS_ENABLED flag of impl and normalizes it to 0 or 1.
// impl is dereferenced unconditionally and must not be NULL.
166 service_stats_enabled(struct rte_service_spec_impl *impl)
168 return !!(impl->internal_flags & SERVICE_F_STATS_ENABLED);
// Returns 1 when the service spec advertises RTE_SERVICE_CAP_MT_SAFE in its
// capabilities, otherwise 0. s must not be NULL.
172 service_mt_safe(struct rte_service_spec_impl *s)
174 return !!(s->spec.capabilities & RTE_SERVICE_CAP_MT_SAFE);
// Turn statistics collection for service id on or off by setting or
// clearing SERVICE_F_STATS_ENABLED; which of the two statements runs is
// presumably selected by enabled - confirm.
// NOTE(review): the validation macro is given 0 as its error value, so an
// invalid id is indistinguishable from success, unlike the -EINVAL used by
// most other entry points in this file - confirm this is intended.
177 int32_t rte_service_set_stats_enable(uint32_t id, int32_t enabled)
179 struct rte_service_spec_impl *s;
180 SERVICE_VALID_GET_OR_ERR_RET(id, s, 0);
183 s->internal_flags |= SERVICE_F_STATS_ENABLED;
185 s->internal_flags &= ~(SERVICE_F_STATS_ENABLED);
// Enable or disable the mapped-core check for service id by setting or
// clearing SERVICE_F_START_CHECK. While the flag is set,
// rte_service_runstate_get reports running only if a core is mapped.
// NOTE(review): the validation macro is given 0 as its error value, so an
// invalid id is indistinguishable from success - confirm this is intended.
190 int32_t rte_service_set_runstate_mapped_check(uint32_t id, int32_t enabled)
192 struct rte_service_spec_impl *s;
193 SERVICE_VALID_GET_OR_ERR_RET(id, s, 0);
196 s->internal_flags |= SERVICE_F_START_CHECK;
198 s->internal_flags &= ~(SERVICE_F_START_CHECK);
// Returns the current value of the file-scope rte_service_count counter.
204 rte_service_get_count(void)
206 return rte_service_count;
// Look up a registered service by name: walks every slot and compares name
// with strcmp against the spec name of each valid slot.
// What is written through service_id and the return codes are not visible
// here - confirm against the public header.
209 int32_t rte_service_get_by_name(const char *name, uint32_t *service_id)
215 for (i = 0; i < RTE_SERVICE_NUM_MAX; i++) {
// service_valid is tested first so unregistered slots are never compared.
216 if (service_valid(i) &&
217 strcmp(name, rte_services[i].spec.name) == 0) {
// Validates id and resolves the service slot. The error value handed to the
// validation macro is 0, presumably a null pointer for this name getter -
// confirm against the declared return type.
227 rte_service_get_name(uint32_t id)
229 struct rte_service_spec_impl *s;
230 SERVICE_VALID_GET_OR_ERR_RET(id, s, 0);
// Returns 1 if any bit of capability is set in the capabilities of service
// id, 0 if none is. -EINVAL is the error value given to the validation
// macro for an out-of-range or unregistered id.
235 rte_service_probe_capability(uint32_t id, uint32_t capability)
237 struct rte_service_spec_impl *s;
238 SERVICE_VALID_GET_OR_ERR_RET(id, s, -EINVAL);
239 return !!(s->spec.capabilities & capability);
// Register a service component. A spec with a NULL callback or an empty
// name is rejected, then the slots are scanned for one that is not
// registered, and the chosen slot is flagged REGISTERED with the
// mapped-core start check enabled by default.
// NOTE(review): spec itself is dereferenced without a NULL check.
243 rte_service_component_register(const struct rte_service_spec *spec,
247 int32_t free_slot = -1;
249 if (spec->callback == NULL || strlen(spec->name) == 0)
252 for (i = 0; i < RTE_SERVICE_NUM_MAX; i++) {
253 if (!service_valid(i)) {
// Taken when no free slot was found or the scan ran off the end.
259 if ((free_slot < 0) || (i == RTE_SERVICE_NUM_MAX))
262 struct rte_service_spec_impl *s = &rte_services[free_slot];
264 s->internal_flags |= SERVICE_F_REGISTERED | SERVICE_F_START_CHECK;
// Unregister service id: clears the REGISTERED flag, removes the service bit
// from the service_mask of every lcore, then zeroes the whole slot.
// The shift by id is in range because the validation macro has already
// ensured id < RTE_SERVICE_NUM_MAX.
276 rte_service_component_unregister(uint32_t id)
279 struct rte_service_spec_impl *s;
280 SERVICE_VALID_GET_OR_ERR_RET(id, s, -EINVAL);
285 s->internal_flags &= ~(SERVICE_F_REGISTERED);
287 /* clear the run-bit in all cores */
288 for (i = 0; i < RTE_MAX_LCORE; i++)
289 lcore_states[i].service_mask &= ~(UINT64_C(1) << id);
// Zeroing the slot also resets its flags, lock and counters for reuse.
291 memset(&rte_services[id], 0, sizeof(struct rte_service_spec_impl));
// Set the component-side runstate of service id to RUNNING or STOPPED;
// which assignment runs is presumably selected by runstate - confirm.
// The service only executes when the application-side runstate is also
// RUNNING (see service_run).
297 rte_service_component_runstate_set(uint32_t id, uint32_t runstate)
299 struct rte_service_spec_impl *s;
300 SERVICE_VALID_GET_OR_ERR_RET(id, s, -EINVAL);
303 s->comp_runstate = RUNSTATE_RUNNING;
305 s->comp_runstate = RUNSTATE_STOPPED;
// Set the application-side runstate of service id to RUNNING or STOPPED;
// which assignment runs is presumably selected by runstate - confirm.
// The service only executes when the component-side runstate is also
// RUNNING (see service_run).
312 rte_service_runstate_set(uint32_t id, uint32_t runstate)
314 struct rte_service_spec_impl *s;
315 SERVICE_VALID_GET_OR_ERR_RET(id, s, -EINVAL);
318 s->app_runstate = RUNSTATE_RUNNING;
320 s->app_runstate = RUNSTATE_STOPPED;
// Report whether service id is effectively running. Returns 1 only when both
// the application and component runstates are RUNNING and either the
// start check is disabled or at least one lcore is mapped; otherwise 0.
// -EINVAL is the error value given to the validation macro.
327 rte_service_runstate_get(uint32_t id)
329 struct rte_service_spec_impl *s;
330 SERVICE_VALID_GET_OR_ERR_RET(id, s, -EINVAL);
333 int check_disabled = !(s->internal_flags & SERVICE_F_START_CHECK);
334 int lcore_mapped = (rte_atomic32_read(&s->num_mapped_cores) > 0);
// Bitwise OR is safe below because both operands are already 0 or 1.
336 return (s->app_runstate == RUNSTATE_RUNNING) &&
337 (s->comp_runstate == RUNSTATE_RUNNING) &&
338 (check_disabled | lcore_mapped);
// Invoke the callback of service s with its registered userdata.
// With statistics enabled, the call is bracketed by rte_rdtsc reads, the
// elapsed cycles are added to s->cycles_spent and the per-core counter for
// service_idx is incremented; otherwise the callback is simply called.
// The callback return value is not used in the lines visible here.
342 rte_service_runner_do_callback(struct rte_service_spec_impl *s,
343 struct core_state *cs, uint32_t service_idx)
345 void *userdata = s->spec.callback_userdata;
347 if (service_stats_enabled(s)) {
348 uint64_t start = rte_rdtsc();
349 s->spec.callback(userdata);
350 uint64_t end = rte_rdtsc();
351 s->cycles_spent += end - start;
352 cs->calls_per_service[service_idx]++;
355 s->spec.callback(userdata);
// Attempt one execution of service i on behalf of core cs.
// The service is considered only if it is registered, both of its runstates
// are RUNNING, and bit i is set in service_mask. Return codes for the
// skipped cases are not visible here.
359 static inline int32_t
360 service_run(uint32_t i, struct core_state *cs, uint64_t service_mask)
362 if (!service_valid(i))
364 struct rte_service_spec_impl *s = &rte_services[i];
365 if (s->comp_runstate != RUNSTATE_RUNNING ||
366 s->app_runstate != RUNSTATE_RUNNING ||
367 !(service_mask & (UINT64_C(1) << i)))
370 /* check do we need cmpset, if MT safe or <= 1 core
371 * mapped, atomic ops are not required.
// use_atomics is true only for a service that is not MT safe and has more
// than one core mapped; presumably it selects the locked path - confirm.
373 const int use_atomics = (service_mt_safe(s) == 0) &&
374 (rte_atomic32_read(&s->num_mapped_cores) > 1);
// Try to move execute_lock from 0 to 1; a failed swap means another core
// is currently running this callback.
376 if (!rte_atomic32_cmpset((uint32_t *)&s->execute_lock, 0, 1))
379 rte_service_runner_do_callback(s, cs, i);
// Release the lock only after the callback has returned.
380 rte_atomic32_clear(&s->execute_lock);
// Second call site: the callback is run without touching execute_lock.
382 rte_service_runner_do_callback(s, cs, i);
// Run one iteration of service id on the calling lcore.
// When serialize_mt_unsafe is nonzero the caller is temporarily counted in
// num_mapped_cores, so that a service that is not MT safe and already has
// another core counted is not run concurrently. The counter is decremented
// again on every exit path visible here.
// NOTE(review): rte_lcore_id() indexes lcore_states without a range check;
// confirm this is only called from threads with a valid lcore ID.
387 int32_t rte_service_run_iter_on_app_lcore(uint32_t id,
388 uint32_t serialize_mt_unsafe)
390 /* run service on calling core, using all-ones as the service mask */
391 if (!service_valid(id))
394 struct core_state *cs = &lcore_states[rte_lcore_id()];
395 struct rte_service_spec_impl *s = &rte_services[id];
397 /* Atomically add this core to the mapped cores first, then examine if
398 * we can run the service. This avoids a race condition between
399 * checking the value, and atomically adding to the mapped count.
401 if (serialize_mt_unsafe)
402 rte_atomic32_inc(&s->num_mapped_cores);
// Refuse to run when the service is not MT safe and more than one core is
// counted; the value returned on this path is not visible here.
404 if (service_mt_safe(s) == 0 &&
405 rte_atomic32_read(&s->num_mapped_cores) > 1) {
406 if (serialize_mt_unsafe)
407 rte_atomic32_dec(&s->num_mapped_cores);
// UINT64_MAX has every bit set, so the mask test in service_run passes.
411 int ret = service_run(id, cs, UINT64_MAX);
413 if (serialize_mt_unsafe)
414 rte_atomic32_dec(&s->num_mapped_cores);
// Polling loop launched on a service lcore by rte_service_lcore_start.
// While the runstate of this core is RUNNING, it snapshots the core
// service_mask once per pass and offers every service slot to service_run.
// After the loop exits the lcore state is set to WAIT.
420 rte_service_runner_func(void *arg)
424 const int lcore = rte_lcore_id();
425 struct core_state *cs = &lcore_states[lcore];
427 while (lcore_states[lcore].runstate == RUNSTATE_RUNNING) {
// Mask changes made during a pass take effect on the next pass.
428 const uint64_t service_mask = cs->service_mask;
430 for (i = 0; i < RTE_SERVICE_NUM_MAX; i++) {
431 /* return value ignored as no change to code flow */
432 service_run(i, cs, service_mask);
438 lcore_config[lcore].state = WAIT;
// Counts service cores by summing is_service_core over all RTE_MAX_LCORE
// entries; set_lcore_state stores that field as 0 or 1.
444 rte_service_lcore_count(void)
448 for (i = 0; i < RTE_MAX_LCORE; i++)
449 count += lcore_states[i].is_service_core;
// Collect the lcore IDs of all service cores by scanning lcore_states.
// n is presumably the capacity of array, and the return value is used by
// rte_service_start_with_defaults as the number of cores written - confirm
// both against the public header.
454 rte_service_lcore_list(uint32_t array[], uint32_t n)
456 uint32_t count = rte_service_lcore_count();
465 for (i = 0; i < RTE_MAX_LCORE; i++) {
466 struct core_state *cs = &lcore_states[i];
467 if (cs->is_service_core) {
// Returns the number of services mapped to lcore, computed as the population
// count of its 64-bit service_mask. lcore is range-checked and tested for
// being a service core first; the error values are not visible here.
477 rte_service_lcore_count_services(uint32_t lcore)
479 if (lcore >= RTE_MAX_LCORE)
482 struct core_state *cs = &lcore_states[lcore];
483 if (!cs->is_service_core)
// __builtin_popcountll is a compiler builtin (GCC and Clang).
486 return __builtin_popcountll(cs->service_mask);
// Start all service cores, map each service to one of them and set each
// service application runstate to running.
// NOTE(review): the mapping loop visits IDs 0 to count-1, which assumes
// registered services occupy a dense range of slots; a hole left by an
// unregister could leave a higher ID unmapped - confirm.
490 rte_service_start_with_defaults(void)
492 /* create a default mapping from cores to services, then start the
493 * services to make them transparent to unaware applications.
497 uint32_t count = rte_service_get_count();
499 int32_t lcore_iter = 0;
// ids receives the service core list; lcore_count is how many were found.
500 uint32_t ids[RTE_MAX_LCORE] = {0};
501 int32_t lcore_count = rte_service_lcore_list(ids, RTE_MAX_LCORE);
503 if (lcore_count == 0)
// Launch the polling loop on every service core before mapping services.
506 for (i = 0; (int)i < lcore_count; i++)
507 rte_service_lcore_start(ids[i]);
509 for (i = 0; i < count; i++) {
510 /* do 1:1 core mapping here, with each service getting
511 * assigned a single core by default. Adding multiple services
512 * should multiplex to a single core, or 1:1 if there are the
513 * same amount of services as service-cores
515 ret = rte_service_map_lcore_set(i, ids[lcore_iter], 1);
// lcore_iter presumably advances per service and wraps to 0 here - confirm.
520 if (lcore_iter >= lcore_count)
523 ret = rte_service_runstate_set(i, 1);
// Shared helper behind rte_service_map_lcore_set and
// rte_service_map_lcore_get. It finds the slot index of service, validates
// lcore, optionally changes the mapping bit and optionally reports it.
// Callers in this file pass a null pointer for whichever of set or enabled
// they do not use, so the dereferences below are presumably guarded by
// checks that are not visible here - confirm.
532 service_update(struct rte_service_spec *service, uint32_t lcore,
533 uint32_t *set, uint32_t *enabled)
538 for (i = 0; i < RTE_SERVICE_NUM_MAX; i++) {
// Address comparison works because spec is the first member of the slot.
539 if ((struct rte_service_spec *)&rte_services[i] == service &&
546 if (sid == -1 || lcore >= RTE_MAX_LCORE)
549 if (!lcore_states[lcore].is_service_core)
552 uint64_t sid_mask = UINT64_C(1) << sid;
554 uint64_t lcore_mapped = lcore_states[lcore].service_mask &
// num_mapped_cores changes only when the mask bit actually flips, so
// repeated set or clear requests do not skew the count.
557 if (*set && !lcore_mapped) {
558 lcore_states[lcore].service_mask |= sid_mask;
559 rte_atomic32_inc(&rte_services[sid].num_mapped_cores);
561 if (!*set && lcore_mapped) {
562 lcore_states[lcore].service_mask &= ~(sid_mask);
563 rte_atomic32_dec(&rte_services[sid].num_mapped_cores);
// Report the mapping state after any change, normalized to 0 or 1.
568 *enabled = !!(lcore_states[lcore].service_mask & (sid_mask));
// Map (enabled > 0) or unmap (enabled == 0) service id on lcore.
// enabled is normalized to 0 or 1 and passed to service_update as the set
// request; no state is read back, so the enabled pointer argument is 0.
// -EINVAL is the error value given to the validation macro.
576 rte_service_map_lcore_set(uint32_t id, uint32_t lcore, uint32_t enabled)
578 struct rte_service_spec_impl *s;
579 SERVICE_VALID_GET_OR_ERR_RET(id, s, -EINVAL);
580 uint32_t on = enabled > 0;
581 return service_update(&s->spec, lcore, &on, 0);
// Query whether service id is mapped to lcore by calling service_update
// with no set request and a pointer that receives the mapping state.
// How ret and enabled are combined into the return value is not visible
// here.
585 rte_service_map_lcore_get(uint32_t id, uint32_t lcore)
587 struct rte_service_spec_impl *s;
588 SERVICE_VALID_GET_OR_ERR_RET(id, s, -EINVAL);
590 int ret = service_update(&s->spec, lcore, 0, &enabled);
// Record the role state for lcore in three places so they stay in step:
// the rte_config role table, the lcore_config entry and the is_service_core
// flag in lcore_states. lcore is not range-checked here; callers do that.
597 set_lcore_state(uint32_t lcore, int32_t state)
599 /* mark core state in hugepage backed config */
600 struct rte_config *cfg = rte_eal_get_configuration();
601 cfg->lcore_role[lcore] = state;
603 /* mark state in process local lcore_config */
604 lcore_config[lcore].core_role = state;
606 /* update per-lcore optimized state tracking */
607 lcore_states[lcore].is_service_core = (state == ROLE_SERVICE);
// Return every service core to ROLE_RTE with an empty service mask and a
// STOPPED runstate, then zero num_mapped_cores for all service slots so the
// counts agree with the now-empty masks.
610 int32_t rte_service_lcore_reset_all(void)
612 /* loop over cores, reset all to mask 0 */
614 for (i = 0; i < RTE_MAX_LCORE; i++) {
615 if (lcore_states[i].is_service_core) {
616 lcore_states[i].service_mask = 0;
// set_lcore_state also clears is_service_core for this lcore.
617 set_lcore_state(i, ROLE_RTE);
618 lcore_states[i].runstate = RUNSTATE_STOPPED;
621 for (i = 0; i < RTE_SERVICE_NUM_MAX; i++)
622 rte_atomic32_set(&rte_services[i].num_mapped_cores, 0);
// Turn lcore into a service core: its role is set to ROLE_SERVICE, its
// service mask is cleared and its runstate is set to STOPPED.
// The two leading checks cover an out-of-range lcore and a core that is
// already a service core; their return values are not visible here.
// Returns the result of rte_eal_wait_lcore for that lcore.
630 rte_service_lcore_add(uint32_t lcore)
632 if (lcore >= RTE_MAX_LCORE)
634 if (lcore_states[lcore].is_service_core)
637 set_lcore_state(lcore, ROLE_SERVICE);
639 /* ensure that after adding a core the mask and state are defaults */
640 lcore_states[lcore].service_mask = 0;
641 lcore_states[lcore].runstate = RUNSTATE_STOPPED;
645 return rte_eal_wait_lcore(lcore);
// Remove the service-core role from lcore by resetting it to ROLE_RTE.
// Three guards come first: lcore out of range, lcore not a service core,
// and runstate not STOPPED. The values returned for them are not visible
// here.
649 rte_service_lcore_del(uint32_t lcore)
651 if (lcore >= RTE_MAX_LCORE)
654 struct core_state *cs = &lcore_states[lcore];
655 if (!cs->is_service_core)
658 if (cs->runstate != RUNSTATE_STOPPED)
661 set_lcore_state(lcore, ROLE_RTE);
// Start polling on a service core: marks its runstate RUNNING and launches
// rte_service_runner_func on lcore through rte_eal_remote_launch.
// Guards cover an out-of-range lcore, a core that is not a service core and
// a core that is already RUNNING; their return values are not visible here.
668 rte_service_lcore_start(uint32_t lcore)
670 if (lcore >= RTE_MAX_LCORE)
673 struct core_state *cs = &lcore_states[lcore];
674 if (!cs->is_service_core)
677 if (cs->runstate == RUNSTATE_RUNNING)
680 /* set core to run state first, and then launch otherwise it will
681 * return immediately as runstate keeps it in the service poll loop
683 lcore_states[lcore].runstate = RUNSTATE_RUNNING;
685 int ret = rte_eal_remote_launch(rte_service_runner_func, 0, lcore);
686 /* returns -EBUSY if the core is already launched, 0 on success */
// Request that the polling loop on lcore stops by setting its runstate to
// STOPPED. Before doing so, every service slot is examined, and the stop is
// refused if this core is the only one mapped to a running service.
// NOTE(review): is_service_core is not tested in the lines visible here.
691 rte_service_lcore_stop(uint32_t lcore)
693 if (lcore >= RTE_MAX_LCORE)
696 if (lcore_states[lcore].runstate == RUNSTATE_STOPPED)
700 uint64_t service_mask = lcore_states[lcore].service_mask;
701 for (i = 0; i < RTE_SERVICE_NUM_MAX; i++) {
// NOTE(review): the 64-bit mask test is narrowed to int32_t. On typical
// compilers a set bit at position 32 or above is truncated away, so enabled
// reads as 0 for services 32 to 63 and they never block the stop. Consider
// normalizing the test with !! before storing it.
702 int32_t enabled = service_mask & (UINT64_C(1) << i);
703 int32_t service_running = rte_service_runstate_get(i);
704 int32_t only_core = (1 ==
705 rte_atomic32_read(&rte_services[i].num_mapped_cores));
707 /* if the core is mapped, and the service is running, and this
708 * is the only core that is mapped, the service would cease to
709 * run if this core stopped, so fail instead.
711 if (enabled && service_running && only_core)
// The runner loop polls this field and exits once it reads STOPPED.
715 lcore_states[lcore].runstate = RUNSTATE_STOPPED;
// Print a one-line summary of service s to f: name, whether statistics are
// enabled, call count, total cycles and average cycles per call.
// The uses of all_cycles and reset are not visible here.
721 rte_service_dump_one(FILE *f, struct rte_service_spec_impl *s,
722 uint64_t all_cycles, uint32_t reset)
724 /* avoid divide by zero */
// calls is the local divisor prepared for the average; per the comment
// above it is presumably forced to be nonzero - confirm.
732 fprintf(f, " %s: stats %d\tcalls %"PRIu64"\tcycles %"
733 PRIu64"\tavg: %"PRIu64"\n",
734 s->spec.name, service_stats_enabled(s), s->calls,
735 s->cycles_spent, s->cycles_spent / calls);
// Print one tab-separated row to f for lcore: the lcore ID followed by its
// calls_per_service counter for each registered service slot.
// The counter is zeroed after printing, presumably only when reset is
// nonzero - confirm.
// NOTE(review): lcore is uint32_t but is printed with %02d.
744 service_dump_calls_per_lcore(FILE *f, uint32_t lcore, uint32_t reset)
747 struct core_state *cs = &lcore_states[lcore];
749 fprintf(f, "%02d\t", lcore);
750 for (i = 0; i < RTE_SERVICE_NUM_MAX; i++) {
751 if (!service_valid(i))
753 fprintf(f, "%"PRIu64"\t", cs->calls_per_service[i]);
755 cs->calls_per_service[i] = 0;
// Write service statistics to f. An id of UINT32_MAX selects every
// registered service; any other id selects that single service and is
// validated with -EINVAL as the error value.
// In the all-services case a per-core table of call counts follows for the
// lcores whose role is ROLE_SERVICE.
760 int32_t rte_service_dump(FILE *f, uint32_t id)
763 int print_one = (id != UINT32_MAX);
765 uint64_t total_cycles = 0;
// Sum cycles over all registered services; the total is handed to
// rte_service_dump_one.
767 for (i = 0; i < RTE_SERVICE_NUM_MAX; i++) {
768 if (!service_valid(i))
770 total_cycles += rte_services[i].cycles_spent;
773 /* print only the specified service */
775 struct rte_service_spec_impl *s;
776 SERVICE_VALID_GET_OR_ERR_RET(id, s, -EINVAL);
777 fprintf(f, "Service %s Summary\n", s->spec.name);
779 rte_service_dump_one(f, s, total_cycles, reset);
783 /* print all services, as UINT32_MAX was passed as id */
784 fprintf(f, "Services Summary\n");
785 for (i = 0; i < RTE_SERVICE_NUM_MAX; i++) {
786 if (!service_valid(i))
789 rte_service_dump_one(f, &rte_services[i], total_cycles, reset);
792 fprintf(f, "Service Cores Summary\n");
793 for (i = 0; i < RTE_MAX_LCORE; i++) {
// Role is read from lcore_config here rather than from lcore_states.
794 if (lcore_config[i].core_role != ROLE_SERVICE)
798 service_dump_calls_per_lcore(f, i, reset);