2 * Copyright (c) 2015 Cisco and/or its affiliates.
3 * Licensed under the Apache License, Version 2.0 (the "License");
4 * you may not use this file except in compliance with the License.
5 * You may obtain a copy of the License at:
7 * http://www.apache.org/licenses/LICENSE-2.0
9 * Unless required by applicable law or agreed to in writing, software
10 * distributed under the License is distributed on an "AS IS" BASIS,
11 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 * See the License for the specific language governing permissions and
13 * limitations under the License.
16 #include <vppinfra/format.h>
17 #include <vppinfra/dlmalloc.h>
18 #include <vppinfra/os.h>
19 #include <vppinfra/lock.h>
20 #include <vppinfra/hash.h>
21 #include <vppinfra/elf_clib.h>
22 #include <vppinfra/sanitizer.h>
/* Two tables of heap pointers, sized by CLIB_MAX_MHEAPS and CLIB_MAX_NUMAS.
   Presumably indexed by CPU/thread and by NUMA node respectively, as the
   names suggest -- confirm against the code that fills them. */
24 void *clib_per_cpu_mheaps[CLIB_MAX_MHEAPS];
25 void *clib_per_numa_mheaps[CLIB_MAX_NUMAS];
29 /* Addresses of callers: outermost first, innermost last. */
32 /* Count of allocations with this traceback. */
35 /* Count of bytes allocated with this traceback. */
38 /* Heap offset of a sample allocation with this traceback. */
/* Vector of trace records; addressed as traces + trace_index. */
47 mheap_trace_t *traces;
49 /* Indices of trace records that are free for reuse. */
52 /* Hash table mapping callers to trace index. */
53 uword *trace_by_callers;
55 /* Hash table mapping mheap offset to trace index. */
56 uword *trace_index_by_offset;
58 /* Heap currently being traced, if any; kept so the trace can easily be shut off. */
59 void *current_traced_mheap;
/* Global trace state; the tracing functions in this file reach it through
   &mheap_trace_main. */
63 mheap_trace_main_t mheap_trace_main;
/* Account for an allocation at heap offset `offset` in the trace tables.
   The call stack is captured with clib_backtrace() and used as the key into
   tm->trace_by_callers.  The trace record found or created for that key has
   its allocation count incremented, remembers `offset` as a sample, and
   `offset` is mapped to the record's index in tm->trace_index_by_offset.
   Table updates are bracketed by tm->lock.
   `size` is presumably the allocation's byte count accumulated into the
   record's n_bytes -- confirm. */
66 mheap_get_trace (uword offset, uword size)
68 mheap_trace_main_t *tm = &mheap_trace_main;
70 uword i, n_callers, trace_index, *p;
/* Guard: tracing is disabled, or the current heap is not the traced heap. */
74 if (tm->enabled == 0 || (clib_mem_get_heap () != tm->current_traced_mheap))
77 /* Zero the local trace record; silences spurious Coverity warnings. */
78 clib_memset (&trace, 0, sizeof (trace));
80 /* Skip our frame and mspace_get_aligned's frame */
81 n_callers = clib_backtrace (trace.callers, ARRAY_LEN (trace.callers), 2);
85 clib_spinlock_lock (&tm->lock);
87 /* Turn off tracing while the tables are updated; the saved flag is
   written back just before the lock is released. */
88 save_enabled = tm->enabled;
/* Create the callers -> trace index hash on first use; keys are the whole
   trace.callers array. */
91 if (!tm->trace_by_callers)
92 tm->trace_by_callers =
93 hash_create_shmem (0, sizeof (trace.callers), sizeof (uword));
/* Look up an existing record for this call stack. */
95 p = hash_get_mem (tm->trace_by_callers, &trace.callers);
99 t = tm->traces + trace_index;
/* Recycle a slot: take the last index on trace_free_list and shrink the
   list by one. */
103 i = vec_len (tm->trace_free_list);
106 trace_index = tm->trace_free_list[i - 1];
107 _vec_len (tm->trace_free_list) = i - 1;
/* Appending can move the tm->traces vector.  The old bounds are captured so
   that hash keys pointing into the old storage can be rebased onto the new
   storage. */
111 mheap_trace_t *old_start = tm->traces;
112 mheap_trace_t *old_end = vec_end (tm->traces);
114 vec_add2 (tm->traces, t, 1);
116 if (tm->traces != old_start)
121 hash_foreach_pair (p, tm->trace_by_callers,
123 q = uword_to_pointer (p->key, mheap_trace_t *);
124 ASSERT (q >= old_start && q < old_end);
125 p->key = pointer_to_uword (tm->traces + (q - old_start));
129 trace_index = t - tm->traces;
132 t = tm->traces + trace_index;
134 t->n_allocations = 0;
/* Key the hash on the record's own callers array. */
136 hash_set_mem (tm->trace_by_callers, t->callers, trace_index);
139 t->n_allocations += 1;
141 t->offset = offset; /* keep a sample to autopsy */
/* Remember which record owns this offset; mheap_put_trace looks it up. */
142 hash_set (tm->trace_index_by_offset, offset, t - tm->traces);
143 tm->enabled = save_enabled;
144 clib_spinlock_unlock (&tm->lock);
/* Undo the trace accounting for the allocation at heap offset `offset`.
   Its trace index is looked up in tm->trace_index_by_offset and the mapping
   is removed.  The record's allocation count is decremented, and once the
   count reaches zero the record is unhashed, pushed on the free list and
   cleared.  `size` is checked against the record's n_bytes by an ASSERT. */
148 mheap_put_trace (uword offset, uword size)
151 uword trace_index, *p;
152 mheap_trace_main_t *tm = &mheap_trace_main;
/* Guard: tracing is disabled. */
155 if (tm->enabled == 0)
158 clib_spinlock_lock (&tm->lock);
160 /* Turn off tracing for a moment */
161 save_enabled = tm->enabled;
164 p = hash_get (tm->trace_index_by_offset, offset);
/* First of two restore/unlock pairs in this function; presumably the exit
   taken when `offset` has no entry -- confirm. */
167 tm->enabled = save_enabled;
168 clib_spinlock_unlock (&tm->lock);
173 hash_unset (tm->trace_index_by_offset, offset);
174 ASSERT (trace_index < vec_len (tm->traces));
176 t = tm->traces + trace_index;
177 ASSERT (t->n_allocations > 0);
178 ASSERT (t->n_bytes >= size);
179 t->n_allocations -= 1;
/* No allocations left for this traceback: drop its callers key, make the
   slot available for reuse and zero the record. */
181 if (t->n_allocations == 0)
183 hash_unset_mem (tm->trace_by_callers, t->callers);
184 vec_add1 (tm->trace_free_list, trace_index);
185 clib_memset (t, 0, sizeof (t[0]));
187 tm->enabled = save_enabled;
188 clib_spinlock_unlock (&tm->lock);
/* Free the four trace containers held by `tm`: the traces and trace_free_list
   vectors and the trace_by_callers and trace_index_by_offset hash tables. */
192 mheap_trace_main_free (mheap_trace_main_t * tm)
194 vec_free (tm->traces);
195 vec_free (tm->trace_free_list);
196 hash_free (tm->trace_by_callers);
197 hash_free (tm->trace_index_by_offset);
200 /* Initialize CLIB heap based on memory/size given by user.
201 Set memory to 0 and CLIB will try to allocate its own heap. */
/* Parameters:
     memory      - base of a caller-supplied region, or 0 (see above).
     memory_size - size passed to the mspace constructor.
     set_heap    - the wrappers in this file pass 1 to request
                   clib_mem_set_heap and 0 to suppress it. */
203 clib_mem_init_internal (void *memory, uword memory_size, int set_heap)
/* Build the mspace on the supplied region (locked = 1) and disable its
   expansion. */
209 heap = create_mspace_with_base (memory, memory_size, 1 /* locked */ );
210 mspace_disable_expand (heap);
/* Alternative: create an mspace of memory_size with no supplied base. */
213 heap = create_mspace (memory_size, 1 /* locked */ );
/* Poison the heap's footprint, starting at its least address. */
215 CLIB_MEM_POISON (mspace_least_addr (heap), mspace_footprint (heap));
218 clib_mem_set_heap (heap);
/* Initialize the trace lock only while it is still 0, so repeated heap
   initialization does not re-create it. */
220 if (mheap_trace_main.lock == 0)
221 clib_spinlock_init (&mheap_trace_main.lock);
/* Initialize a heap by forwarding `memory` and `memory_size` to
   clib_mem_init_internal with set_heap = 1, and return its result. */
227 clib_mem_init (void *memory, uword memory_size)
229 return clib_mem_init_internal (memory, memory_size,
230 1 /* do clib_mem_set_heap */ );
/* Makes the same call as clib_mem_init: forwards `memory` and `memory_size`
   to clib_mem_init_internal with set_heap = 1 and returns its result. */
234 clib_mem_init_thread_safe (void *memory, uword memory_size)
236 return clib_mem_init_internal (memory, memory_size,
237 1 /* do clib_mem_set_heap */ );
/* Create a heap without making it the current heap (set_heap = 0).
   Before that, a region of memory_size bytes is requested from
   clib_mem_vm_ext_alloc with CLIB_MEM_VM_F_NUMA_FORCE on node `numa`; an
   allocation error is reported through clib_error_report. */
241 clib_mem_init_thread_safe_numa (void *memory, uword memory_size, u8 numa)
243 clib_mem_vm_alloc_t alloc = { 0 };
247 alloc.size = memory_size;
248 alloc.flags = CLIB_MEM_VM_F_NUMA_FORCE;
249 alloc.numa_node = numa;
250 if ((err = clib_mem_vm_ext_alloc (&alloc)))
252 clib_error_report (err);
/* NOTE(review): the region obtained into `alloc` above is not referenced by
   this call, which is given `memory` instead -- confirm this is intended. */
256 heap = clib_mem_init_internal (memory, memory_size,
257 0 /* do NOT clib_mem_set_heap */ );
/* format() callback.  Reads one int (`verbose`) from the va_list and appends
   a placeholder line containing the current heap address and the verbose
   value. */
265 format_clib_mem_usage (u8 * s, va_list * va)
267 int verbose = va_arg (*va, int);
268 return format (s, "$$$$ heap at %llx verbose %d", clib_mem_get_heap (),
273 * Magic decoder ring for mallinfo stats (ala dlmalloc):
275 * size_t arena; / * Non-mmapped space allocated (bytes) * /
276 * size_t ordblks; / * Number of free chunks * /
277 * size_t smblks; / * Number of free fastbin blocks * /
278 * size_t hblks; / * Number of mmapped regions * /
279 * size_t hblkhd; / * Space allocated in mmapped regions (bytes) * /
280 * size_t usmblks; / * Maximum total allocated space (bytes) * /
281 * size_t fsmblks; / * Space in freed fastbin blocks (bytes) * /
282 * size_t uordblks; / * Total allocated space (bytes) * /
283 * size_t fordblks; / * Total free space (bytes) * /
284 * size_t keepcost; / * Top-most, releasable space (bytes) * /
/* format() callback.  Reads one uword from the va_list and appends it as a
   size: divided by 2^30, 2^20 or 2^10 and printed with two decimals and a
   G, M or K suffix, or printed as a plain integer. */
289 format_msize (u8 * s, va_list * va)
291 uword a = va_arg (*va, uword);
294 s = format (s, "%.2fG", (((f64) a) / ((f64) (1ULL << 30))));
295 else if (a >= 1ULL << 20)
296 s = format (s, "%.2fM", (((f64) a) / ((f64) (1ULL << 20))));
297 else if (a >= 1ULL << 10)
298 s = format (s, "%.2fK", (((f64) a) / ((f64) (1ULL << 10))));
/* Unscaled value, no suffix. */
300 s = format (s, "%lld", a);
/* qsort() comparator over mheap_trace_t records.  Both differences are taken
   as t2 - t1, so larger values order first.  n_bytes is compared first;
   n_allocations is presumably the tie-breaker -- confirm. */
305 mheap_trace_sort (const void *_t1, const void *_t2)
307 const mheap_trace_t *t1 = _t1;
308 const mheap_trace_t *t2 = _t2;
311 cmp = (word) t2->n_bytes - (word) t1->n_bytes;
313 cmp = (word) t2->n_allocations - (word) t1->n_allocations;
/* format() callback.  Reads a mheap_trace_main_t pointer and an int
   (`verbose`) from the va_list and appends a table of the trace records:
   bytes, count, sample offset and the traceback, followed by the total
   number of traced objects.  The records are copied and sorted with qsort
   before printing.  tm->lock is held while the table is produced. */
318 format_mheap_trace (u8 * s, va_list * va)
320 mheap_trace_main_t *tm = va_arg (*va, mheap_trace_main_t *);
321 int verbose = va_arg (*va, int);
325 clib_spinlock_lock (&tm->lock);
/* Only report when there are records and the current heap is the traced
   heap. */
326 if (vec_len (tm->traces) > 0 &&
327 clib_mem_get_heap () == tm->current_traced_mheap)
331 /* Make a copy of traces since we'll be sorting them. */
332 mheap_trace_t *t, *traces_copy;
333 u32 indent, total_objects_traced;
335 traces_copy = vec_dup (tm->traces);
337 qsort (traces_copy, vec_len (traces_copy), sizeof (traces_copy[0]),
340 total_objects_traced = 0;
341 s = format (s, "\n");
342 vec_foreach (t, traces_copy)
344 /* Skip over free elements. */
345 if (t->n_allocations == 0)
348 total_objects_traced += t->n_allocations;
350 /* When not verbose only report allocations of more than 1k. */
351 if (!verbose && t->n_bytes < 1024)
/* Column header, emitted when handling the first element of the copy. */
354 if (t == traces_copy)
355 s = format (s, "%=9s%=9s %=10s Traceback\n", "Bytes", "Count",
357 s = format (s, "%9d%9d %p", t->n_bytes, t->n_allocations, t->offset);
/* Remember the current indent for aligning the traceback lines. */
358 indent = format_get_indent (s);
/* Walk the callers until the array ends or a zero entry is reached. */
359 for (i = 0; i < ARRAY_LEN (t->callers) && t->callers[i]; i++)
362 s = format (s, "%U", format_white_space, indent);
363 #if defined(CLIB_UNIX) && !defined(__APPLE__)
364 /* $$$$ does this actually work? */
366 format (s, " %U\n", format_clib_elf_symbol_with_address,
/* Raw caller address. */
369 s = format (s, " %p\n", t->callers[i]);
374 s = format (s, "%d total traced objects\n", total_objects_traced);
376 vec_free (traces_copy);
378 clib_spinlock_unlock (&tm->lock);
379 if (have_traces == 0)
380 s = format (s, "no traced allocations\n");
/* format() callback.  Reads a heap pointer and an int (`verbose`) from the
   va_list and appends a summary built from mspace_mallinfo(): total (arena),
   used (uordblks), free (fordblks) and trimmable (keepcost) sizes, plus
   free-chunk counts and the maximum total allocated.  When the heap is
   traced, the format_mheap_trace output is appended as well. */
387 format_mheap (u8 * s, va_list * va)
389 void *heap = va_arg (*va, u8 *);
390 int verbose = va_arg (*va, int);
391 struct dlmallinfo mi;
392 mheap_trace_main_t *tm = &mheap_trace_main;
394 mi = mspace_mallinfo (heap);
396 s = format (s, "total: %U, used: %U, free: %U, trimmable: %U",
397 format_msize, mi.arena,
398 format_msize, mi.uordblks,
399 format_msize, mi.fordblks, format_msize, mi.keepcost);
/* Additional detail lines (presumably only when verbose -- confirm). */
402 s = format (s, "\n free chunks %llu free fastbin blks %llu",
403 mi.ordblks, mi.smblks);
405 format (s, "\n max total allocated %U", format_msize, mi.usmblks);
408 if (mspace_is_traced (heap))
409 s = format (s, "\n%U", format_mheap_trace, tm, verbose);
/* Not implemented: emits the "unimp" warning; `u` is not written by the
   statement below. */
414 clib_mem_usage (clib_mem_usage_t * u)
416 clib_warning ("unimp");
/* Fill `usage` from mspace_mallinfo(heap).  Only bytes_total (arena),
   bytes_used (uordblks) and bytes_free (fordblks) carry real data; the
   remaining fields are set to 0. */
420 mheap_usage (void *heap, clib_mem_usage_t * usage)
422 struct dlmallinfo mi = mspace_mallinfo (heap);
424 /* TODO: Fill in some more values */
425 usage->object_count = 0;
426 usage->bytes_total = mi.arena;
427 usage->bytes_overhead = 0;
428 usage->bytes_max = 0;
429 usage->bytes_used = mi.uordblks;
430 usage->bytes_free = mi.fordblks;
431 usage->bytes_free_reclaimed = 0;
434 /* Call serial number, intended as a handle for debugger breakpoints. */
435 uword clib_mem_validate_serial = 0;
/* Not implemented: emits the "unimp" warning. */
438 clib_mem_validate (void)
440 clib_warning ("unimp");
/* Switch tracing on mspace `v` according to `enable`; the return value of
   mspace_enable_disable_trace is deliberately discarded.  The trace tables
   are released with mheap_trace_main_free (presumably only when disabling
   -- confirm). */
444 mheap_trace (void *v, int enable)
446 (void) mspace_enable_disable_trace (v, enable);
449 mheap_trace_main_free (&mheap_trace_main);
/* Enable or disable allocation tracing on the current heap.  Stores `enable`
   in the global trace state, forwards it to mheap_trace for the current
   heap, and then either records that heap in current_traced_mheap or clears
   the field (presumably record on enable, clear on disable -- confirm). */
453 clib_mem_trace (int enable)
455 mheap_trace_main_t *tm = &mheap_trace_main;
456 void *current_heap = clib_mem_get_heap ();
458 tm->enabled = enable;
459 mheap_trace (current_heap, enable);
462 tm->current_traced_mheap = current_heap;
464 tm->current_traced_mheap = 0;
/* Return mspace_is_traced() for the current heap. */
468 clib_mem_is_traced (void)
470 return mspace_is_traced (clib_mem_get_heap ());
/* Set the global trace-enabled flag to `enable`.  Unlike clib_mem_trace, the
   statements below touch neither the mspace trace setting nor
   current_traced_mheap. */
474 clib_mem_trace_enable_disable (uword enable)
477 mheap_trace_main_t *tm = &mheap_trace_main;
480 tm->enabled = enable;
485 * These API functions seem like layering violations, but
486 * by introducing them we greatly reduce the number
487 * of code changes required to use dlmalloc spaces
/* Create a dlmalloc mspace of `size` bytes, passing `locked` through to the
   constructor.  Two forms are used: create_mspace with no base, or
   create_mspace_with_base on `memory` followed by disabling expansion
   (presumably chosen by whether `memory` is null -- confirm). */
490 mheap_alloc_with_lock (void *memory, uword size, int locked)
494 return create_mspace (size, locked);
497 rv = create_mspace_with_base (memory, size, locked);
499 mspace_disable_expand (rv);
505 * fd.io coding-style-patch-verification: ON
508 * eval: (c-set-style "gnu")