28 #define FRAME_QUEUE_NELTS 64 61 name_copy =
format (0,
"%s%c", msg_name, 0);
77 .format =
"bar-trace-%s-#%d",
78 .format_args =
"T4i4",
83 u32 caller,
count, t_entry, t_open, t_closed;
87 ed->count = (int) vlib_worker_threads[0].barrier_sync_count;
89 (vlib_worker_threads[0].barrier_caller);
90 ed->t_entry = (int) (1000000.0 * t_entry);
91 ed->t_open = (int) (1000000.0 * t_open);
92 ed->t_closed = (int) (1000000.0 * t_closed);
104 .format =
"bar-syncrec-%s-#%d",
105 .format_args =
"T4i4",
114 ed->depth = (int) vlib_worker_threads[0].recursion_level - 1;
116 (vlib_worker_threads[0].barrier_caller);
128 .format =
"bar-relrrec-#%d",
138 ed->depth = (int) vlib_worker_threads[0].recursion_level;
150 .format =
"bar-rel-#%d-e%d-u%d-t%d",
151 .format_args =
"i4i4i4i4",
156 u32 count, t_entry, t_update_main, t_closed_total;
160 ed->t_entry = (int) (1000000.0 * t_entry);
161 ed->t_update_main = (int) (1000000.0 * t_update_main);
162 ed->t_closed_total = (int) (1000000.0 * t_closed_total);
163 ed->count = (int) vlib_worker_threads[0].barrier_sync_count;
184 int pthread_setname_np (pthread_t __target_thread,
const char *__name);
186 pthread_t
thread = pthread_self ();
190 rv = pthread_setname_np (thread, name);
202 return ((
i32) ((*tr0)->no_data_structure_clone)
203 - ((
i32) ((*tr1)->no_data_structure_clone)));
212 fp = fopen (filename,
"r");
218 if (fgets ((
char *) buffer, 256, fp))
222 strlen ((
char *) buffer));
223 if (
unformat (&in,
"%U", unformat_bitmap_list, &r) != 1)
242 u32 n_vlib_mains = 1;
299 pthread_setaffinity_np (pthread_self (),
sizeof (cpu_set_t), &cpuset);
307 _vec_len (vlib_worker_threads) = 1;
312 w->
lwp = syscall (SYS_gettid);
318 struct sched_param sched_param;
319 if (!sched_getparam (w->
lwp, &sched_param))
343 first_index += tr->
count;
355 if (clib_bitmap_get(avail_cpu, c) == 0)
356 return clib_error_return (0,
"cpu %u is not available to be used" 357 " for the '%s' thread",c, tr->name);
359 avail_cpu = clib_bitmap_set(avail_cpu, c, 0);
366 for (j = 0; j < tr->
count; j++)
371 "no available cpus to be used for" 372 " the '%s' thread", tr->
name);
396 memset (fq, 0,
sizeof (*fq));
404 fformat (stderr,
"WARNING: fq->tail unaligned\n");
406 fformat (stderr,
"WARNING: fq->head unaligned\n");
408 fformat (stderr,
"WARNING: fq->elts unaligned\n");
411 fformat (stderr,
"WARNING: fq->elts[0] size %d\n",
412 sizeof (fq->
elts[0]));
413 if (nelts & (nelts - 1))
415 fformat (stderr,
"FATAL: nelts MUST be a power of 2\n");
432 vlib_frame_queue_dequeue_internal (
int thread_id,
440 u32 node_runtime_index;
460 node_runtime_index = elt->node_runtime_index;
465 case VLIB_FRAME_QUEUE_ELT_FREE_BUFFERS:
468 case VLIB_FRAME_QUEUE_ELT_FREE_FRAME:
481 case VLIB_FRAME_QUEUE_ELT_API_MSG:
485 clib_warning (
"bogus frame queue message, type %d", msg_type);
503 return vlib_frame_queue_dequeue_internal (thread_id, vm, nm);
519 new_tail = __sync_add_and_fetch (&fq->
tail, 1);
530 elt = fq->
elts + (new_tail & (fq->
nelts - 1));
541 elt->node_runtime_index = node_runtime_index;
594 w->
lwp = syscall (SYS_gettid);
609 const char *sys_cpu_path =
"/sys/devices/system/cpu/cpu";
611 int core_id = -1, socket_id = -1;
613 p =
format (p,
"%s%u/topology/core_id%c", sys_cpu_path, cpu_id, 0);
617 format (p,
"%s%u/topology/physical_package_id%c", sys_cpu_path, cpu_id,
630 void *(*fp_arg) (
void *) = fp;
641 CPU_SET (cpu_id, &cpuset);
643 if (pthread_create (&worker,
NULL , fp_arg, (
void *) w))
646 if (pthread_setaffinity_np (worker,
sizeof (cpu_set_t), &cpuset))
664 u32 worker_thread_index;
684 if (n_vlib_mains > 1)
714 worker_thread_index = 1;
728 for (k = 0; k < tr->
count; k++)
732 vec_add2 (vlib_worker_threads, w, 1);
736 #if USE_DLMALLOC == 0 755 (
char *)
format (0,
"%s %d", tr->
name, k + 1);
789 u32 save_node_runtime_index;
796 nf->
flags = save_flags;
865 (
vlib_mains[0]->error_main.counters_last_clear,
877 ASSERT (fl_orig - orig_freelist_pool
880 fl_clone[0] = fl_orig[0];
886 worker_thread_index++;
897 for (j = 0; j < tr->
count; j++)
899 vec_add2 (vlib_worker_threads, w, 1);
902 #if USE_DLMALLOC == 0 918 (
char *)
format (0,
"%s %d", tr->
name, j + 1);
926 worker_thread_index = 1;
937 for (j = 0; j < tr->
count; j++)
939 w = vlib_worker_threads + worker_thread_index++;
951 w = vlib_worker_threads + worker_thread_index++;
952 err = vlib_launch_thread_int (vlib_worker_thread_bootstrap_fn,
955 clib_error_report (err);
1009 n = nm_clone->
nodes[j];
1057 u32 save_node_runtime_index;
1064 nf->
flags = save_flags;
1067 old_nodes_clone = nm_clone->
nodes;
1068 nm_clone->
nodes = 0;
1080 new_n = nm->
nodes[j];
1081 old_n_clone = old_nodes_clone[j];
1083 clib_memcpy (new_n_clone, new_n,
sizeof (*new_n));
1087 if (j >= vec_len (old_nodes_clone))
1134 for (j = 0; j <
vec_len (old_rt); j++)
1161 for (j = 0; j <
vec_len (old_rt); j++)
1188 u32 *r = va_arg (*args,
u32 *);
1191 #define _(v,f,s) else if (unformat (input, s)) *r = SCHED_POLICY_##f; 1226 if (
unformat (input,
"use-pthreads"))
1234 else if (
unformat (input,
"coremask-%s %U", &name,
1235 unformat_bitmap_mask, &bitmap) ||
1236 unformat (input,
"corelist-%s %U", &name,
1237 unformat_bitmap_list, &bitmap))
1247 "corelist cannot be set for '%s' threads",
1260 else if (
unformat (input,
"%s %u", &name, &count))
1269 (0,
"number of %s threads not configurable", tr->
name);
1291 "scheduling priority (%d) is not allowed for `normal` scheduling policy",
1313 #if !defined (__x86_64__) && !defined (__i386__) && !defined (__aarch64__) && !defined (__powerpc64__) && !defined(__arm__) 1315 __sync_fetch_and_add_8 (
void)
1317 fformat (stderr,
"%s called\n", __FUNCTION__);
1322 __sync_add_and_fetch_8 (
void)
1324 fformat (stderr,
"%s called\n", __FUNCTION__);
1365 #ifndef BARRIER_MINIMUM_OPEN_LIMIT 1366 #define BARRIER_MINIMUM_OPEN_LIMIT 0.001 1369 #ifndef BARRIER_MINIMUM_OPEN_FACTOR 1370 #define BARRIER_MINIMUM_OPEN_FACTOR 3 1395 if (++vlib_worker_threads[0].recursion_level > 1)
1415 clib_warning (
"clock change: would have waited for %.4f seconds",
1431 fformat (stderr,
"%s: worker thread deadlock\n", __FUNCTION__);
1462 f64 t_update_main = 0.0;
1463 int refork_needed = 0;
1474 if (--vlib_worker_threads[0].recursion_level > 0)
1510 fformat (stderr,
"%s: worker thread deadlock\n", __FUNCTION__);
1526 fformat (stderr,
"%s: worker thread refork deadlock\n",
1603 for (elix = 0; elix < fqt->
nelts; elix++)
1606 if (1 || elt->
valid)
1642 while (n_left_to_node >= 4)
1650 n_left_to_node -= 4;
1653 while (n_left_to_node > 0)
1727 if (frame_queue_nelts == 0)
1730 ASSERT (frame_queue_nelts >= 8);
1788 (*fp) (callback, args, arg_size);
1791 clib_warning (
"BUG: rpc_call_main_thread_cb_fn NULL!");
_vlib_init_function_list_elt_t * worker_init_function_registrations
#define vec_validate(V, I)
Make sure vector is long enough for given index (no header, unspecified alignment) ...
static void barrier_trace_release_rec(f64 t_entry)
static void barrier_trace_sync(f64 t_entry, f64 t_open, f64 t_closed)
uword * pending_rpc_requests
vlib_main_t vlib_global_main
never_inline void vlib_node_runtime_sync_stats(vlib_main_t *vm, vlib_node_runtime_t *r, uword n_calls, uword n_vectors, uword n_clocks)
vlib_process_t ** processes
#define VLIB_PENDING_FRAME_NO_NEXT_FRAME
static void vlib_buffer_free(vlib_main_t *vm, u32 *buffers, u32 n_buffers)
Free buffers Frees the entire buffer chain for each buffer.
u8 runtime_data[0]
Function dependent node-runtime data.
int vlib_frame_queue_enqueue(vlib_main_t *vm, u32 node_runtime_index, u32 frame_queue_index, vlib_frame_t *frame, vlib_frame_queue_msg_type_t type)
#define VLIB_MAIN_LOOP_ENTER_FUNCTION(x)
word elog_track_register(elog_main_t *em, elog_track_t *t)
register an event track
void * mheap_alloc(void *memory, uword size)
static f64 vlib_time_now(vlib_main_t *vm)
#define vec_add2_aligned(V, P, N, A)
Add N elements to end of vector V, return pointer to new elements in P.
clib_error_t * threads_init(vlib_main_t *vm)
u32 vlib_frame_queue_main_init(u32 node_index, u32 frame_queue_nelts)
void * thread_function_arg
#define vec_add1(V, E)
Add 1 element to end of vector (unspecified alignment).
static int sort_registrations_by_no_clone(void *a0, void *a1)
static u64 clib_cpu_time_now(void)
frame_queue_trace_t * frame_queue_traces
void vlib_process_signal_event_mt_helper(vlib_process_signal_event_mt_args_t *args)
#define vec_add2(V, P, N)
Add N elements to end of vector V, return pointer to new elements in P.
void vnet_main_fixup(vlib_fork_fixup_t which)
static uword * clib_bitmap_set(uword *ai, uword i, uword value)
Sets the ith bit of a bitmap to new_value Removes trailing zeros from the bitmap. ...
#define hash_set_mem(h, key, value)
void vlib_worker_thread_fn(void *arg)
u32 unformat_sched_policy(unformat_input_t *input, va_list *args)
#define vec_validate_aligned(V, I, A)
Make sure vector is long enough for given index (no header, specified alignment)
struct vlib_thread_registration_ * next
u32 buffer_index[VLIB_FRAME_SIZE]
vlib_main_t ** vlib_mains
static void vlib_get_thread_core_socket(vlib_worker_thread_t *w, unsigned cpu_id)
#define clib_bitmap_dup(v)
Duplicate a bitmap.
#define vec_reset_length(v)
Reset vector length to zero NULL-pointer tolerant.
u16 thread_index
thread this node runs on
#define vlib_worker_thread_barrier_sync(X)
u64 * counters_last_clear
static void vlib_worker_thread_barrier_check(void)
vlib_thread_registration_t * next
#define vec_add1_aligned(V, E, A)
Add 1 element to end of vector (alignment specified).
#define VLIB_NODE_RUNTIME_DATA_SIZE
vlib_node_stats_t stats_last_clear
memset(h->entries, 0, sizeof(h->entries[0])*entries)
#define clib_smp_atomic_add(addr, increment)
#define pool_foreach(VAR, POOL, BODY)
Iterate through pool.
void vlib_worker_thread_node_runtime_update(void)
u64 count[FRAME_QUEUE_MAX_NELTS]
#define VLIB_INIT_FUNCTION(x)
#define VLIB_INVALID_NODE_INDEX
vlib_frame_queue_msg_type_t
vlib_frame_queue_elt_t ** handoff_queue_elt_by_thread_index
#define vec_elt_at_index(v, i)
Get vector value at index i checking that i is in bounds.
vlib_frame_t * vlib_get_frame_to_node(vlib_main_t *vm, u32 to_node_index)
#define clib_error_return(e, args...)
uword * lock
SMP lock, non-zero means locking required.
#define BARRIER_MINIMUM_OPEN_FACTOR
clib_error_t * vlib_call_init_exit_functions(vlib_main_t *vm, _vlib_init_function_list_elt_t *head, int call_once)
vlib_frame_queue_elt_t * elts
pthread_t thread[MAX_CONNS]
vlib_node_runtime_t * nodes_by_type[VLIB_N_NODE_TYPE]
void vlib_set_thread_name(char *name)
void vl_msg_api_handler_no_free(void *)
#define hash_create_string(elts, value_bytes)
#define BARRIER_SYNC_TIMEOUT
void * rpc_call_main_thread_cb_fn
VLIB_REGISTER_THREAD(worker_thread_reg, static)
vlib_worker_thread_t * vlib_worker_threads
#define clib_bitmap_foreach(i, ai, body)
Macro to iterate across set bits in a bitmap.
vlib_node_stats_t stats_total
u16 state
Input node state.
static void vlib_process_signal_event(vlib_main_t *vm, uword node_index, uword type_opaque, uword data)
static uword clib_bitmap_first_set(uword *ai)
Return the lowest numbered set bit in a bitmap.
u8 * vlib_thread_stack_init(uword thread_index)
static void vlib_next_frame_init(vlib_next_frame_t *nf)
vlib_error_main_t error_main
static u32 vlib_frame_index(vlib_main_t *vm, vlib_frame_t *f)
vlib_thread_callbacks_t cb
#define VLIB_FRAME_NO_FREE_AFTER_DISPATCH
int vlib_thread_cb_register(struct vlib_main_t *vm, vlib_thread_callbacks_t *cb)
const char * barrier_context
char * name
Track name vector.
#define clib_error_return_unix(e, args...)
void vlib_put_frame_to_node(vlib_main_t *vm, u32 to_node_index, vlib_frame_t *f)
static void * clib_mem_get_per_cpu_heap(void)
void vlib_frame_free(vlib_main_t *vm, vlib_node_runtime_t *r, vlib_frame_t *f)
static clib_error_t * vlib_launch_thread_int(void *fp, vlib_worker_thread_t *w, unsigned cpu_id)
void vlib_worker_thread_node_refork(void)
clib_error_t *(* vlib_thread_set_lcore_cb)(u32 thread, u16 cpu)
vlib_buffer_free_list_t * buffer_free_list_pool
u32 node_index
Node index.
u32 elog_global_id_for_msg_name(const char *msg_name)
uword * init_functions_called
void clib_time_init(clib_time_t *c)
vlib_thread_main_t vlib_thread_main
clib_error_t * clib_sysfs_read(char *file_name, char *fmt,...)
void(* thread_function)(void *)
static clib_error_t * cpu_config(vlib_main_t *vm, unformat_input_t *input)
#define pool_get_aligned(P, E, A)
Allocate an object E from a pool P (general version).
i32 n_vectors[FRAME_QUEUE_MAX_NELTS]
vlib_frame_queue_t * vlib_frame_queue_alloc(int nelts)
#define clib_mem_alloc_no_fail(size)
#define VLIB_EARLY_CONFIG_FUNCTION(x, n,...)
vlib_frame_queue_t ** vlib_frame_queues
DLMALLOC_EXPORT mspace create_mspace(size_t capacity, int locked)
static_always_inline uword vlib_get_thread_index(void)
vlib_pending_frame_t * pending_frames
vlib_thread_function_t * function
int vlib_frame_queue_dequeue(vlib_main_t *vm, vlib_frame_queue_main_t *fqm)
#define vec_free(V)
Free vector's memory (no header).
static void * clib_mem_set_heap(void *heap)
#define clib_warning(format, args...)
static vlib_node_runtime_t * vlib_node_get_runtime(vlib_main_t *vm, u32 node_index)
Get node runtime by node index.
#define clib_memcpy(a, b, c)
frame_queue_nelt_counter_t * frame_queue_histogram
#define VLIB_FRAME_PENDING
static uword clib_bitmap_get(uword *ai, uword i)
Gets the ith bit value from a bitmap.
#define ELOG_TYPE_DECLARE(f)
void vlib_worker_thread_init(vlib_worker_thread_t *w)
uword os_get_nthreads(void)
static void * clib_mem_get_heap(void)
volatile u32 * wait_at_barrier
#define FRAME_QUEUE_NELTS
vlib_frame_queue_per_thread_data_t * per_thread_data
void vlib_stat_segment_unlock(void)
vlib_frame_queue_t ** congested_handoff_queue_by_thread_index
#define hash_create(elts, value_bytes)
static void barrier_trace_sync_rec(f64 t_entry)
vlib_frame_queue_main_t * frame_queue_mains
static void clib_mem_free(void *p)
#define clib_error_report(e)
#define clib_bitmap_free(v)
Free a bitmap.
void vlib_worker_thread_barrier_sync_int(vlib_main_t *vm)
int need_vlib_worker_thread_node_runtime_update
uword * thread_registrations_by_name
#define BARRIER_MINIMUM_OPEN_LIMIT
clib_error_t *(* vlib_launch_thread_cb)(void *fp, vlib_worker_thread_t *w, unsigned cpu_id)
volatile u32 * node_reforks_required
static vlib_main_t * vlib_get_main(void)
void vlib_node_sync_stats(vlib_main_t *vm, vlib_node_t *n)
static uword clib_bitmap_count_set_bits(uword *ai)
Return the number of set bits in a bitmap.
static void barrier_trace_release(f64 t_entry, f64 t_closed_total, f64 t_update_main)
void vlib_worker_loop(vlib_main_t *vm)
#define vec_dup_aligned(V, A)
Return copy of vector (no header, alignment specified).
u32 elog_string(elog_main_t *em, char *fmt,...)
add a string to the event-log string table
f64 barrier_no_close_before
static clib_error_t * start_workers(vlib_main_t *vm)
#define vec_len(v)
Number of elements in vector (rvalue-only, NULL tolerant)
void vlib_rpc_call_main_thread(void *callback, u8 *args, u32 arg_size)
vlib_node_main_t node_main
vlib_next_frame_t * next_frames
#define vec_sort_with_function(vec, f)
Sort a vector using the supplied element comparison function.
int no_data_structure_clone
static void * vlib_frame_vector_args(vlib_frame_t *f)
Get pointer to frame vector data.
#define VLIB_THREAD_STACK_SIZE
vlib_frame_size_t * frame_sizes
#define hash_get_mem(h, key)
static void worker_thread_node_runtime_update_internal(void)
static void * clib_mem_alloc_aligned(uword size, uword align)
volatile u32 * workers_at_barrier
uword clib_calljmp(uword(*func)(uword func_arg), uword func_arg, void *stack)
static uword * clib_sysfs_list_to_bitmap(char *filename)
void vlib_worker_thread_barrier_release(vlib_main_t *vm)
static vlib_thread_main_t * vlib_get_thread_main()
static f64 vlib_time_now_ticks(vlib_main_t *vm, u64 n)
static vlib_node_t * vlib_get_node(vlib_main_t *vm, u32 i)
Get vlib node by index.
void vlib_stat_segment_lock(void)
#define vec_foreach(var, vec)
Vector iterator.
void * vlib_worker_thread_bootstrap_fn(void *arg)
#define CLIB_MEMORY_BARRIER()
uword * cpu_socket_bitmap
#define foreach_sched_policy
vlib_thread_registration_t ** registrations
#define vec_validate_init_empty(V, I, INIT)
Make sure vector is long enough for given index and initialize empty space (no header, unspecified alignment)
#define CLIB_CACHE_LINE_BYTES
vlib_thread_registration_t * registration
volatile u32 worker_thread_release
void vlib_worker_thread_fork_fixup(vlib_fork_fixup_t which)
clib_random_buffer_t random_buffer
#define VLIB_FRAME_FREE_AFTER_DISPATCH
clib_error_t * vlib_thread_init(vlib_main_t *vm)