blob: 34ab5be8650dc8ed1830e10be940f0616279b721 [file] [log] [blame]
/*
 * Copyright (c) 2015 Cisco and/or its affiliates.
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at:
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
15#ifndef included_vlib_threads_h
16#define included_vlib_threads_h
17
18#include <vlib/main.h>
Pavel Kotucek1e765832016-09-23 08:54:14 +020019#include <linux/sched.h>
Ed Warnickecb9cada2015-12-08 15:45:58 -070020
Damjan Marion6a7acc22016-12-19 16:28:36 +010021extern vlib_main_t **vlib_mains;
Ed Warnickecb9cada2015-12-08 15:45:58 -070022
Dave Barach9b8ffd92016-07-08 08:13:45 -040023void vlib_set_thread_name (char *name);
Ed Warnickecb9cada2015-12-08 15:45:58 -070024
25/* arg is actually a vlib__thread_t * */
Dave Barach9b8ffd92016-07-08 08:13:45 -040026typedef void (vlib_thread_function_t) (void *arg);
Ed Warnickecb9cada2015-12-08 15:45:58 -070027
Dave Barach9b8ffd92016-07-08 08:13:45 -040028typedef struct vlib_thread_registration_
29{
Ed Warnickecb9cada2015-12-08 15:45:58 -070030 /* constructor generated list of thread registrations */
Dave Barach9b8ffd92016-07-08 08:13:45 -040031 struct vlib_thread_registration_ *next;
Ed Warnickecb9cada2015-12-08 15:45:58 -070032
33 /* config parameters */
Dave Barach9b8ffd92016-07-08 08:13:45 -040034 char *name;
35 char *short_name;
36 vlib_thread_function_t *function;
Ed Warnickecb9cada2015-12-08 15:45:58 -070037 uword mheap_size;
38 int fixed_count;
39 u32 count;
40 int no_data_structure_clone;
Bud Grise68adab92016-02-12 10:36:11 -050041 u32 frame_queue_nelts;
42
Ed Warnickecb9cada2015-12-08 15:45:58 -070043 /* All threads of this type run on pthreads */
44 int use_pthreads;
45 u32 first_index;
Dave Barach9b8ffd92016-07-08 08:13:45 -040046 uword *coremask;
Ed Warnickecb9cada2015-12-08 15:45:58 -070047} vlib_thread_registration_t;
48
Damjan Marion3f46baf2016-02-06 19:16:21 +010049/*
50 * Frames have their cpu / vlib_main_t index in the low-order N bits
51 * Make VLIB_MAX_CPUS a power-of-two, please...
Ed Warnickecb9cada2015-12-08 15:45:58 -070052 */
Damjan Marion3f46baf2016-02-06 19:16:21 +010053
Christophe Fontainefef15b42016-04-09 12:38:49 +090054#ifndef VLIB_MAX_CPUS
Damjan Marion3f46baf2016-02-06 19:16:21 +010055#define VLIB_MAX_CPUS 256
Christophe Fontainefef15b42016-04-09 12:38:49 +090056#endif
Ed Warnickecb9cada2015-12-08 15:45:58 -070057
Damjan Marionce8debf2016-02-06 19:16:21 +010058#if VLIB_MAX_CPUS > CLIB_MAX_MHEAPS
59#error Please increase number of per-cpu mheaps
60#endif
61
Dave Barach9b8ffd92016-07-08 08:13:45 -040062#define VLIB_CPU_MASK (VLIB_MAX_CPUS - 1) /* 0x3f, max */
Ed Warnickecb9cada2015-12-08 15:45:58 -070063#define VLIB_OFFSET_MASK (~VLIB_CPU_MASK)
64
65#define VLIB_LOG2_THREAD_STACK_SIZE (20)
66#define VLIB_THREAD_STACK_SIZE (1<<VLIB_LOG2_THREAD_STACK_SIZE)
67
/*
 * Message types stored in vlib_frame_queue_elt_t.msg_type.
 * Only one type is defined here.
 */
typedef enum
{
  VLIB_FRAME_QUEUE_ELT_DISPATCH_FRAME,
} vlib_frame_queue_msg_type_t;
72
Dave Barach9b8ffd92016-07-08 08:13:45 -040073typedef struct
74{
Damjan Marionb0d680b2016-11-04 14:41:44 +010075 CLIB_CACHE_LINE_ALIGN_MARK (cacheline0);
Ed Warnickecb9cada2015-12-08 15:45:58 -070076 volatile u32 valid;
Dave Barach9b8ffd92016-07-08 08:13:45 -040077 u32 msg_type;
Ed Warnickecb9cada2015-12-08 15:45:58 -070078 u32 n_vectors;
79 u32 last_n_vectors;
80
81 /* 256 * 4 = 1024 bytes, even mult of cache line size */
82 u32 buffer_index[VLIB_FRAME_SIZE];
Dave Barach9b8ffd92016-07-08 08:13:45 -040083}
84vlib_frame_queue_elt_t;
Ed Warnickecb9cada2015-12-08 15:45:58 -070085
Dave Barach9b8ffd92016-07-08 08:13:45 -040086typedef struct
87{
Ed Warnickecb9cada2015-12-08 15:45:58 -070088 /* First cache line */
Damjan Marionb0d680b2016-11-04 14:41:44 +010089 CLIB_CACHE_LINE_ALIGN_MARK (cacheline0);
Ed Warnickecb9cada2015-12-08 15:45:58 -070090 volatile u32 *wait_at_barrier;
91 volatile u32 *workers_at_barrier;
Ed Warnickecb9cada2015-12-08 15:45:58 -070092
93 /* Second Cache Line */
Damjan Marionb0d680b2016-11-04 14:41:44 +010094 CLIB_CACHE_LINE_ALIGN_MARK (cacheline1);
Ed Warnickecb9cada2015-12-08 15:45:58 -070095 void *thread_mheap;
Dave Barach9b8ffd92016-07-08 08:13:45 -040096 u8 *thread_stack;
97 void (*thread_function) (void *);
98 void *thread_function_arg;
99 i64 recursion_level;
100 elog_track_t elog_track;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700101 u32 instance_id;
102 vlib_thread_registration_t *registration;
103 u8 *name;
Bud Grise42f20062016-03-16 13:09:46 -0400104 u64 barrier_sync_count;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700105
106 long lwp;
Pavel Kotucek98765202016-10-07 08:37:28 +0200107 int lcore_id;
108 pthread_t thread_id;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700109} vlib_worker_thread_t;
110
Damjan Marion6a7acc22016-12-19 16:28:36 +0100111extern vlib_worker_thread_t *vlib_worker_threads;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700112
Dave Barach9b8ffd92016-07-08 08:13:45 -0400113typedef struct
114{
Ed Warnickecb9cada2015-12-08 15:45:58 -0700115 /* enqueue side */
Damjan Marionb0d680b2016-11-04 14:41:44 +0100116 CLIB_CACHE_LINE_ALIGN_MARK (cacheline0);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700117 volatile u64 tail;
118 u64 enqueues;
119 u64 enqueue_ticks;
120 u64 enqueue_vectors;
121 u32 enqueue_full_events;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700122
123 /* dequeue side */
Damjan Marionb0d680b2016-11-04 14:41:44 +0100124 CLIB_CACHE_LINE_ALIGN_MARK (cacheline1);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700125 volatile u64 head;
126 u64 dequeues;
127 u64 dequeue_ticks;
128 u64 dequeue_vectors;
129 u64 trace;
130 u64 vector_threshold;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700131
132 /* dequeue hint to enqueue side */
Damjan Marionb0d680b2016-11-04 14:41:44 +0100133 CLIB_CACHE_LINE_ALIGN_MARK (cacheline2);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700134 volatile u64 head_hint;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700135
136 /* read-only, constant, shared */
Damjan Marionb0d680b2016-11-04 14:41:44 +0100137 CLIB_CACHE_LINE_ALIGN_MARK (cacheline3);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700138 vlib_frame_queue_elt_t *elts;
139 u32 nelts;
Dave Barach9b8ffd92016-07-08 08:13:45 -0400140}
141vlib_frame_queue_t;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700142
Damjan Marionaaef1eb2016-11-08 17:37:01 +0100143typedef struct
144{
145 u32 node_index;
146 vlib_frame_queue_t **vlib_frame_queues;
147
148 /* for frame queue tracing */
149 frame_queue_trace_t *frame_queue_traces;
150 frame_queue_nelt_counter_t *frame_queue_histogram;
151} vlib_frame_queue_main_t;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700152
153/* Called early, in thread 0's context */
Dave Barach9b8ffd92016-07-08 08:13:45 -0400154clib_error_t *vlib_thread_init (vlib_main_t * vm);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700155
Dave Barach9b8ffd92016-07-08 08:13:45 -0400156vlib_worker_thread_t *vlib_alloc_thread (vlib_main_t * vm);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700157
Dave Barach9b8ffd92016-07-08 08:13:45 -0400158int vlib_frame_queue_enqueue (vlib_main_t * vm, u32 node_runtime_index,
159 u32 frame_queue_index, vlib_frame_t * frame,
160 vlib_frame_queue_msg_type_t type);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700161
Dave Barach9b8ffd92016-07-08 08:13:45 -0400162int vlib_frame_queue_dequeue (int thread_id,
163 vlib_main_t * vm, vlib_node_main_t * nm);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700164
165u64 dispatch_node (vlib_main_t * vm,
Dave Barach9b8ffd92016-07-08 08:13:45 -0400166 vlib_node_runtime_t * node,
167 vlib_node_type_t type,
168 vlib_node_state_t dispatch_state,
169 vlib_frame_t * frame, u64 last_time_stamp);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700170
171u64 dispatch_pending_node (vlib_main_t * vm,
Dave Barach9b8ffd92016-07-08 08:13:45 -0400172 vlib_pending_frame_t * p, u64 last_time_stamp);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700173
Dave Barach9b8ffd92016-07-08 08:13:45 -0400174void vlib_worker_thread_node_runtime_update (void);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700175
Dave Barach9b8ffd92016-07-08 08:13:45 -0400176void vlib_create_worker_threads (vlib_main_t * vm, int n,
177 void (*thread_function) (void *));
Ed Warnickecb9cada2015-12-08 15:45:58 -0700178
179void vlib_worker_thread_init (vlib_worker_thread_t * w);
Damjan Marionaaef1eb2016-11-08 17:37:01 +0100180u32 vlib_frame_queue_main_init (u32 node_index, u32 frame_queue_nelts);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700181
182/* Check for a barrier sync request every 30ms */
183#define BARRIER_SYNC_DELAY (0.030000)
184
185#if CLIB_DEBUG > 0
186/* long barrier timeout, for gdb... */
187#define BARRIER_SYNC_TIMEOUT (600.1)
188#else
189#define BARRIER_SYNC_TIMEOUT (1.0)
190#endif
191
Dave Barach9b8ffd92016-07-08 08:13:45 -0400192void vlib_worker_thread_barrier_sync (vlib_main_t * vm);
193void vlib_worker_thread_barrier_release (vlib_main_t * vm);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700194
Dave Barach9b8ffd92016-07-08 08:13:45 -0400195always_inline void
196vlib_smp_unsafe_warning (void)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700197{
198 if (CLIB_DEBUG > 0)
199 {
Dave Barach9b8ffd92016-07-08 08:13:45 -0400200 if (os_get_cpu_number ())
201 fformat (stderr, "%s: SMP unsafe warning...\n", __FUNCTION__);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700202 }
203}
204
/*
 * Selector passed to vlib_worker_thread_fork_fixup ().
 * Value 0 is reserved as "illegal".
 */
typedef enum
{
  VLIB_WORKER_THREAD_FORK_FIXUP_ILLEGAL = 0,
  VLIB_WORKER_THREAD_FORK_FIXUP_NEW_SW_IF_INDEX,
} vlib_fork_fixup_t;

void vlib_worker_thread_fork_fixup (vlib_fork_fixup_t which);
212
Dave Barach9b8ffd92016-07-08 08:13:45 -0400213static inline void
214vlib_worker_thread_barrier_check (void)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700215{
Dave Barach9b8ffd92016-07-08 08:13:45 -0400216 if (PREDICT_FALSE (*vlib_worker_threads->wait_at_barrier))
Ed Warnickecb9cada2015-12-08 15:45:58 -0700217 {
Dave Barach9b8ffd92016-07-08 08:13:45 -0400218 clib_smp_atomic_add (vlib_worker_threads->workers_at_barrier, 1);
219 while (*vlib_worker_threads->wait_at_barrier)
220 ;
221 clib_smp_atomic_add (vlib_worker_threads->workers_at_barrier, -1);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700222 }
223}
224
/*
 * Evaluate (body) once per vlib_main_t, with "this_vlib_main" set to
 * the current one.  A temporary vector is built first: it holds
 * &vlib_global_main when vlib_mains is empty, otherwise every non-NULL
 * entry of vlib_mains.  The temporary vector is freed afterwards.
 *
 * body is wrapped in parentheses, so it must be an expression.
 * The expansion already ends in ';' (kept for existing callers), so
 * the macro is not safe as the unbraced body of an if / else.
 */
#define foreach_vlib_main(body)                         \
do {                                                    \
  vlib_main_t ** __vlib_mains = 0, *this_vlib_main;     \
  int ii;                                               \
                                                        \
  if (vec_len (vlib_mains) == 0)                        \
    vec_add1 (__vlib_mains, &vlib_global_main);         \
  else                                                  \
    {                                                   \
      for (ii = 0; ii < vec_len (vlib_mains); ii++)     \
        {                                               \
          this_vlib_main = vlib_mains[ii];              \
          if (this_vlib_main)                           \
            vec_add1 (__vlib_mains, this_vlib_main);    \
        }                                               \
    }                                                   \
                                                        \
  for (ii = 0; ii < vec_len (__vlib_mains); ii++)       \
    {                                                   \
      this_vlib_main = __vlib_mains[ii];                \
      /* body uses this_vlib_main... */                 \
      (body);                                           \
    }                                                   \
  vec_free (__vlib_mains);                              \
} while (0);
250
Pavel Kotucek1e765832016-09-23 08:54:14 +0200251#define foreach_sched_policy \
252 _(SCHED_OTHER, OTHER, "other") \
253 _(SCHED_BATCH, BATCH, "batch") \
254 _(SCHED_IDLE, IDLE, "idle") \
255 _(SCHED_FIFO, FIFO, "fifo") \
256 _(SCHED_RR, RR, "rr")
257
258typedef enum
259{
260#define _(v,f,s) SCHED_POLICY_##f = v,
261 foreach_sched_policy
262#undef _
263 SCHED_POLICY_N,
264} sched_policy_t;
265
Dave Barach9b8ffd92016-07-08 08:13:45 -0400266typedef struct
267{
Ed Warnickecb9cada2015-12-08 15:45:58 -0700268 /* Link list of registrations, built by constructors */
Dave Barach9b8ffd92016-07-08 08:13:45 -0400269 vlib_thread_registration_t *next;
270
Ed Warnickecb9cada2015-12-08 15:45:58 -0700271 /* Vector of registrations, w/ non-data-structure clones at the top */
Dave Barach9b8ffd92016-07-08 08:13:45 -0400272 vlib_thread_registration_t **registrations;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700273
Dave Barach9b8ffd92016-07-08 08:13:45 -0400274 uword *thread_registrations_by_name;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700275
Dave Barach9b8ffd92016-07-08 08:13:45 -0400276 vlib_worker_thread_t *worker_threads;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700277
Dave Barach9b8ffd92016-07-08 08:13:45 -0400278 /*
279 * Launch all threads as pthreads,
280 * not eal_rte_launch (strict affinity) threads
Ed Warnickecb9cada2015-12-08 15:45:58 -0700281 */
282 int use_pthreads;
283
284 /* Number of vlib_main / vnet_main clones */
285 u32 n_vlib_mains;
286
287 /* Number of thread stacks to create */
288 u32 n_thread_stacks;
289
290 /* Number of pthreads */
291 u32 n_pthreads;
292
293 /* Number of DPDK eal threads */
294 u32 n_eal_threads;
295
296 /* Number of cores to skip, must match the core mask */
297 u32 skip_cores;
298
299 /* Thread prefix name */
300 u8 *thread_prefix;
301
302 /* main thread lcore */
303 u8 main_lcore;
304
305 /* Bitmap of available CPU cores */
Dave Barach9b8ffd92016-07-08 08:13:45 -0400306 uword *cpu_core_bitmap;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700307
308 /* Bitmap of available CPU sockets (NUMA nodes) */
Dave Barach9b8ffd92016-07-08 08:13:45 -0400309 uword *cpu_socket_bitmap;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700310
Damjan Marionaaef1eb2016-11-08 17:37:01 +0100311 /* Worker handoff queues */
312 vlib_frame_queue_main_t *frame_queue_mains;
Damjan Marion0f8ecf02016-06-27 08:30:30 +0200313
314 /* worker thread initialization barrier */
315 volatile u32 worker_thread_release;
316
Pavel Kotucek1e765832016-09-23 08:54:14 +0200317 /* scheduling policy */
318 u32 sched_policy;
319
320 /* scheduling policy priority */
321 u32 sched_priority;
322
Ed Warnickecb9cada2015-12-08 15:45:58 -0700323} vlib_thread_main_t;
324
Damjan Marion6a7acc22016-12-19 16:28:36 +0100325extern vlib_thread_main_t vlib_thread_main;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700326
/*
 * Declare a thread registration named x.  Any extra arguments are
 * placed in front of the declaration (e.g. storage-class specifiers).
 * The generated constructor pushes x onto the head of
 * vlib_thread_main.next.  The expansion ends with an unterminated
 * declaration of x, so the user supplies "= { ... };" after the macro.
 */
#define VLIB_REGISTER_THREAD(x,...)                     \
  __VA_ARGS__ vlib_thread_registration_t x;             \
static void __vlib_add_thread_registration_##x (void)   \
  __attribute__((__constructor__)) ;                    \
static void __vlib_add_thread_registration_##x (void)   \
{                                                       \
  vlib_thread_main_t * tm = &vlib_thread_main;          \
  x.next = tm->next;                                    \
  tm->next = &x;                                        \
}                                                       \
__VA_ARGS__ vlib_thread_registration_t x
Ed Warnickecb9cada2015-12-08 15:45:58 -0700338
Damjan Marion64034362016-11-07 22:19:55 +0100339always_inline u32
340vlib_num_workers ()
341{
342 return vlib_thread_main.n_vlib_mains - 1;
343}
344
345always_inline u32
346vlib_get_worker_cpu_index (u32 worker_index)
347{
348 return worker_index + 1;
349}
350
Damjan Marion3a4ed392016-11-08 13:20:42 +0100351always_inline u32
352vlib_get_worker_index (u32 cpu_index)
353{
354 return cpu_index - 1;
355}
356
357always_inline u32
358vlib_get_current_worker_index ()
359{
360 return os_get_cpu_number () - 1;
361}
362
Damjan Marion64034362016-11-07 22:19:55 +0100363always_inline vlib_main_t *
364vlib_get_worker_vlib_main (u32 worker_index)
365{
366 vlib_main_t *vm;
367 vlib_thread_main_t *tm = &vlib_thread_main;
368 ASSERT (worker_index < tm->n_vlib_mains - 1);
369 vm = vlib_mains[worker_index + 1];
370 ASSERT (vm);
371 return vm;
372}
373
Damjan Marionaaef1eb2016-11-08 17:37:01 +0100374static inline void
375vlib_put_frame_queue_elt (vlib_frame_queue_elt_t * hf)
376{
377 CLIB_MEMORY_BARRIER ();
378 hf->valid = 1;
379}
380
381static inline vlib_frame_queue_elt_t *
382vlib_get_frame_queue_elt (u32 frame_queue_index, u32 index)
383{
384 vlib_frame_queue_t *fq;
385 vlib_frame_queue_elt_t *elt;
386 vlib_thread_main_t *tm = &vlib_thread_main;
387 vlib_frame_queue_main_t *fqm =
388 vec_elt_at_index (tm->frame_queue_mains, frame_queue_index);
389 u64 new_tail;
390
391 fq = fqm->vlib_frame_queues[index];
392 ASSERT (fq);
393
394 new_tail = __sync_add_and_fetch (&fq->tail, 1);
395
396 /* Wait until a ring slot is available */
397 while (new_tail >= fq->head_hint + fq->nelts)
398 vlib_worker_thread_barrier_check ();
399
400 elt = fq->elts + (new_tail & (fq->nelts - 1));
401
402 /* this would be very bad... */
403 while (elt->valid)
404 ;
405
406 elt->msg_type = VLIB_FRAME_QUEUE_ELT_DISPATCH_FRAME;
407 elt->last_n_vectors = elt->n_vectors = 0;
408
409 return elt;
410}
411
412static inline vlib_frame_queue_t *
413is_vlib_frame_queue_congested (u32 frame_queue_index,
414 u32 index,
415 u32 queue_hi_thresh,
416 vlib_frame_queue_t **
417 handoff_queue_by_worker_index)
418{
419 vlib_frame_queue_t *fq;
420 vlib_thread_main_t *tm = &vlib_thread_main;
421 vlib_frame_queue_main_t *fqm =
422 vec_elt_at_index (tm->frame_queue_mains, frame_queue_index);
423
424 fq = handoff_queue_by_worker_index[index];
425 if (fq != (vlib_frame_queue_t *) (~0))
426 return fq;
427
428 fq = fqm->vlib_frame_queues[index];
429 ASSERT (fq);
430
431 if (PREDICT_FALSE (fq->tail >= (fq->head_hint + queue_hi_thresh)))
432 {
433 /* a valid entry in the array will indicate the queue has reached
434 * the specified threshold and is congested
435 */
436 handoff_queue_by_worker_index[index] = fq;
437 fq->enqueue_full_events++;
438 return fq;
439 }
440
441 return NULL;
442}
443
444static inline vlib_frame_queue_elt_t *
445vlib_get_worker_handoff_queue_elt (u32 frame_queue_index,
446 u32 vlib_worker_index,
447 vlib_frame_queue_elt_t **
448 handoff_queue_elt_by_worker_index)
449{
450 vlib_frame_queue_elt_t *elt;
451
452 if (handoff_queue_elt_by_worker_index[vlib_worker_index])
453 return handoff_queue_elt_by_worker_index[vlib_worker_index];
454
455 elt = vlib_get_frame_queue_elt (frame_queue_index, vlib_worker_index);
456
457 handoff_queue_elt_by_worker_index[vlib_worker_index] = elt;
458
459 return elt;
460}
461
Ed Warnickecb9cada2015-12-08 15:45:58 -0700462#endif /* included_vlib_threads_h */
Dave Barach9b8ffd92016-07-08 08:13:45 -0400463
/*
 * fd.io coding-style-patch-verification: ON
 *
 * Local Variables:
 * eval: (c-set-style "gnu")
 * End:
 */