/*
 * Copyright (c) 2015 Cisco and/or its affiliates.
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at:
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
/*
 * main.h: VLIB main data structure
 *
 * Copyright (c) 2008 Eliot Dresselhaus
 *
 * Permission is hereby granted, free of charge, to any person obtaining
 * a copy of this software and associated documentation files (the
 * "Software"), to deal in the Software without restriction, including
 * without limitation the rights to use, copy, modify, merge, publish,
 * distribute, sublicense, and/or sell copies of the Software, and to
 * permit persons to whom the Software is furnished to do so, subject to
 * the following conditions:
 *
 * The above copyright notice and this permission notice shall be
 * included in all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
 * LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
 * OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
 * WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
 */

#ifndef included_vlib_main_h
#define included_vlib_main_h

#include <vppinfra/elog.h>
#include <vppinfra/format.h>
#include <vppinfra/longjmp.h>
#include <vppinfra/pool.h>
#include <vppinfra/random_buffer.h>
#include <vppinfra/time.h>
#include <vppinfra/pmc.h>
#include <vppinfra/pcap.h>

#include <pthread.h>

/* Node/error event logging is turned off by default.
   Override by building with -DVLIB_ELOG_MAIN_LOOP; the definition below
   only applies when the macro has not already been defined. */
#ifndef VLIB_ELOG_MAIN_LOOP
#define VLIB_ELOG_MAIN_LOOP 0
#endif

Dave Barach5ecd5a52019-02-25 15:27:28 -050061typedef struct
62{
Dave Barach33909772019-09-23 10:27:27 -040063 /* Trace RX pkts */
64 u8 pcap_rx_enable;
65 /* Trace TX pkts */
66 u8 pcap_tx_enable;
67 /* Trace drop pkts */
68 u8 pcap_drop_enable;
69 u8 pad1;
70 u32 max_bytes_per_pkt;
Dave Barach5ecd5a52019-02-25 15:27:28 -050071 u32 pcap_sw_if_index;
72 pcap_main_t pcap_main;
Dave Barach9137e542019-09-13 17:47:50 -040073 u32 filter_classify_table_index;
Dave Barach5ecd5a52019-02-25 15:27:28 -050074} vnet_pcap_t;
75
Dave Barach87d24db2019-12-04 17:19:12 -050076typedef struct
77{
78 u8 trace_filter_enable;
79 u32 trace_classify_table_index;
80 u32 trace_filter_set_index;
81} vlib_trace_filter_t;
82
Dave Barach9b8ffd92016-07-08 08:13:45 -040083typedef struct vlib_main_t
84{
Damjan Marionbe3f4d52018-03-27 21:06:10 +020085 CLIB_CACHE_LINE_ALIGN_MARK (cacheline0);
Ed Warnickecb9cada2015-12-08 15:45:58 -070086 /* Instruction level timing state. */
87 clib_time_t clib_time;
Dave Baracha4324a92019-02-19 17:05:30 -050088 /* Offset from main thread time */
89 f64 time_offset;
90 f64 time_last_barrier_release;
Ed Warnickecb9cada2015-12-08 15:45:58 -070091
92 /* Time stamp of last node dispatch. */
93 u64 cpu_time_last_node_dispatch;
94
95 /* Time stamp when main loop was entered (time 0). */
96 u64 cpu_time_main_loop_start;
97
98 /* Incremented once for each main loop. */
99 u32 main_loop_count;
100
101 /* Count of vectors processed this main loop. */
102 u32 main_loop_vectors_processed;
103 u32 main_loop_nodes_processed;
104
Dave Baracha8df85c2019-10-01 13:34:23 -0400105 /* Internal node vectors, calls */
106 u64 internal_node_vectors;
107 u64 internal_node_calls;
108 u64 internal_node_vectors_last_clear;
109 u64 internal_node_calls_last_clear;
110
111 /* Instantaneous vector rate */
112 u32 internal_node_last_vectors_per_main_loop;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700113
Dave Barach4d1a8662018-09-10 12:31:15 -0400114 /* Main loop hw / sw performance counters */
Dave Barach5f2cfb22019-05-20 10:28:57 -0400115 void (**vlib_node_runtime_perf_counter_cbs) (struct vlib_main_t *,
116 u64 *, u64 *,
117 vlib_node_runtime_t *,
118 vlib_frame_t *, int);
119 void (**vlib_node_runtime_perf_counter_cb_tmp) (struct vlib_main_t *,
120 u64 *, u64 *,
121 vlib_node_runtime_t *,
122 vlib_frame_t *, int);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700123 /* Every so often we switch to the next counter. */
124#define VLIB_LOG2_MAIN_LOOPS_PER_STATS_UPDATE 7
125
126 /* Jump target to exit main loop with given code. */
127 u32 main_loop_exit_set;
Dave Barach903651c2017-10-13 19:16:56 -0400128 /* Set e.g. in the SIGTERM signal handler, checked in a safe place... */
129 volatile u32 main_loop_exit_now;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700130 clib_longjmp_t main_loop_exit;
131#define VLIB_MAIN_LOOP_EXIT_NONE 0
132#define VLIB_MAIN_LOOP_EXIT_PANIC 1
133 /* Exit via CLI. */
134#define VLIB_MAIN_LOOP_EXIT_CLI 2
135
136 /* Error marker to use when exiting main loop. */
Dave Barach9b8ffd92016-07-08 08:13:45 -0400137 clib_error_t *main_loop_error;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700138
139 /* Name for e.g. syslog. */
Dave Barach9b8ffd92016-07-08 08:13:45 -0400140 char *name;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700141
Dave Barach6a5adc32018-07-04 10:56:23 -0400142 /* Start of the heap. */
Dave Barach9b8ffd92016-07-08 08:13:45 -0400143 void *heap_base;
Dave Barach6a5adc32018-07-04 10:56:23 -0400144
145 /* Truncated version, to create frame indices */
146 void *heap_aligned_base;
147
148 /* Size of the heap */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700149 uword heap_size;
150
Damjan Mariond50e3472019-01-20 00:03:56 +0100151 /* buffer main structure. */
152 vlib_buffer_main_t *buffer_main;
153
Damjan Marion68b4da62018-09-30 18:26:20 +0200154 /* physical memory main structure. */
155 vlib_physmem_main_t physmem_main;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700156
157 /* Node graph main structure. */
158 vlib_node_main_t node_main;
159
160 /* Command line interface. */
161 vlib_cli_main_t cli_main;
162
163 /* Packet trace buffer. */
164 vlib_trace_main_t trace_main;
165
Dave Barach3ae28732018-11-16 17:19:00 -0500166 /* Pcap dispatch trace main */
167 pcap_main_t dispatch_pcap_main;
168 uword dispatch_pcap_enable;
Dave Barache5948fb2019-08-29 18:01:30 -0400169 u32 *dispatch_buffer_trace_nodes;
Dave Barach7fff3d22018-11-27 16:52:59 -0500170 u8 *pcap_buffer;
Dave Barach3ae28732018-11-16 17:19:00 -0500171
Dave Barach5ecd5a52019-02-25 15:27:28 -0500172 /* pcap rx / tx tracing */
Dave Barach33909772019-09-23 10:27:27 -0400173 vnet_pcap_t pcap;
Dave Barach5ecd5a52019-02-25 15:27:28 -0500174
Dave Barach87d24db2019-12-04 17:19:12 -0500175 /* Packet trace capture filter */
176 vlib_trace_filter_t trace_filter;
177
Ed Warnickecb9cada2015-12-08 15:45:58 -0700178 /* Error handling. */
179 vlib_error_main_t error_main;
180
181 /* Punt packets to underlying operating system for when fast switching
182 code does not know what to do. */
Dave Barach9b8ffd92016-07-08 08:13:45 -0400183 void (*os_punt_frame) (struct vlib_main_t * vm,
184 struct vlib_node_runtime_t * node,
185 vlib_frame_t * frame);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700186
Ed Warnickecb9cada2015-12-08 15:45:58 -0700187 /* Stream index to use for distribution when MC is enabled. */
188 u32 mc_stream_index;
189
Dave Barach9b8ffd92016-07-08 08:13:45 -0400190 vlib_one_time_waiting_process_t *procs_waiting_for_mc_stream_join;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700191
192 /* Event logger. */
193 elog_main_t elog_main;
194
Dave Barachc3a06552018-10-01 09:25:32 -0400195 /* Event logger trace flags */
196 int elog_trace_api_messages;
197 int elog_trace_cli_commands;
Dave Barach900cbad2019-01-31 19:12:51 -0500198 int elog_trace_graph_dispatch;
199 int elog_trace_graph_circuit;
200 u32 elog_trace_graph_circuit_node_index;
Dave Barachc3a06552018-10-01 09:25:32 -0400201
Ed Warnickecb9cada2015-12-08 15:45:58 -0700202 /* Node call and return event types. */
Dave Barach9b8ffd92016-07-08 08:13:45 -0400203 elog_event_type_t *node_call_elog_event_types;
204 elog_event_type_t *node_return_elog_event_types;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700205
Dave Barach9b8ffd92016-07-08 08:13:45 -0400206 elog_event_type_t *error_elog_event_types;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700207
208 /* Seed for random number generator. */
209 uword random_seed;
210
211 /* Buffer of random data for various uses. */
212 clib_random_buffer_t random_buffer;
213
214 /* Hash table to record which init functions have been called. */
Dave Barach9b8ffd92016-07-08 08:13:45 -0400215 uword *init_functions_called;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700216
Damjan Marion0a78fa12019-01-19 23:45:36 +0100217 /* thread, cpu and numa_node indices */
Damjan Marion586afd72017-04-05 19:18:20 +0200218 u32 thread_index;
Damjan Marionee721412019-01-27 17:54:11 +0100219 u32 cpu_id;
Damjan Marion0a78fa12019-01-19 23:45:36 +0100220 u32 numa_node;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700221
Ed Warnickecb9cada2015-12-08 15:45:58 -0700222 /* List of init functions to call, setup by constructors */
223 _vlib_init_function_list_elt_t *init_function_registrations;
Damjan Marione9f929b2017-03-16 11:32:09 +0100224 _vlib_init_function_list_elt_t *worker_init_function_registrations;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700225 _vlib_init_function_list_elt_t *main_loop_enter_function_registrations;
226 _vlib_init_function_list_elt_t *main_loop_exit_function_registrations;
227 _vlib_init_function_list_elt_t *api_init_function_registrations;
228 vlib_config_function_runtime_t *config_function_registrations;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700229
Dave Barachdae88b92016-04-19 09:38:35 -0400230 /* control-plane API queue signal pending, length indication */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700231 volatile u32 queue_signal_pending;
Dave Barachdae88b92016-04-19 09:38:35 -0400232 volatile u32 api_queue_nonempty;
Dave Barach9b8ffd92016-07-08 08:13:45 -0400233 void (*queue_signal_callback) (struct vlib_main_t *);
Dave Barachbfdedbd2016-01-20 09:11:55 -0500234 u8 **argv;
Damjan Marionce359db2017-03-16 16:15:38 +0100235
Dave Barach4d1a8662018-09-10 12:31:15 -0400236 /* Top of (worker) dispatch loop callback */
Dave Barach5f2cfb22019-05-20 10:28:57 -0400237 void (**volatile worker_thread_main_loop_callbacks) (struct vlib_main_t *);
238 void (**volatile worker_thread_main_loop_callback_tmp)
239 (struct vlib_main_t *);
240 clib_spinlock_t worker_thread_main_loop_callback_lock;
Dave Barach4d1a8662018-09-10 12:31:15 -0400241
Damjan Marionce359db2017-03-16 16:15:38 +0100242 /* debugging */
243 volatile int parked_at_barrier;
Dave Barach81481312017-05-16 09:08:14 -0400244
245 /* Attempt to do a post-mortem elog dump */
246 int elog_post_mortem_dump;
247
Colin Tregenza Dancer21596182017-09-04 15:27:49 +0100248 /*
249 * Need to call vlib_worker_thread_node_runtime_update before
250 * releasing worker thread barrier. Only valid in vlib_global_main.
251 */
252 int need_vlib_worker_thread_node_runtime_update;
253
Dave Barach000a0292020-02-17 17:07:12 -0500254 /* Dispatch loop time accounting */
255 u64 loops_this_reporting_interval;
256 f64 loop_interval_end;
257 f64 loop_interval_start;
258 f64 loops_per_second;
259 f64 seconds_per_loop;
260 f64 damping_constant;
261
Colin Tregenza Dancereb1ac172017-09-06 20:23:24 +0100262 /*
263 * Barrier epoch - Set to current time, each time barrier_sync or
264 * barrier_release is called with zero recursion.
265 */
266 f64 barrier_epoch;
267
268 /* Earliest barrier can be closed again */
269 f64 barrier_no_close_before;
270
Dave Barach80965f52019-03-11 09:57:38 -0400271 /* Need to check the frame queues */
272 volatile uword check_frame_queues;
273
Dave Barachf6c68d72018-11-01 08:12:52 -0400274 /* RPC requests, main thread only */
Dave Barach2877eee2017-12-15 12:22:57 -0500275 uword *pending_rpc_requests;
Dave Barachf6c68d72018-11-01 08:12:52 -0400276 uword *processing_rpc_requests;
277 clib_spinlock_t pending_rpc_lock;
Dave Barach2877eee2017-12-15 12:22:57 -0500278
Ed Warnickecb9cada2015-12-08 15:45:58 -0700279} vlib_main_t;
280
281/* Global main structure. */
Damjan Marion6a7acc22016-12-19 16:28:36 +0100282extern vlib_main_t vlib_global_main;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700283
Damjan Marione9d52d52017-03-09 15:42:26 +0100284void vlib_worker_loop (vlib_main_t * vm);
285
Ed Warnickecb9cada2015-12-08 15:45:58 -0700286always_inline f64
287vlib_time_now (vlib_main_t * vm)
Dave Barach9b8ffd92016-07-08 08:13:45 -0400288{
Dave Baracha4324a92019-02-19 17:05:30 -0500289 return clib_time_now (&vm->clib_time) + vm->time_offset;
Dave Barach9b8ffd92016-07-08 08:13:45 -0400290}
Ed Warnickecb9cada2015-12-08 15:45:58 -0700291
292always_inline f64
293vlib_time_now_ticks (vlib_main_t * vm, u64 n)
Dave Barach9b8ffd92016-07-08 08:13:45 -0400294{
295 return clib_time_now_internal (&vm->clib_time, n);
296}
Ed Warnickecb9cada2015-12-08 15:45:58 -0700297
298/* Busy wait for specified time. */
299always_inline void
300vlib_time_wait (vlib_main_t * vm, f64 wait)
301{
302 f64 t = vlib_time_now (vm);
303 f64 limit = t + wait;
304 while (t < limit)
305 t = vlib_time_now (vm);
306}
307
/* Time a piece of code.
   Reads vlib_time_now (vm) before and after running 'body' once, then
   reports the difference through clib_warning() using "%.7e".
   'vm' is evaluated twice. */
#define vlib_time_code(vm,body)                         \
do {                                                    \
    f64 _t[2];                                          \
    _t[0] = vlib_time_now (vm);                         \
    do { body; } while (0);                             \
    _t[1] = vlib_time_now (vm);                         \
    clib_warning ("%.7e", _t[1] - _t[0]);               \
} while (0)

/* Poll 'test' until it is non-zero or the accumulated suspend time
   reaches 'timeout_time'.  After each failed test the calling process is
   suspended via vlib_process_suspend (vm, suspend_time).

   Evaluates to the last value of 'test': non-zero on success, 0 on
   timeout.  Elapsed time is accounted as the sum of the requested
   suspend intervals, not measured from a clock.  'test', 'suspend_time'
   and 'timeout_time' are evaluated on every iteration.  Uses a GNU
   statement expression. */
#define vlib_wait_with_timeout(vm,suspend_time,timeout_time,test)       \
({                                                                      \
    uword __vlib_wait_with_timeout = 0;                                 \
    f64 __vlib_wait_time = 0;                                           \
    while (! (__vlib_wait_with_timeout = (test))                        \
           && __vlib_wait_time < (timeout_time))                        \
      {                                                                 \
        vlib_process_suspend ((vm), (suspend_time));                    \
        __vlib_wait_time += (suspend_time);                             \
      }                                                                 \
    __vlib_wait_with_timeout;                                           \
})

331always_inline void
332vlib_panic_with_error (vlib_main_t * vm, clib_error_t * error)
333{
334 vm->main_loop_error = error;
335 clib_longjmp (&vm->main_loop_exit, VLIB_MAIN_LOOP_EXIT_PANIC);
336}
337
/* Panic with an error built from the given arguments: they are forwarded
   to clib_error_return (0, ...) and the result is passed to
   vlib_panic_with_error().  Uses a GNU named variadic parameter. */
#define vlib_panic_with_msg(vm,args...) \
  vlib_panic_with_error (vm, clib_error_return (0, args))

341always_inline void
342vlib_panic (vlib_main_t * vm)
Dave Barach9b8ffd92016-07-08 08:13:45 -0400343{
344 vlib_panic_with_error (vm, 0);
345}
Ed Warnickecb9cada2015-12-08 15:45:58 -0700346
Ed Warnickecb9cada2015-12-08 15:45:58 -0700347
Ed Warnickecb9cada2015-12-08 15:45:58 -0700348always_inline f64
Dave Baracha8df85c2019-10-01 13:34:23 -0400349vlib_internal_node_vector_rate (vlib_main_t * vm)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700350{
Dave Baracha8df85c2019-10-01 13:34:23 -0400351 u64 vectors;
352 u64 calls;
353
354 calls = vm->internal_node_calls - vm->internal_node_calls_last_clear;
355
356 if (PREDICT_FALSE (calls == 0))
357 return 0.0;
358
359 vectors = vm->internal_node_vectors - vm->internal_node_vectors_last_clear;
360
361 return (f64) vectors / (f64) calls;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700362}
363
Dave Baracha8df85c2019-10-01 13:34:23 -0400364always_inline void
365vlib_clear_internal_node_vector_rate (vlib_main_t * vm)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700366{
Dave Baracha8df85c2019-10-01 13:34:23 -0400367 vm->internal_node_calls_last_clear = vm->internal_node_calls;
368 vm->internal_node_vectors_last_clear = vm->internal_node_vectors;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700369}
370
Ed Warnickecb9cada2015-12-08 15:45:58 -0700371always_inline void
372vlib_increment_main_loop_counter (vlib_main_t * vm)
373{
Dave Baracha8df85c2019-10-01 13:34:23 -0400374 vm->main_loop_count++;
375 vm->internal_node_last_vectors_per_main_loop = 0;
Dave Barach903651c2017-10-13 19:16:56 -0400376
377 if (PREDICT_FALSE (vm->main_loop_exit_now))
378 clib_longjmp (&vm->main_loop_exit, VLIB_MAIN_LOOP_EXIT_CLI);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700379}
380
Dave Baracha8df85c2019-10-01 13:34:23 -0400381always_inline u32
382vlib_last_vectors_per_main_loop (vlib_main_t * vm)
383{
384 return vm->internal_node_last_vectors_per_main_loop;
385}
386
Dave Barach9b8ffd92016-07-08 08:13:45 -0400387always_inline void vlib_set_queue_signal_callback
388 (vlib_main_t * vm, void (*fp) (vlib_main_t *))
Ed Warnickecb9cada2015-12-08 15:45:58 -0700389{
390 vm->queue_signal_callback = fp;
391}
392
393/* Main routine. */
394int vlib_main (vlib_main_t * vm, unformat_input_t * input);
395
Damjan Marionf55f9b82017-05-10 21:06:28 +0200396/* Thread stacks, for os_get_thread_index */
Damjan Marion6a7acc22016-12-19 16:28:36 +0100397extern u8 **vlib_thread_stacks;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700398
399/* Number of thread stacks that the application needs */
400u32 vlib_app_num_thread_stacks_needed (void) __attribute__ ((weak));
401
Dave Barach6931f592016-05-13 12:55:01 -0400402extern void vlib_node_sync_stats (vlib_main_t * vm, vlib_node_t * n);
403
/* Version numbers for the vlib pcap format */
#define VLIB_PCAP_MAJOR_VERSION 1
#define VLIB_PCAP_MINOR_VERSION 0

Dave Barache5948fb2019-08-29 18:01:30 -0400407typedef struct
408{
409 u8 *filename;
410 int enable;
411 int status;
412 u32 packets_to_capture;
413 u32 buffer_trace_node_index;
414 u32 buffer_traces_to_capture;
415} vlib_pcap_dispatch_trace_args_t;
416
417int vlib_pcap_dispatch_trace_configure (vlib_pcap_dispatch_trace_args_t *);
418
#endif /* included_vlib_main_h */

/*
 * fd.io coding-style-patch-verification: ON
 *
 * Local Variables:
 * eval: (c-set-style "gnu")
 * End:
 */