blob: fd9937fe3e64636e1e2c608671ac5385d9a3915e [file] [log] [blame]
Ed Warnickecb9cada2015-12-08 15:45:58 -07001/*
2 * Copyright (c) 2015 Cisco and/or its affiliates.
3 * Licensed under the Apache License, Version 2.0 (the "License");
4 * you may not use this file except in compliance with the License.
5 * You may obtain a copy of the License at:
6 *
7 * http://www.apache.org/licenses/LICENSE-2.0
8 *
9 * Unless required by applicable law or agreed to in writing, software
10 * distributed under the License is distributed on an "AS IS" BASIS,
11 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 * See the License for the specific language governing permissions and
13 * limitations under the License.
14 */
15/*
16 * main.c: main vector processing loop
17 *
18 * Copyright (c) 2008 Eliot Dresselhaus
19 *
20 * Permission is hereby granted, free of charge, to any person obtaining
21 * a copy of this software and associated documentation files (the
22 * "Software"), to deal in the Software without restriction, including
23 * without limitation the rights to use, copy, modify, merge, publish,
24 * distribute, sublicense, and/or sell copies of the Software, and to
25 * permit persons to whom the Software is furnished to do so, subject to
26 * the following conditions:
27 *
28 * The above copyright notice and this permission notice shall be
29 * included in all copies or substantial portions of the Software.
30 *
31 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
32 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
33 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
34 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
35 * LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
36 * OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
37 * WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
38 */
39
40#include <math.h>
41#include <vppinfra/format.h>
42#include <vlib/vlib.h>
43#include <vlib/threads.h>
Dave Barach5c20a012017-06-13 08:48:31 -040044#include <vppinfra/tw_timer_1t_3w_1024sl_ov.h>
Ed Warnickecb9cada2015-12-08 15:45:58 -070045
Damjan Marion04a7f052017-07-10 15:06:17 +020046#include <vlib/unix/unix.h>
Ed Warnickecb9cada2015-12-08 15:45:58 -070047#include <vlib/unix/cj.h>
48
49CJ_GLOBAL_LOG_PROTOTYPE;
50
Ed Warnickecb9cada2015-12-08 15:45:58 -070051/* Actually allocate a few extra slots of vector data to support
52 speculative vector enqueues which overflow vector data in next frame. */
53#define VLIB_FRAME_SIZE_ALLOC (VLIB_FRAME_SIZE + 4)
54
Damjan Marion6a7acc22016-12-19 16:28:36 +010055u32 wraps;
56
Ed Warnickecb9cada2015-12-08 15:45:58 -070057always_inline u32
58vlib_frame_bytes (u32 n_scalar_bytes, u32 n_vector_bytes)
59{
60 u32 n_bytes;
61
62 /* Make room for vlib_frame_t plus scalar arguments. */
63 n_bytes = vlib_frame_vector_byte_offset (n_scalar_bytes);
64
65 /* Make room for vector arguments.
66 Allocate a few extra slots of vector data to support
67 speculative vector enqueues which overflow vector data in next frame. */
68#define VLIB_FRAME_SIZE_EXTRA 4
69 n_bytes += (VLIB_FRAME_SIZE + VLIB_FRAME_SIZE_EXTRA) * n_vector_bytes;
70
71 /* Magic number is first 32bit number after vector data.
72 Used to make sure that vector data is never overrun. */
73#define VLIB_FRAME_MAGIC (0xabadc0ed)
74 n_bytes += sizeof (u32);
75
76 /* Pad to cache line. */
77 n_bytes = round_pow2 (n_bytes, CLIB_CACHE_LINE_BYTES);
78
79 return n_bytes;
80}
81
82always_inline u32 *
83vlib_frame_find_magic (vlib_frame_t * f, vlib_node_t * node)
84{
Dave Barach9b8ffd92016-07-08 08:13:45 -040085 void *p = f;
Ed Warnickecb9cada2015-12-08 15:45:58 -070086
87 p += vlib_frame_vector_byte_offset (node->scalar_size);
88
89 p += (VLIB_FRAME_SIZE + VLIB_FRAME_SIZE_EXTRA) * node->vector_size;
90
91 return p;
92}
93
94static vlib_frame_size_t *
95get_frame_size_info (vlib_node_main_t * nm,
96 u32 n_scalar_bytes, u32 n_vector_bytes)
97{
98 uword key = (n_scalar_bytes << 16) | n_vector_bytes;
Dave Barach9b8ffd92016-07-08 08:13:45 -040099 uword *p, i;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700100
101 p = hash_get (nm->frame_size_hash, key);
102 if (p)
103 i = p[0];
104 else
105 {
106 i = vec_len (nm->frame_sizes);
107 vec_validate (nm->frame_sizes, i);
108 hash_set (nm->frame_size_hash, key, i);
109 }
110
111 return vec_elt_at_index (nm->frame_sizes, i);
112}
113
114static u32
Dave Barach9b8ffd92016-07-08 08:13:45 -0400115vlib_frame_alloc_to_node (vlib_main_t * vm, u32 to_node_index,
116 u32 frame_flags)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700117{
Dave Barach9b8ffd92016-07-08 08:13:45 -0400118 vlib_node_main_t *nm = &vm->node_main;
119 vlib_frame_size_t *fs;
120 vlib_node_t *to_node;
121 vlib_frame_t *f;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700122 u32 fi, l, n, scalar_size, vector_size;
123
124 to_node = vlib_get_node (vm, to_node_index);
125
126 scalar_size = to_node->scalar_size;
127 vector_size = to_node->vector_size;
128
129 fs = get_frame_size_info (nm, scalar_size, vector_size);
130 n = vlib_frame_bytes (scalar_size, vector_size);
131 if ((l = vec_len (fs->free_frame_indices)) > 0)
132 {
133 /* Allocate from end of free list. */
134 fi = fs->free_frame_indices[l - 1];
135 f = vlib_get_frame_no_check (vm, fi);
136 _vec_len (fs->free_frame_indices) = l - 1;
137 }
138 else
139 {
Damjan Marion3f46baf2016-02-06 19:16:21 +0100140 f = clib_mem_alloc_aligned_no_fail (n, VLIB_FRAME_ALIGN);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700141 fi = vlib_frame_index_no_check (vm, f);
142 }
143
144 /* Poison frame when debugging. */
145 if (CLIB_DEBUG > 0)
Dave Barachd84ba852017-08-22 17:56:46 -0400146 memset (f, 0xfe, n);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700147
148 /* Insert magic number. */
149 {
Dave Barach9b8ffd92016-07-08 08:13:45 -0400150 u32 *magic;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700151
152 magic = vlib_frame_find_magic (f, to_node);
153 *magic = VLIB_FRAME_MAGIC;
154 }
155
156 f->flags = VLIB_FRAME_IS_ALLOCATED | frame_flags;
157 f->n_vectors = 0;
158 f->scalar_size = scalar_size;
159 f->vector_size = vector_size;
160
161 fs->n_alloc_frames += 1;
162
163 return fi;
164}
165
166/* Allocate a frame for from FROM_NODE to TO_NODE via TO_NEXT_INDEX.
167 Returns frame index. */
168static u32
Dave Barach9b8ffd92016-07-08 08:13:45 -0400169vlib_frame_alloc (vlib_main_t * vm, vlib_node_runtime_t * from_node_runtime,
170 u32 to_next_index)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700171{
Dave Barach9b8ffd92016-07-08 08:13:45 -0400172 vlib_node_t *from_node;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700173
174 from_node = vlib_get_node (vm, from_node_runtime->node_index);
175 ASSERT (to_next_index < vec_len (from_node->next_nodes));
176
Dave Barach9b8ffd92016-07-08 08:13:45 -0400177 return vlib_frame_alloc_to_node (vm, from_node->next_nodes[to_next_index],
Ed Warnickecb9cada2015-12-08 15:45:58 -0700178 /* frame_flags */ 0);
179}
180
181vlib_frame_t *
182vlib_get_frame_to_node (vlib_main_t * vm, u32 to_node_index)
183{
184 u32 fi = vlib_frame_alloc_to_node (vm, to_node_index,
Dave Barach9b8ffd92016-07-08 08:13:45 -0400185 /* frame_flags */
186 VLIB_FRAME_FREE_AFTER_DISPATCH);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700187 return vlib_get_frame (vm, fi);
188}
189
Dave Barach9b8ffd92016-07-08 08:13:45 -0400190void
191vlib_put_frame_to_node (vlib_main_t * vm, u32 to_node_index, vlib_frame_t * f)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700192{
Dave Barach9b8ffd92016-07-08 08:13:45 -0400193 vlib_pending_frame_t *p;
194 vlib_node_t *to_node;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700195
196 if (f->n_vectors == 0)
197 return;
198
199 to_node = vlib_get_node (vm, to_node_index);
200
201 vec_add2 (vm->node_main.pending_frames, p, 1);
202
203 f->flags |= VLIB_FRAME_PENDING;
204 p->frame_index = vlib_frame_index (vm, f);
205 p->node_runtime_index = to_node->runtime_index;
206 p->next_frame_index = VLIB_PENDING_FRAME_NO_NEXT_FRAME;
207}
208
209/* Free given frame. */
210void
Dave Barach9b8ffd92016-07-08 08:13:45 -0400211vlib_frame_free (vlib_main_t * vm, vlib_node_runtime_t * r, vlib_frame_t * f)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700212{
Dave Barach9b8ffd92016-07-08 08:13:45 -0400213 vlib_node_main_t *nm = &vm->node_main;
214 vlib_node_t *node;
215 vlib_frame_size_t *fs;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700216 u32 frame_index;
Dave Barach9b8ffd92016-07-08 08:13:45 -0400217
Ed Warnickecb9cada2015-12-08 15:45:58 -0700218 ASSERT (f->flags & VLIB_FRAME_IS_ALLOCATED);
219
220 node = vlib_get_node (vm, r->node_index);
221 fs = get_frame_size_info (nm, node->scalar_size, node->vector_size);
222
223 frame_index = vlib_frame_index (vm, f);
224
225 ASSERT (f->flags & VLIB_FRAME_IS_ALLOCATED);
226
227 /* No next frames may point to freed frame. */
228 if (CLIB_DEBUG > 0)
229 {
Dave Barach9b8ffd92016-07-08 08:13:45 -0400230 vlib_next_frame_t *nf;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700231 vec_foreach (nf, vm->node_main.next_frames)
232 ASSERT (nf->frame_index != frame_index);
233 }
234
235 f->flags &= ~VLIB_FRAME_IS_ALLOCATED;
236
237 vec_add1 (fs->free_frame_indices, frame_index);
238 ASSERT (fs->n_alloc_frames > 0);
239 fs->n_alloc_frames -= 1;
240}
241
242static clib_error_t *
243show_frame_stats (vlib_main_t * vm,
Dave Barach9b8ffd92016-07-08 08:13:45 -0400244 unformat_input_t * input, vlib_cli_command_t * cmd)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700245{
Dave Barach9b8ffd92016-07-08 08:13:45 -0400246 vlib_node_main_t *nm = &vm->node_main;
247 vlib_frame_size_t *fs;
248
Ed Warnickecb9cada2015-12-08 15:45:58 -0700249 vlib_cli_output (vm, "%=6s%=12s%=12s", "Size", "# Alloc", "# Free");
250 vec_foreach (fs, nm->frame_sizes)
Dave Barach9b8ffd92016-07-08 08:13:45 -0400251 {
252 u32 n_alloc = fs->n_alloc_frames;
253 u32 n_free = vec_len (fs->free_frame_indices);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700254
Dave Barach9b8ffd92016-07-08 08:13:45 -0400255 if (n_alloc + n_free > 0)
256 vlib_cli_output (vm, "%=6d%=12d%=12d",
257 fs - nm->frame_sizes, n_alloc, n_free);
258 }
Ed Warnickecb9cada2015-12-08 15:45:58 -0700259
260 return 0;
261}
262
Dave Barach9b8ffd92016-07-08 08:13:45 -0400263/* *INDENT-OFF* */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700264VLIB_CLI_COMMAND (show_frame_stats_cli, static) = {
265 .path = "show vlib frame-allocation",
266 .short_help = "Show node dispatch frame statistics",
267 .function = show_frame_stats,
268};
Dave Barach9b8ffd92016-07-08 08:13:45 -0400269/* *INDENT-ON* */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700270
271/* Change ownership of enqueue rights to given next node. */
272static void
273vlib_next_frame_change_ownership (vlib_main_t * vm,
274 vlib_node_runtime_t * node_runtime,
275 u32 next_index)
276{
Dave Barach9b8ffd92016-07-08 08:13:45 -0400277 vlib_node_main_t *nm = &vm->node_main;
278 vlib_next_frame_t *next_frame;
279 vlib_node_t *node, *next_node;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700280
281 node = vec_elt (nm->nodes, node_runtime->node_index);
282
283 /* Only internal & input nodes are allowed to call other nodes. */
284 ASSERT (node->type == VLIB_NODE_TYPE_INTERNAL
285 || node->type == VLIB_NODE_TYPE_INPUT
286 || node->type == VLIB_NODE_TYPE_PROCESS);
287
288 ASSERT (vec_len (node->next_nodes) == node_runtime->n_next_nodes);
289
Dave Barach9b8ffd92016-07-08 08:13:45 -0400290 next_frame =
291 vlib_node_runtime_get_next_frame (vm, node_runtime, next_index);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700292 next_node = vec_elt (nm->nodes, node->next_nodes[next_index]);
293
294 if (next_node->owner_node_index != VLIB_INVALID_NODE_INDEX)
295 {
296 /* Get frame from previous owner. */
Dave Barach9b8ffd92016-07-08 08:13:45 -0400297 vlib_next_frame_t *owner_next_frame;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700298 vlib_next_frame_t tmp;
299
300 owner_next_frame =
301 vlib_node_get_next_frame (vm,
302 next_node->owner_node_index,
303 next_node->owner_next_index);
304
305 /* Swap target next frame with owner's. */
306 tmp = owner_next_frame[0];
307 owner_next_frame[0] = next_frame[0];
308 next_frame[0] = tmp;
309
310 /*
311 * If next_frame is already pending, we have to track down
312 * all pending frames and fix their next_frame_index fields.
313 */
314 if (next_frame->flags & VLIB_FRAME_PENDING)
Dave Barach9b8ffd92016-07-08 08:13:45 -0400315 {
316 vlib_pending_frame_t *p;
317 if (next_frame->frame_index != ~0)
318 {
319 vec_foreach (p, nm->pending_frames)
320 {
321 if (p->frame_index == next_frame->frame_index)
322 {
323 p->next_frame_index =
324 next_frame - vm->node_main.next_frames;
325 }
326 }
327 }
328 }
Ed Warnickecb9cada2015-12-08 15:45:58 -0700329 }
330 else
331 {
332 /* No previous owner. Take ownership. */
333 next_frame->flags |= VLIB_FRAME_OWNER;
334 }
Dave Barach9b8ffd92016-07-08 08:13:45 -0400335
Ed Warnickecb9cada2015-12-08 15:45:58 -0700336 /* Record new owner. */
337 next_node->owner_node_index = node->index;
338 next_node->owner_next_index = next_index;
339
340 /* Now we should be owner. */
341 ASSERT (next_frame->flags & VLIB_FRAME_OWNER);
Dave Barach9b8ffd92016-07-08 08:13:45 -0400342}
Ed Warnickecb9cada2015-12-08 15:45:58 -0700343
344/* Make sure that magic number is still there.
345 Otherwise, it is likely that caller has overrun frame arguments. */
346always_inline void
347validate_frame_magic (vlib_main_t * vm,
Dave Barach9b8ffd92016-07-08 08:13:45 -0400348 vlib_frame_t * f, vlib_node_t * n, uword next_index)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700349{
Dave Barach9b8ffd92016-07-08 08:13:45 -0400350 vlib_node_t *next_node = vlib_get_node (vm, n->next_nodes[next_index]);
351 u32 *magic = vlib_frame_find_magic (f, next_node);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700352 ASSERT (VLIB_FRAME_MAGIC == magic[0]);
353}
354
355vlib_frame_t *
356vlib_get_next_frame_internal (vlib_main_t * vm,
357 vlib_node_runtime_t * node,
Dave Barach9b8ffd92016-07-08 08:13:45 -0400358 u32 next_index, u32 allocate_new_next_frame)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700359{
Dave Barach9b8ffd92016-07-08 08:13:45 -0400360 vlib_frame_t *f;
361 vlib_next_frame_t *nf;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700362 u32 n_used;
363
364 nf = vlib_node_runtime_get_next_frame (vm, node, next_index);
365
366 /* Make sure this next frame owns right to enqueue to destination frame. */
Dave Barach9b8ffd92016-07-08 08:13:45 -0400367 if (PREDICT_FALSE (!(nf->flags & VLIB_FRAME_OWNER)))
Ed Warnickecb9cada2015-12-08 15:45:58 -0700368 vlib_next_frame_change_ownership (vm, node, next_index);
369
370 /* ??? Don't need valid flag: can use frame_index == ~0 */
Dave Barach9b8ffd92016-07-08 08:13:45 -0400371 if (PREDICT_FALSE (!(nf->flags & VLIB_FRAME_IS_ALLOCATED)))
Ed Warnickecb9cada2015-12-08 15:45:58 -0700372 {
373 nf->frame_index = vlib_frame_alloc (vm, node, next_index);
374 nf->flags |= VLIB_FRAME_IS_ALLOCATED;
375 }
376
377 f = vlib_get_frame (vm, nf->frame_index);
378
379 /* Has frame been removed from pending vector (e.g. finished dispatching)?
380 If so we can reuse frame. */
Dave Barach9b8ffd92016-07-08 08:13:45 -0400381 if ((nf->flags & VLIB_FRAME_PENDING) && !(f->flags & VLIB_FRAME_PENDING))
Ed Warnickecb9cada2015-12-08 15:45:58 -0700382 {
383 nf->flags &= ~VLIB_FRAME_PENDING;
384 f->n_vectors = 0;
385 }
386
387 /* Allocate new frame if current one is already full. */
388 n_used = f->n_vectors;
389 if (n_used >= VLIB_FRAME_SIZE || (allocate_new_next_frame && n_used > 0))
390 {
391 /* Old frame may need to be freed after dispatch, since we'll have
Dave Barach9b8ffd92016-07-08 08:13:45 -0400392 two redundant frames from node -> next node. */
393 if (!(nf->flags & VLIB_FRAME_NO_FREE_AFTER_DISPATCH))
Ed Warnickecb9cada2015-12-08 15:45:58 -0700394 {
Dave Barach9b8ffd92016-07-08 08:13:45 -0400395 vlib_frame_t *f_old = vlib_get_frame (vm, nf->frame_index);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700396 f_old->flags |= VLIB_FRAME_FREE_AFTER_DISPATCH;
397 }
398
399 /* Allocate new frame to replace full one. */
400 nf->frame_index = vlib_frame_alloc (vm, node, next_index);
401 f = vlib_get_frame (vm, nf->frame_index);
402 n_used = f->n_vectors;
403 }
404
405 /* Should have free vectors in frame now. */
406 ASSERT (n_used < VLIB_FRAME_SIZE);
407
408 if (CLIB_DEBUG > 0)
409 {
410 validate_frame_magic (vm, f,
Dave Barach9b8ffd92016-07-08 08:13:45 -0400411 vlib_get_node (vm, node->node_index), next_index);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700412 }
413
414 return f;
415}
416
417static void
418vlib_put_next_frame_validate (vlib_main_t * vm,
419 vlib_node_runtime_t * rt,
Dave Barach9b8ffd92016-07-08 08:13:45 -0400420 u32 next_index, u32 n_vectors_left)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700421{
Dave Barach9b8ffd92016-07-08 08:13:45 -0400422 vlib_node_main_t *nm = &vm->node_main;
423 vlib_next_frame_t *nf;
424 vlib_frame_t *f;
425 vlib_node_runtime_t *next_rt;
426 vlib_node_t *next_node;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700427 u32 n_before, n_after;
428
429 nf = vlib_node_runtime_get_next_frame (vm, rt, next_index);
430 f = vlib_get_frame (vm, nf->frame_index);
431
432 ASSERT (n_vectors_left <= VLIB_FRAME_SIZE);
433 n_after = VLIB_FRAME_SIZE - n_vectors_left;
434 n_before = f->n_vectors;
435
436 ASSERT (n_after >= n_before);
437
438 next_rt = vec_elt_at_index (nm->nodes_by_type[VLIB_NODE_TYPE_INTERNAL],
439 nf->node_runtime_index);
440 next_node = vlib_get_node (vm, next_rt->node_index);
441 if (n_after > 0 && next_node->validate_frame)
442 {
Dave Barach9b8ffd92016-07-08 08:13:45 -0400443 u8 *msg = next_node->validate_frame (vm, rt, f);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700444 if (msg)
445 {
446 clib_warning ("%v", msg);
447 ASSERT (0);
448 }
449 vec_free (msg);
450 }
451}
452
453void
454vlib_put_next_frame (vlib_main_t * vm,
455 vlib_node_runtime_t * r,
Dave Barach9b8ffd92016-07-08 08:13:45 -0400456 u32 next_index, u32 n_vectors_left)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700457{
Dave Barach9b8ffd92016-07-08 08:13:45 -0400458 vlib_node_main_t *nm = &vm->node_main;
459 vlib_next_frame_t *nf;
460 vlib_frame_t *f;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700461 u32 n_vectors_in_frame;
462
Damjan Marion04a7f052017-07-10 15:06:17 +0200463 if (vm->buffer_main->callbacks_registered == 0 && CLIB_DEBUG > 0)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700464 vlib_put_next_frame_validate (vm, r, next_index, n_vectors_left);
465
466 nf = vlib_node_runtime_get_next_frame (vm, r, next_index);
467 f = vlib_get_frame (vm, nf->frame_index);
468
469 /* Make sure that magic number is still there. Otherwise, caller
470 has overrun frame meta data. */
471 if (CLIB_DEBUG > 0)
472 {
Dave Barach9b8ffd92016-07-08 08:13:45 -0400473 vlib_node_t *node = vlib_get_node (vm, r->node_index);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700474 validate_frame_magic (vm, f, node, next_index);
475 }
476
477 /* Convert # of vectors left -> number of vectors there. */
478 ASSERT (n_vectors_left <= VLIB_FRAME_SIZE);
479 n_vectors_in_frame = VLIB_FRAME_SIZE - n_vectors_left;
480
481 f->n_vectors = n_vectors_in_frame;
482
483 /* If vectors were added to frame, add to pending vector. */
484 if (PREDICT_TRUE (n_vectors_in_frame > 0))
485 {
Dave Barach9b8ffd92016-07-08 08:13:45 -0400486 vlib_pending_frame_t *p;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700487 u32 v0, v1;
Dave Barach9b8ffd92016-07-08 08:13:45 -0400488
Ed Warnickecb9cada2015-12-08 15:45:58 -0700489 r->cached_next_index = next_index;
490
491 if (!(f->flags & VLIB_FRAME_PENDING))
Dave Barach9b8ffd92016-07-08 08:13:45 -0400492 {
493 __attribute__ ((unused)) vlib_node_t *node;
494 vlib_node_t *next_node;
495 vlib_node_runtime_t *next_runtime;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700496
Dave Barach9b8ffd92016-07-08 08:13:45 -0400497 node = vlib_get_node (vm, r->node_index);
498 next_node = vlib_get_next_node (vm, r->node_index, next_index);
499 next_runtime = vlib_node_get_runtime (vm, next_node->index);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700500
Dave Barach9b8ffd92016-07-08 08:13:45 -0400501 vec_add2 (nm->pending_frames, p, 1);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700502
Dave Barach9b8ffd92016-07-08 08:13:45 -0400503 p->frame_index = nf->frame_index;
504 p->node_runtime_index = nf->node_runtime_index;
505 p->next_frame_index = nf - nm->next_frames;
506 nf->flags |= VLIB_FRAME_PENDING;
507 f->flags |= VLIB_FRAME_PENDING;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700508
Dave Barach9b8ffd92016-07-08 08:13:45 -0400509 /*
510 * If we're going to dispatch this frame on another thread,
511 * force allocation of a new frame. Otherwise, we create
512 * a dangling frame reference. Each thread has its own copy of
513 * the next_frames vector.
514 */
Damjan Marion586afd72017-04-05 19:18:20 +0200515 if (0 && r->thread_index != next_runtime->thread_index)
Dave Barach9b8ffd92016-07-08 08:13:45 -0400516 {
517 nf->frame_index = ~0;
518 nf->flags &= ~(VLIB_FRAME_PENDING | VLIB_FRAME_IS_ALLOCATED);
519 }
520 }
Ed Warnickecb9cada2015-12-08 15:45:58 -0700521
522 /* Copy trace flag from next_frame and from runtime. */
Dave Barach9b8ffd92016-07-08 08:13:45 -0400523 nf->flags |=
524 (nf->flags & VLIB_NODE_FLAG_TRACE) | (r->
525 flags & VLIB_NODE_FLAG_TRACE);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700526
527 v0 = nf->vectors_since_last_overflow;
528 v1 = v0 + n_vectors_in_frame;
529 nf->vectors_since_last_overflow = v1;
530 if (PREDICT_FALSE (v1 < v0))
531 {
Dave Barach9b8ffd92016-07-08 08:13:45 -0400532 vlib_node_t *node = vlib_get_node (vm, r->node_index);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700533 vec_elt (node->n_vectors_by_next_node, next_index) += v0;
534 }
535 }
536}
537
538/* Sync up runtime (32 bit counters) and main node stats (64 bit counters). */
539never_inline void
540vlib_node_runtime_sync_stats (vlib_main_t * vm,
541 vlib_node_runtime_t * r,
Dave Barach9b8ffd92016-07-08 08:13:45 -0400542 uword n_calls, uword n_vectors, uword n_clocks)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700543{
Dave Barach9b8ffd92016-07-08 08:13:45 -0400544 vlib_node_t *n = vlib_get_node (vm, r->node_index);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700545
546 n->stats_total.calls += n_calls + r->calls_since_last_overflow;
547 n->stats_total.vectors += n_vectors + r->vectors_since_last_overflow;
548 n->stats_total.clocks += n_clocks + r->clocks_since_last_overflow;
549 n->stats_total.max_clock = r->max_clock;
550 n->stats_total.max_clock_n = r->max_clock_n;
551
552 r->calls_since_last_overflow = 0;
553 r->vectors_since_last_overflow = 0;
554 r->clocks_since_last_overflow = 0;
555}
556
Dave Barach9b8ffd92016-07-08 08:13:45 -0400557always_inline void __attribute__ ((unused))
Ed Warnickecb9cada2015-12-08 15:45:58 -0700558vlib_process_sync_stats (vlib_main_t * vm,
559 vlib_process_t * p,
Dave Barach9b8ffd92016-07-08 08:13:45 -0400560 uword n_calls, uword n_vectors, uword n_clocks)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700561{
Dave Barach9b8ffd92016-07-08 08:13:45 -0400562 vlib_node_runtime_t *rt = &p->node_runtime;
563 vlib_node_t *n = vlib_get_node (vm, rt->node_index);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700564 vlib_node_runtime_sync_stats (vm, rt, n_calls, n_vectors, n_clocks);
565 n->stats_total.suspends += p->n_suspends;
566 p->n_suspends = 0;
567}
568
Dave Barach9b8ffd92016-07-08 08:13:45 -0400569void
570vlib_node_sync_stats (vlib_main_t * vm, vlib_node_t * n)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700571{
Dave Barach9b8ffd92016-07-08 08:13:45 -0400572 vlib_node_runtime_t *rt;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700573
574 if (n->type == VLIB_NODE_TYPE_PROCESS)
575 {
576 /* Nothing to do for PROCESS nodes except in main thread */
Dave Barach9b8ffd92016-07-08 08:13:45 -0400577 if (vm != &vlib_global_main)
578 return;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700579
Dave Barach9b8ffd92016-07-08 08:13:45 -0400580 vlib_process_t *p = vlib_get_process_from_node (vm, n);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700581 n->stats_total.suspends += p->n_suspends;
582 p->n_suspends = 0;
583 rt = &p->node_runtime;
584 }
585 else
Dave Barach9b8ffd92016-07-08 08:13:45 -0400586 rt =
587 vec_elt_at_index (vm->node_main.nodes_by_type[n->type],
588 n->runtime_index);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700589
590 vlib_node_runtime_sync_stats (vm, rt, 0, 0, 0);
591
592 /* Sync up runtime next frame vector counters with main node structure. */
593 {
Dave Barach9b8ffd92016-07-08 08:13:45 -0400594 vlib_next_frame_t *nf;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700595 uword i;
596 for (i = 0; i < rt->n_next_nodes; i++)
597 {
598 nf = vlib_node_runtime_get_next_frame (vm, rt, i);
Dave Barach9b8ffd92016-07-08 08:13:45 -0400599 vec_elt (n->n_vectors_by_next_node, i) +=
600 nf->vectors_since_last_overflow;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700601 nf->vectors_since_last_overflow = 0;
602 }
603 }
604}
605
606always_inline u32
607vlib_node_runtime_update_stats (vlib_main_t * vm,
608 vlib_node_runtime_t * node,
609 uword n_calls,
Dave Barach9b8ffd92016-07-08 08:13:45 -0400610 uword n_vectors, uword n_clocks)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700611{
612 u32 ca0, ca1, v0, v1, cl0, cl1, r;
613
614 cl0 = cl1 = node->clocks_since_last_overflow;
615 ca0 = ca1 = node->calls_since_last_overflow;
616 v0 = v1 = node->vectors_since_last_overflow;
617
618 ca1 = ca0 + n_calls;
619 v1 = v0 + n_vectors;
620 cl1 = cl0 + n_clocks;
621
622 node->calls_since_last_overflow = ca1;
623 node->clocks_since_last_overflow = cl1;
624 node->vectors_since_last_overflow = v1;
625 node->max_clock_n = node->max_clock > n_clocks ?
Dave Barach9b8ffd92016-07-08 08:13:45 -0400626 node->max_clock_n : n_vectors;
627 node->max_clock = node->max_clock > n_clocks ? node->max_clock : n_clocks;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700628
629 r = vlib_node_runtime_update_main_loop_vector_stats (vm, node, n_vectors);
630
631 if (PREDICT_FALSE (ca1 < ca0 || v1 < v0 || cl1 < cl0))
632 {
633 node->calls_since_last_overflow = ca0;
634 node->clocks_since_last_overflow = cl0;
635 node->vectors_since_last_overflow = v0;
636 vlib_node_runtime_sync_stats (vm, node, n_calls, n_vectors, n_clocks);
637 }
638
639 return r;
640}
641
642always_inline void
643vlib_process_update_stats (vlib_main_t * vm,
644 vlib_process_t * p,
Dave Barach9b8ffd92016-07-08 08:13:45 -0400645 uword n_calls, uword n_vectors, uword n_clocks)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700646{
647 vlib_node_runtime_update_stats (vm, &p->node_runtime,
648 n_calls, n_vectors, n_clocks);
649}
650
651static clib_error_t *
652vlib_cli_elog_clear (vlib_main_t * vm,
Dave Barach9b8ffd92016-07-08 08:13:45 -0400653 unformat_input_t * input, vlib_cli_command_t * cmd)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700654{
655 elog_reset_buffer (&vm->elog_main);
656 return 0;
657}
658
Dave Barach9b8ffd92016-07-08 08:13:45 -0400659/* *INDENT-OFF* */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700660VLIB_CLI_COMMAND (elog_clear_cli, static) = {
Dave Barache5389bb2016-03-28 17:12:19 -0400661 .path = "event-logger clear",
662 .short_help = "Clear the event log",
Ed Warnickecb9cada2015-12-08 15:45:58 -0700663 .function = vlib_cli_elog_clear,
664};
Dave Barach9b8ffd92016-07-08 08:13:45 -0400665/* *INDENT-ON* */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700666
667#ifdef CLIB_UNIX
668static clib_error_t *
669elog_save_buffer (vlib_main_t * vm,
Dave Barach9b8ffd92016-07-08 08:13:45 -0400670 unformat_input_t * input, vlib_cli_command_t * cmd)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700671{
Dave Barach9b8ffd92016-07-08 08:13:45 -0400672 elog_main_t *em = &vm->elog_main;
673 char *file, *chroot_file;
674 clib_error_t *error = 0;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700675
Dave Barach9b8ffd92016-07-08 08:13:45 -0400676 if (!unformat (input, "%s", &file))
Ed Warnickecb9cada2015-12-08 15:45:58 -0700677 {
678 vlib_cli_output (vm, "expected file name, got `%U'",
679 format_unformat_error, input);
680 return 0;
681 }
682
683 /* It's fairly hard to get "../oopsie" through unformat; just in case */
Dave Barach9b8ffd92016-07-08 08:13:45 -0400684 if (strstr (file, "..") || index (file, '/'))
Ed Warnickecb9cada2015-12-08 15:45:58 -0700685 {
686 vlib_cli_output (vm, "illegal characters in filename '%s'", file);
687 return 0;
688 }
689
690 chroot_file = (char *) format (0, "/tmp/%s%c", file, 0);
691
Dave Barach9b8ffd92016-07-08 08:13:45 -0400692 vec_free (file);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700693
694 vlib_cli_output (vm, "Saving %wd of %wd events to %s",
Dave Barach9b8ffd92016-07-08 08:13:45 -0400695 elog_n_events_in_buffer (em),
696 elog_buffer_capacity (em), chroot_file);
697
Ed Warnickecb9cada2015-12-08 15:45:58 -0700698 vlib_worker_thread_barrier_sync (vm);
Dave Barach903fd512017-04-01 11:07:40 -0400699 error = elog_write_file (em, chroot_file, 1 /* flush ring */ );
Dave Barach9b8ffd92016-07-08 08:13:45 -0400700 vlib_worker_thread_barrier_release (vm);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700701 vec_free (chroot_file);
702 return error;
703}
704
Dave Barach81481312017-05-16 09:08:14 -0400705void
706elog_post_mortem_dump (void)
707{
708 vlib_main_t *vm = &vlib_global_main;
709 elog_main_t *em = &vm->elog_main;
710 u8 *filename;
711 clib_error_t *error;
712
713 if (!vm->elog_post_mortem_dump)
714 return;
715
716 filename = format (0, "/tmp/elog_post_mortem.%d%c", getpid (), 0);
717 error = elog_write_file (em, (char *) filename, 1 /* flush ring */ );
718 if (error)
719 clib_error_report (error);
720 vec_free (filename);
721}
722
Dave Barach9b8ffd92016-07-08 08:13:45 -0400723/* *INDENT-OFF* */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700724VLIB_CLI_COMMAND (elog_save_cli, static) = {
Dave Barache5389bb2016-03-28 17:12:19 -0400725 .path = "event-logger save",
726 .short_help = "event-logger save <filename> (saves log in /tmp/<filename>)",
Ed Warnickecb9cada2015-12-08 15:45:58 -0700727 .function = elog_save_buffer,
728};
Dave Barach9b8ffd92016-07-08 08:13:45 -0400729/* *INDENT-ON* */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700730
Dave Barache5389bb2016-03-28 17:12:19 -0400731static clib_error_t *
732elog_stop (vlib_main_t * vm,
Dave Barach9b8ffd92016-07-08 08:13:45 -0400733 unformat_input_t * input, vlib_cli_command_t * cmd)
Dave Barache5389bb2016-03-28 17:12:19 -0400734{
Dave Barach9b8ffd92016-07-08 08:13:45 -0400735 elog_main_t *em = &vm->elog_main;
Dave Barache5389bb2016-03-28 17:12:19 -0400736
737 em->n_total_events_disable_limit = em->n_total_events;
738
739 vlib_cli_output (vm, "Stopped the event logger...");
740 return 0;
741}
742
Dave Barach9b8ffd92016-07-08 08:13:45 -0400743/* *INDENT-OFF* */
Dave Barache5389bb2016-03-28 17:12:19 -0400744VLIB_CLI_COMMAND (elog_stop_cli, static) = {
745 .path = "event-logger stop",
746 .short_help = "Stop the event-logger",
747 .function = elog_stop,
748};
Dave Barach9b8ffd92016-07-08 08:13:45 -0400749/* *INDENT-ON* */
Dave Barache5389bb2016-03-28 17:12:19 -0400750
751static clib_error_t *
752elog_restart (vlib_main_t * vm,
Dave Barach9b8ffd92016-07-08 08:13:45 -0400753 unformat_input_t * input, vlib_cli_command_t * cmd)
Dave Barache5389bb2016-03-28 17:12:19 -0400754{
Dave Barach9b8ffd92016-07-08 08:13:45 -0400755 elog_main_t *em = &vm->elog_main;
Dave Barache5389bb2016-03-28 17:12:19 -0400756
757 em->n_total_events_disable_limit = ~0;
758
759 vlib_cli_output (vm, "Restarted the event logger...");
760 return 0;
761}
762
Dave Barach9b8ffd92016-07-08 08:13:45 -0400763/* *INDENT-OFF* */
Dave Barache5389bb2016-03-28 17:12:19 -0400764VLIB_CLI_COMMAND (elog_restart_cli, static) = {
765 .path = "event-logger restart",
766 .short_help = "Restart the event-logger",
767 .function = elog_restart,
768};
Dave Barach9b8ffd92016-07-08 08:13:45 -0400769/* *INDENT-ON* */
Dave Barache5389bb2016-03-28 17:12:19 -0400770
771static clib_error_t *
772elog_resize (vlib_main_t * vm,
Dave Barach9b8ffd92016-07-08 08:13:45 -0400773 unformat_input_t * input, vlib_cli_command_t * cmd)
Dave Barache5389bb2016-03-28 17:12:19 -0400774{
Dave Barach9b8ffd92016-07-08 08:13:45 -0400775 elog_main_t *em = &vm->elog_main;
Dave Barache5389bb2016-03-28 17:12:19 -0400776 u32 tmp;
777
778 /* Stop the parade */
779 elog_reset_buffer (&vm->elog_main);
780
781 if (unformat (input, "%d", &tmp))
782 {
783 elog_alloc (em, tmp);
784 em->n_total_events_disable_limit = ~0;
785 }
Dave Barach9b8ffd92016-07-08 08:13:45 -0400786 else
Dave Barache5389bb2016-03-28 17:12:19 -0400787 return clib_error_return (0, "Must specify how many events in the ring");
788
789 vlib_cli_output (vm, "Resized ring and restarted the event logger...");
790 return 0;
791}
792
Dave Barach9b8ffd92016-07-08 08:13:45 -0400793/* *INDENT-OFF* */
Dave Barache5389bb2016-03-28 17:12:19 -0400794VLIB_CLI_COMMAND (elog_resize_cli, static) = {
795 .path = "event-logger resize",
796 .short_help = "event-logger resize <nnn>",
797 .function = elog_resize,
798};
Dave Barach9b8ffd92016-07-08 08:13:45 -0400799/* *INDENT-ON* */
Dave Barache5389bb2016-03-28 17:12:19 -0400800
Ed Warnickecb9cada2015-12-08 15:45:58 -0700801#endif /* CLIB_UNIX */
802
Dave Barach9b8ffd92016-07-08 08:13:45 -0400803static void
804elog_show_buffer_internal (vlib_main_t * vm, u32 n_events_to_show)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700805{
Dave Barach9b8ffd92016-07-08 08:13:45 -0400806 elog_main_t *em = &vm->elog_main;
807 elog_event_t *e, *es;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700808 f64 dt;
809
810 /* Show events in VLIB time since log clock starts after VLIB clock. */
Dave Barach9b8ffd92016-07-08 08:13:45 -0400811 dt = (em->init_time.cpu - vm->clib_time.init_cpu_time)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700812 * vm->clib_time.seconds_per_clock;
813
814 es = elog_peek_events (em);
Dave Barach9b8ffd92016-07-08 08:13:45 -0400815 vlib_cli_output (vm, "%d of %d events in buffer, logger %s", vec_len (es),
816 em->event_ring_size,
817 em->n_total_events < em->n_total_events_disable_limit ?
818 "running" : "stopped");
Ed Warnickecb9cada2015-12-08 15:45:58 -0700819 vec_foreach (e, es)
Dave Barach9b8ffd92016-07-08 08:13:45 -0400820 {
821 vlib_cli_output (vm, "%18.9f: %U",
822 e->time + dt, format_elog_event, em, e);
823 n_events_to_show--;
824 if (n_events_to_show == 0)
825 break;
826 }
Ed Warnickecb9cada2015-12-08 15:45:58 -0700827 vec_free (es);
Dave Barach9b8ffd92016-07-08 08:13:45 -0400828
Ed Warnickecb9cada2015-12-08 15:45:58 -0700829}
830
831static clib_error_t *
832elog_show_buffer (vlib_main_t * vm,
Dave Barach9b8ffd92016-07-08 08:13:45 -0400833 unformat_input_t * input, vlib_cli_command_t * cmd)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700834{
835 u32 n_events_to_show;
Dave Barach9b8ffd92016-07-08 08:13:45 -0400836 clib_error_t *error = 0;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700837
838 n_events_to_show = 250;
839 while (unformat_check_input (input) != UNFORMAT_END_OF_INPUT)
840 {
841 if (unformat (input, "%d", &n_events_to_show))
842 ;
843 else if (unformat (input, "all"))
844 n_events_to_show = ~0;
845 else
846 return unformat_parse_error (input);
847 }
848 elog_show_buffer_internal (vm, n_events_to_show);
849 return error;
850}
851
Dave Barach9b8ffd92016-07-08 08:13:45 -0400852/* *INDENT-OFF* */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700853VLIB_CLI_COMMAND (elog_show_cli, static) = {
854 .path = "show event-logger",
855 .short_help = "Show event logger info",
856 .function = elog_show_buffer,
857};
Dave Barach9b8ffd92016-07-08 08:13:45 -0400858/* *INDENT-ON* */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700859
Dave Barach9b8ffd92016-07-08 08:13:45 -0400860void
861vlib_gdb_show_event_log (void)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700862{
Dave Barach9b8ffd92016-07-08 08:13:45 -0400863 elog_show_buffer_internal (vlib_get_main (), (u32) ~ 0);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700864}
865
Dave Barachfb6e59d2016-03-26 18:45:42 -0400866static inline void
Ed Warnickecb9cada2015-12-08 15:45:58 -0700867vlib_elog_main_loop_event (vlib_main_t * vm,
868 u32 node_index,
Dave Barach9b8ffd92016-07-08 08:13:45 -0400869 u64 time, u32 n_vectors, u32 is_return)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700870{
Dave Barach9b8ffd92016-07-08 08:13:45 -0400871 vlib_main_t *evm = &vlib_global_main;
872 elog_main_t *em = &evm->elog_main;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700873
Dave Barachfb6e59d2016-03-26 18:45:42 -0400874 if (VLIB_ELOG_MAIN_LOOP && n_vectors)
875 elog_track (em,
Dave Barach9b8ffd92016-07-08 08:13:45 -0400876 /* event type */
877 vec_elt_at_index (is_return
878 ? evm->node_return_elog_event_types
879 : evm->node_call_elog_event_types,
880 node_index),
881 /* track */
Damjan Marion586afd72017-04-05 19:18:20 +0200882 (vm->thread_index ? &vlib_worker_threads[vm->thread_index].
Dave Barach9b8ffd92016-07-08 08:13:45 -0400883 elog_track : &em->default_track),
884 /* data to log */ n_vectors);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700885}
886
#if VLIB_BUFFER_TRACE_TRAJECTORY > 0
/* Optional hooks; each is called only while it is non-zero. */
void (*vlib_buffer_trace_trajectory_cb) (vlib_buffer_t * b, u32 node_index);
void (*vlib_buffer_trace_trajectory_init_cb) (vlib_buffer_t * b);

/*
 * Forward buffer b to the trajectory-init hook, if one has been
 * installed; otherwise do nothing.
 */
void
vlib_buffer_trace_trajectory_init (vlib_buffer_t * b)
{
  if (PREDICT_FALSE (vlib_buffer_trace_trajectory_init_cb == 0))
    return;

  (*vlib_buffer_trace_trajectory_init_cb) (b);
}

#endif
901
902static inline void
903add_trajectory_trace (vlib_buffer_t * b, u32 node_index)
904{
905#if VLIB_BUFFER_TRACE_TRAJECTORY > 0
906 if (PREDICT_TRUE (vlib_buffer_trace_trajectory_cb != 0))
907 {
908 (*vlib_buffer_trace_trajectory_cb) (b, node_index);
909 }
910#endif
911}
Ed Warnickecb9cada2015-12-08 15:45:58 -0700912
Damjan Marion9a332e12017-03-28 15:11:20 +0200913static_always_inline u64
Ed Warnickecb9cada2015-12-08 15:45:58 -0700914dispatch_node (vlib_main_t * vm,
915 vlib_node_runtime_t * node,
916 vlib_node_type_t type,
917 vlib_node_state_t dispatch_state,
Dave Barach9b8ffd92016-07-08 08:13:45 -0400918 vlib_frame_t * frame, u64 last_time_stamp)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700919{
920 uword n, v;
921 u64 t;
Dave Barach9b8ffd92016-07-08 08:13:45 -0400922 vlib_node_main_t *nm = &vm->node_main;
923 vlib_next_frame_t *nf;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700924
925 if (CLIB_DEBUG > 0)
926 {
Dave Barach9b8ffd92016-07-08 08:13:45 -0400927 vlib_node_t *n = vlib_get_node (vm, node->node_index);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700928 ASSERT (n->type == type);
929 }
930
931 /* Only non-internal nodes may be disabled. */
932 if (type != VLIB_NODE_TYPE_INTERNAL && node->state != dispatch_state)
933 {
934 ASSERT (type != VLIB_NODE_TYPE_INTERNAL);
935 return last_time_stamp;
936 }
937
938 if ((type == VLIB_NODE_TYPE_PRE_INPUT || type == VLIB_NODE_TYPE_INPUT)
939 && dispatch_state != VLIB_NODE_STATE_INTERRUPT)
940 {
941 u32 c = node->input_main_loops_per_call;
942 /* Only call node when count reaches zero. */
943 if (c)
944 {
945 node->input_main_loops_per_call = c - 1;
946 return last_time_stamp;
947 }
948 }
949
950 /* Speculatively prefetch next frames. */
951 if (node->n_next_nodes > 0)
952 {
953 nf = vec_elt_at_index (nm->next_frames, node->next_frame_index);
954 CLIB_PREFETCH (nf, 4 * sizeof (nf[0]), WRITE);
955 }
956
957 vm->cpu_time_last_node_dispatch = last_time_stamp;
958
Damjan Marion586afd72017-04-05 19:18:20 +0200959 if (1 /* || vm->thread_index == node->thread_index */ )
Ed Warnickecb9cada2015-12-08 15:45:58 -0700960 {
961 vlib_main_t *stat_vm;
962
963 stat_vm = /* vlib_mains ? vlib_mains[0] : */ vm;
964
965 vlib_elog_main_loop_event (vm, node->node_index,
Dave Barach9b8ffd92016-07-08 08:13:45 -0400966 last_time_stamp,
967 frame ? frame->n_vectors : 0,
968 /* is_after */ 0);
969
Ed Warnickecb9cada2015-12-08 15:45:58 -0700970 /*
971 * Turn this on if you run into
972 * "bad monkey" contexts, and you want to know exactly
973 * which nodes they've visited... See ixge.c...
974 */
975 if (VLIB_BUFFER_TRACE_TRAJECTORY && frame)
Dave Barach9b8ffd92016-07-08 08:13:45 -0400976 {
977 int i;
Dave Barach9b8ffd92016-07-08 08:13:45 -0400978 u32 *from;
979 from = vlib_frame_vector_args (frame);
980 for (i = 0; i < frame->n_vectors; i++)
981 {
982 vlib_buffer_t *b = vlib_get_buffer (vm, from[i]);
Dave Barach7bee7732017-10-18 18:48:11 -0400983 add_trajectory_trace (b, node->node_index);
Dave Barach9b8ffd92016-07-08 08:13:45 -0400984 }
985 n = node->function (vm, node, frame);
986 }
Ed Warnickecb9cada2015-12-08 15:45:58 -0700987 else
Dave Barach9b8ffd92016-07-08 08:13:45 -0400988 n = node->function (vm, node, frame);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700989
990 t = clib_cpu_time_now ();
991
Dave Barach9b8ffd92016-07-08 08:13:45 -0400992 vlib_elog_main_loop_event (vm, node->node_index, t, n, /* is_after */
993 1);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700994
995 vm->main_loop_vectors_processed += n;
996 vm->main_loop_nodes_processed += n > 0;
997
998 v = vlib_node_runtime_update_stats (stat_vm, node,
Dave Barach9b8ffd92016-07-08 08:13:45 -0400999 /* n_calls */ 1,
1000 /* n_vectors */ n,
1001 /* n_clocks */ t - last_time_stamp);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001002
1003 /* When in interrupt mode and vector rate crosses threshold switch to
1004 polling mode. */
Damjan Marion878c6092017-01-04 13:19:27 +01001005 if ((dispatch_state == VLIB_NODE_STATE_INTERRUPT)
1006 || (dispatch_state == VLIB_NODE_STATE_POLLING
Dave Barach9b8ffd92016-07-08 08:13:45 -04001007 && (node->flags
1008 & VLIB_NODE_FLAG_SWITCH_FROM_INTERRUPT_TO_POLLING_MODE)))
1009 {
Steven6aa75af2017-02-24 10:03:22 -08001010#ifdef DISPATCH_NODE_ELOG_REQUIRED
Dave Barach9b8ffd92016-07-08 08:13:45 -04001011 ELOG_TYPE_DECLARE (e) =
1012 {
1013 .function = (char *) __FUNCTION__,.format =
1014 "%s vector length %d, switching to %s",.format_args =
1015 "T4i4t4",.n_enum_strings = 2,.enum_strings =
1016 {
1017 "interrupt", "polling",},};
1018 struct
1019 {
1020 u32 node_name, vector_length, is_polling;
1021 } *ed;
Damjan Marion586afd72017-04-05 19:18:20 +02001022 vlib_worker_thread_t *w = vlib_worker_threads + vm->thread_index;
Steven6aa75af2017-02-24 10:03:22 -08001023#endif
Ed Warnickecb9cada2015-12-08 15:45:58 -07001024
Steven7312cc72017-03-15 21:18:55 -07001025 if ((dispatch_state == VLIB_NODE_STATE_INTERRUPT
1026 && v >= nm->polling_threshold_vector_length) &&
1027 !(node->flags &
1028 VLIB_NODE_FLAG_SWITCH_FROM_INTERRUPT_TO_POLLING_MODE))
Dave Barach9b8ffd92016-07-08 08:13:45 -04001029 {
1030 vlib_node_t *n = vlib_get_node (vm, node->node_index);
1031 n->state = VLIB_NODE_STATE_POLLING;
1032 node->state = VLIB_NODE_STATE_POLLING;
Dave Barach9b8ffd92016-07-08 08:13:45 -04001033 node->flags &=
1034 ~VLIB_NODE_FLAG_SWITCH_FROM_POLLING_TO_INTERRUPT_MODE;
1035 node->flags |=
1036 VLIB_NODE_FLAG_SWITCH_FROM_INTERRUPT_TO_POLLING_MODE;
1037 nm->input_node_counts_by_state[VLIB_NODE_STATE_INTERRUPT] -= 1;
1038 nm->input_node_counts_by_state[VLIB_NODE_STATE_POLLING] += 1;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001039
Steven6aa75af2017-02-24 10:03:22 -08001040#ifdef DISPATCH_NODE_ELOG_REQUIRED
1041 ed = ELOG_TRACK_DATA (&vlib_global_main.elog_main, e,
1042 w->elog_track);
Dave Barach9b8ffd92016-07-08 08:13:45 -04001043 ed->node_name = n->name_elog_string;
1044 ed->vector_length = v;
1045 ed->is_polling = 1;
Steven6aa75af2017-02-24 10:03:22 -08001046#endif
Dave Barach9b8ffd92016-07-08 08:13:45 -04001047 }
1048 else if (dispatch_state == VLIB_NODE_STATE_POLLING
1049 && v <= nm->interrupt_threshold_vector_length)
1050 {
1051 vlib_node_t *n = vlib_get_node (vm, node->node_index);
1052 if (node->flags &
1053 VLIB_NODE_FLAG_SWITCH_FROM_POLLING_TO_INTERRUPT_MODE)
1054 {
1055 /* Switch to interrupt mode after dispatch in polling one more time.
1056 This allows driver to re-enable interrupts. */
1057 n->state = VLIB_NODE_STATE_INTERRUPT;
1058 node->state = VLIB_NODE_STATE_INTERRUPT;
1059 node->flags &=
1060 ~VLIB_NODE_FLAG_SWITCH_FROM_INTERRUPT_TO_POLLING_MODE;
1061 nm->input_node_counts_by_state[VLIB_NODE_STATE_POLLING] -=
1062 1;
1063 nm->input_node_counts_by_state[VLIB_NODE_STATE_INTERRUPT] +=
1064 1;
1065
1066 }
1067 else
1068 {
1069 node->flags |=
1070 VLIB_NODE_FLAG_SWITCH_FROM_POLLING_TO_INTERRUPT_MODE;
Steven6aa75af2017-02-24 10:03:22 -08001071#ifdef DISPATCH_NODE_ELOG_REQUIRED
1072 ed = ELOG_TRACK_DATA (&vlib_global_main.elog_main, e,
1073 w->elog_track);
Dave Barach9b8ffd92016-07-08 08:13:45 -04001074 ed->node_name = n->name_elog_string;
1075 ed->vector_length = v;
1076 ed->is_polling = 0;
Steven6aa75af2017-02-24 10:03:22 -08001077#endif
Dave Barach9b8ffd92016-07-08 08:13:45 -04001078 }
1079 }
1080 }
Ed Warnickecb9cada2015-12-08 15:45:58 -07001081 }
1082
1083 return t;
1084}
1085
Damjan Marion9a332e12017-03-28 15:11:20 +02001086static u64
Dave Baracha6269992017-06-07 08:18:49 -04001087dispatch_pending_node (vlib_main_t * vm, uword pending_frame_index,
1088 u64 last_time_stamp)
Ed Warnickecb9cada2015-12-08 15:45:58 -07001089{
Dave Barach9b8ffd92016-07-08 08:13:45 -04001090 vlib_node_main_t *nm = &vm->node_main;
1091 vlib_frame_t *f;
1092 vlib_next_frame_t *nf, nf_dummy;
1093 vlib_node_runtime_t *n;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001094 u32 restore_frame_index;
Dave Baracha6269992017-06-07 08:18:49 -04001095 vlib_pending_frame_t *p;
1096
1097 /* See comment below about dangling references to nm->pending_frames */
1098 p = nm->pending_frames + pending_frame_index;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001099
1100 n = vec_elt_at_index (nm->nodes_by_type[VLIB_NODE_TYPE_INTERNAL],
1101 p->node_runtime_index);
1102
1103 f = vlib_get_frame (vm, p->frame_index);
1104 if (p->next_frame_index == VLIB_PENDING_FRAME_NO_NEXT_FRAME)
1105 {
1106 /* No next frame: so use dummy on stack. */
1107 nf = &nf_dummy;
1108 nf->flags = f->flags & VLIB_NODE_FLAG_TRACE;
1109 nf->frame_index = ~p->frame_index;
1110 }
1111 else
1112 nf = vec_elt_at_index (nm->next_frames, p->next_frame_index);
1113
1114 ASSERT (f->flags & VLIB_FRAME_IS_ALLOCATED);
1115
1116 /* Force allocation of new frame while current frame is being
1117 dispatched. */
1118 restore_frame_index = ~0;
1119 if (nf->frame_index == p->frame_index)
1120 {
1121 nf->frame_index = ~0;
1122 nf->flags &= ~VLIB_FRAME_IS_ALLOCATED;
Dave Barach9b8ffd92016-07-08 08:13:45 -04001123 if (!(n->flags & VLIB_NODE_FLAG_FRAME_NO_FREE_AFTER_DISPATCH))
Ed Warnickecb9cada2015-12-08 15:45:58 -07001124 restore_frame_index = p->frame_index;
1125 }
1126
1127 /* Frame must be pending. */
1128 ASSERT (f->flags & VLIB_FRAME_PENDING);
1129 ASSERT (f->n_vectors > 0);
1130
1131 /* Copy trace flag from next frame to node.
1132 Trace flag indicates that at least one vector in the dispatched
1133 frame is traced. */
1134 n->flags &= ~VLIB_NODE_FLAG_TRACE;
1135 n->flags |= (nf->flags & VLIB_FRAME_TRACE) ? VLIB_NODE_FLAG_TRACE : 0;
1136 nf->flags &= ~VLIB_FRAME_TRACE;
1137
1138 last_time_stamp = dispatch_node (vm, n,
1139 VLIB_NODE_TYPE_INTERNAL,
1140 VLIB_NODE_STATE_POLLING,
1141 f, last_time_stamp);
1142
1143 f->flags &= ~VLIB_FRAME_PENDING;
1144
1145 /* Frame is ready to be used again, so restore it. */
1146 if (restore_frame_index != ~0)
1147 {
Dave Baracha6269992017-06-07 08:18:49 -04001148 /*
1149 * We musn't restore a frame that is flagged to be freed. This
1150 * shouldn't happen since frames to be freed post dispatch are
1151 * those used when the to-node frame becomes full i.e. they form a
1152 * sort of queue of frames to a single node. If we get here then
1153 * the to-node frame and the pending frame *were* the same, and so
1154 * we removed the to-node frame. Therefore this frame is no
1155 * longer part of the queue for that node and hence it cannot be
1156 * it's overspill.
Neale Ranns88170612016-11-22 08:29:51 +00001157 */
1158 ASSERT (!(f->flags & VLIB_FRAME_FREE_AFTER_DISPATCH));
1159
Dave Baracha6269992017-06-07 08:18:49 -04001160 /*
1161 * NB: dispatching node n can result in the creation and scheduling
1162 * of new frames, and hence in the reallocation of nm->pending_frames.
1163 * Recompute p, or no supper. This was broken for more than 10 years.
1164 */
1165 p = nm->pending_frames + pending_frame_index;
1166
1167 /*
1168 * p->next_frame_index can change during node dispatch if node
1169 * function decides to change graph hook up.
1170 */
Ed Warnickecb9cada2015-12-08 15:45:58 -07001171 nf = vec_elt_at_index (nm->next_frames, p->next_frame_index);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001172 nf->flags |= VLIB_FRAME_IS_ALLOCATED;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001173
Neale Ranns88170612016-11-22 08:29:51 +00001174 if (~0 == nf->frame_index)
1175 {
1176 /* no new frame has been assigned to this node, use the saved one */
1177 nf->frame_index = restore_frame_index;
1178 f->n_vectors = 0;
1179 }
1180 else
1181 {
1182 /* The node has gained a frame, implying packets from the current frame
1183 were re-queued to this same node. we don't need the saved one
1184 anymore */
1185 vlib_frame_free (vm, n, f);
1186 }
1187 }
1188 else
Ed Warnickecb9cada2015-12-08 15:45:58 -07001189 {
Neale Ranns88170612016-11-22 08:29:51 +00001190 if (f->flags & VLIB_FRAME_FREE_AFTER_DISPATCH)
1191 {
1192 ASSERT (!(n->flags & VLIB_NODE_FLAG_FRAME_NO_FREE_AFTER_DISPATCH));
1193 vlib_frame_free (vm, n, f);
1194 }
Ed Warnickecb9cada2015-12-08 15:45:58 -07001195 }
1196
1197 return last_time_stamp;
1198}
1199
1200always_inline uword
1201vlib_process_stack_is_valid (vlib_process_t * p)
Dave Barach9b8ffd92016-07-08 08:13:45 -04001202{
1203 return p->stack[0] == VLIB_PROCESS_STACK_MAGIC;
1204}
Ed Warnickecb9cada2015-12-08 15:45:58 -07001205
Dave Barach9b8ffd92016-07-08 08:13:45 -04001206typedef struct
1207{
1208 vlib_main_t *vm;
1209 vlib_process_t *process;
1210 vlib_frame_t *frame;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001211} vlib_process_bootstrap_args_t;
1212
1213/* Called in process stack. */
Dave Barach9b8ffd92016-07-08 08:13:45 -04001214static uword
1215vlib_process_bootstrap (uword _a)
Ed Warnickecb9cada2015-12-08 15:45:58 -07001216{
Dave Barach9b8ffd92016-07-08 08:13:45 -04001217 vlib_process_bootstrap_args_t *a;
1218 vlib_main_t *vm;
1219 vlib_node_runtime_t *node;
1220 vlib_frame_t *f;
1221 vlib_process_t *p;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001222 uword n;
1223
1224 a = uword_to_pointer (_a, vlib_process_bootstrap_args_t *);
1225
1226 vm = a->vm;
1227 p = a->process;
1228 f = a->frame;
1229 node = &p->node_runtime;
1230
1231 n = node->function (vm, node, f);
1232
1233 ASSERT (vlib_process_stack_is_valid (p));
1234
1235 clib_longjmp (&p->return_longjmp, n);
1236
1237 return n;
1238}
1239
1240/* Called in main stack. */
1241static_always_inline uword
Dave Barach9b8ffd92016-07-08 08:13:45 -04001242vlib_process_startup (vlib_main_t * vm, vlib_process_t * p, vlib_frame_t * f)
Ed Warnickecb9cada2015-12-08 15:45:58 -07001243{
1244 vlib_process_bootstrap_args_t a;
1245 uword r;
1246
1247 a.vm = vm;
1248 a.process = p;
1249 a.frame = f;
1250
1251 r = clib_setjmp (&p->return_longjmp, VLIB_PROCESS_RETURN_LONGJMP_RETURN);
1252 if (r == VLIB_PROCESS_RETURN_LONGJMP_RETURN)
1253 r = clib_calljmp (vlib_process_bootstrap, pointer_to_uword (&a),
1254 (void *) p->stack + (1 << p->log2_n_stack_bytes));
1255
1256 return r;
1257}
1258
1259static_always_inline uword
1260vlib_process_resume (vlib_process_t * p)
1261{
1262 uword r;
1263 p->flags &= ~(VLIB_PROCESS_IS_SUSPENDED_WAITING_FOR_CLOCK
1264 | VLIB_PROCESS_IS_SUSPENDED_WAITING_FOR_EVENT
1265 | VLIB_PROCESS_RESUME_PENDING);
1266 r = clib_setjmp (&p->return_longjmp, VLIB_PROCESS_RETURN_LONGJMP_RETURN);
1267 if (r == VLIB_PROCESS_RETURN_LONGJMP_RETURN)
1268 clib_longjmp (&p->resume_longjmp, VLIB_PROCESS_RESUME_LONGJMP_RESUME);
1269 return r;
1270}
1271
1272static u64
1273dispatch_process (vlib_main_t * vm,
Dave Barach9b8ffd92016-07-08 08:13:45 -04001274 vlib_process_t * p, vlib_frame_t * f, u64 last_time_stamp)
Ed Warnickecb9cada2015-12-08 15:45:58 -07001275{
Dave Barach9b8ffd92016-07-08 08:13:45 -04001276 vlib_node_main_t *nm = &vm->node_main;
1277 vlib_node_runtime_t *node_runtime = &p->node_runtime;
1278 vlib_node_t *node = vlib_get_node (vm, node_runtime->node_index);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001279 u64 t;
1280 uword n_vectors, is_suspend;
1281
1282 if (node->state != VLIB_NODE_STATE_POLLING
1283 || (p->flags & (VLIB_PROCESS_IS_SUSPENDED_WAITING_FOR_CLOCK
1284 | VLIB_PROCESS_IS_SUSPENDED_WAITING_FOR_EVENT)))
1285 return last_time_stamp;
1286
1287 p->flags |= VLIB_PROCESS_IS_RUNNING;
1288
1289 t = last_time_stamp;
1290 vlib_elog_main_loop_event (vm, node_runtime->node_index, t,
1291 f ? f->n_vectors : 0, /* is_after */ 0);
1292
1293 /* Save away current process for suspend. */
1294 nm->current_process_index = node->runtime_index;
1295
1296 n_vectors = vlib_process_startup (vm, p, f);
1297
1298 nm->current_process_index = ~0;
1299
1300 ASSERT (n_vectors != VLIB_PROCESS_RETURN_LONGJMP_RETURN);
1301 is_suspend = n_vectors == VLIB_PROCESS_RETURN_LONGJMP_SUSPEND;
1302 if (is_suspend)
1303 {
Dave Barach9b8ffd92016-07-08 08:13:45 -04001304 vlib_pending_frame_t *pf;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001305
1306 n_vectors = 0;
1307 pool_get (nm->suspended_process_frames, pf);
1308 pf->node_runtime_index = node->runtime_index;
1309 pf->frame_index = f ? vlib_frame_index (vm, f) : ~0;
1310 pf->next_frame_index = ~0;
1311
1312 p->n_suspends += 1;
1313 p->suspended_process_frame_index = pf - nm->suspended_process_frames;
1314
1315 if (p->flags & VLIB_PROCESS_IS_SUSPENDED_WAITING_FOR_CLOCK)
Dave Barach5c20a012017-06-13 08:48:31 -04001316 {
1317 TWT (tw_timer_wheel) * tw =
1318 (TWT (tw_timer_wheel) *) nm->timing_wheel;
1319 p->stop_timer_handle =
1320 TW (tw_timer_start) (tw,
1321 vlib_timing_wheel_data_set_suspended_process
1322 (node->runtime_index) /* [sic] pool idex */ ,
1323 0 /* timer_id */ ,
1324 p->resume_clock_interval);
1325 }
Ed Warnickecb9cada2015-12-08 15:45:58 -07001326 }
1327 else
1328 p->flags &= ~VLIB_PROCESS_IS_RUNNING;
1329
1330 t = clib_cpu_time_now ();
1331
Dave Barach9b8ffd92016-07-08 08:13:45 -04001332 vlib_elog_main_loop_event (vm, node_runtime->node_index, t, is_suspend,
1333 /* is_after */ 1);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001334
1335 vlib_process_update_stats (vm, p,
Dave Barach9b8ffd92016-07-08 08:13:45 -04001336 /* n_calls */ !is_suspend,
Ed Warnickecb9cada2015-12-08 15:45:58 -07001337 /* n_vectors */ n_vectors,
1338 /* n_clocks */ t - last_time_stamp);
1339
1340 return t;
1341}
1342
Dave Barach9b8ffd92016-07-08 08:13:45 -04001343void
1344vlib_start_process (vlib_main_t * vm, uword process_index)
Ed Warnickecb9cada2015-12-08 15:45:58 -07001345{
Dave Barach9b8ffd92016-07-08 08:13:45 -04001346 vlib_node_main_t *nm = &vm->node_main;
1347 vlib_process_t *p = vec_elt (nm->processes, process_index);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001348 dispatch_process (vm, p, /* frame */ 0, /* cpu_time_now */ 0);
1349}
1350
1351static u64
1352dispatch_suspended_process (vlib_main_t * vm,
Dave Barach9b8ffd92016-07-08 08:13:45 -04001353 uword process_index, u64 last_time_stamp)
Ed Warnickecb9cada2015-12-08 15:45:58 -07001354{
Dave Barach9b8ffd92016-07-08 08:13:45 -04001355 vlib_node_main_t *nm = &vm->node_main;
1356 vlib_node_runtime_t *node_runtime;
1357 vlib_node_t *node;
1358 vlib_frame_t *f;
1359 vlib_process_t *p;
1360 vlib_pending_frame_t *pf;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001361 u64 t, n_vectors, is_suspend;
Dave Barach9b8ffd92016-07-08 08:13:45 -04001362
Ed Warnickecb9cada2015-12-08 15:45:58 -07001363 t = last_time_stamp;
1364
1365 p = vec_elt (nm->processes, process_index);
Dave Barach9b8ffd92016-07-08 08:13:45 -04001366 if (PREDICT_FALSE (!(p->flags & VLIB_PROCESS_IS_RUNNING)))
Ed Warnickecb9cada2015-12-08 15:45:58 -07001367 return last_time_stamp;
1368
1369 ASSERT (p->flags & (VLIB_PROCESS_IS_SUSPENDED_WAITING_FOR_CLOCK
1370 | VLIB_PROCESS_IS_SUSPENDED_WAITING_FOR_EVENT));
1371
Dave Barach9b8ffd92016-07-08 08:13:45 -04001372 pf =
1373 pool_elt_at_index (nm->suspended_process_frames,
1374 p->suspended_process_frame_index);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001375
1376 node_runtime = &p->node_runtime;
1377 node = vlib_get_node (vm, node_runtime->node_index);
1378 f = pf->frame_index != ~0 ? vlib_get_frame (vm, pf->frame_index) : 0;
1379
Dave Barach9b8ffd92016-07-08 08:13:45 -04001380 vlib_elog_main_loop_event (vm, node_runtime->node_index, t,
1381 f ? f->n_vectors : 0, /* is_after */ 0);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001382
1383 /* Save away current process for suspend. */
1384 nm->current_process_index = node->runtime_index;
1385
1386 n_vectors = vlib_process_resume (p);
1387 t = clib_cpu_time_now ();
1388
1389 nm->current_process_index = ~0;
1390
1391 is_suspend = n_vectors == VLIB_PROCESS_RETURN_LONGJMP_SUSPEND;
1392 if (is_suspend)
1393 {
1394 /* Suspend it again. */
1395 n_vectors = 0;
1396 p->n_suspends += 1;
1397 if (p->flags & VLIB_PROCESS_IS_SUSPENDED_WAITING_FOR_CLOCK)
Dave Barach5c20a012017-06-13 08:48:31 -04001398 {
1399 p->stop_timer_handle =
1400 TW (tw_timer_start) ((TWT (tw_timer_wheel) *) nm->timing_wheel,
1401 vlib_timing_wheel_data_set_suspended_process
1402 (node->runtime_index) /* [sic] pool idex */ ,
1403 0 /* timer_id */ ,
1404 p->resume_clock_interval);
1405 }
Ed Warnickecb9cada2015-12-08 15:45:58 -07001406 }
1407 else
1408 {
1409 p->flags &= ~VLIB_PROCESS_IS_RUNNING;
1410 p->suspended_process_frame_index = ~0;
1411 pool_put (nm->suspended_process_frames, pf);
1412 }
1413
1414 t = clib_cpu_time_now ();
Dave Barach9b8ffd92016-07-08 08:13:45 -04001415 vlib_elog_main_loop_event (vm, node_runtime->node_index, t, !is_suspend,
1416 /* is_after */ 1);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001417
1418 vlib_process_update_stats (vm, p,
Dave Barach9b8ffd92016-07-08 08:13:45 -04001419 /* n_calls */ !is_suspend,
Ed Warnickecb9cada2015-12-08 15:45:58 -07001420 /* n_vectors */ n_vectors,
1421 /* n_clocks */ t - last_time_stamp);
1422
1423 return t;
1424}
1425
Damjan Marione9d52d52017-03-09 15:42:26 +01001426static_always_inline void
1427vlib_main_or_worker_loop (vlib_main_t * vm, int is_main)
Ed Warnickecb9cada2015-12-08 15:45:58 -07001428{
Dave Barach9b8ffd92016-07-08 08:13:45 -04001429 vlib_node_main_t *nm = &vm->node_main;
Damjan Marione9d52d52017-03-09 15:42:26 +01001430 vlib_thread_main_t *tm = vlib_get_thread_main ();
Ed Warnickecb9cada2015-12-08 15:45:58 -07001431 uword i;
1432 u64 cpu_time_now;
Damjan Marione9d52d52017-03-09 15:42:26 +01001433 vlib_frame_queue_main_t *fqm;
Damjan Marion2c2b6402017-03-28 14:16:15 +02001434 u32 *last_node_runtime_indices = 0;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001435
1436 /* Initialize pending node vector. */
Damjan Marione9d52d52017-03-09 15:42:26 +01001437 if (is_main)
1438 {
1439 vec_resize (nm->pending_frames, 32);
1440 _vec_len (nm->pending_frames) = 0;
1441 }
Ed Warnickecb9cada2015-12-08 15:45:58 -07001442
1443 /* Mark time of main loop start. */
Damjan Marione9d52d52017-03-09 15:42:26 +01001444 if (is_main)
1445 {
1446 cpu_time_now = vm->clib_time.last_cpu_time;
1447 vm->cpu_time_main_loop_start = cpu_time_now;
1448 }
1449 else
1450 cpu_time_now = clib_cpu_time_now ();
Ed Warnickecb9cada2015-12-08 15:45:58 -07001451
Damjan Marion2c2b6402017-03-28 14:16:15 +02001452 /* Pre-allocate interupt runtime indices and lock. */
Ed Warnickecb9cada2015-12-08 15:45:58 -07001453 vec_alloc (nm->pending_interrupt_node_runtime_indices, 32);
Damjan Marion2c2b6402017-03-28 14:16:15 +02001454 vec_alloc (last_node_runtime_indices, 32);
1455 if (!is_main)
1456 clib_spinlock_init (&nm->pending_interrupt_lock);
1457
1458 /* Pre-allocate expired nodes. */
Steven7312cc72017-03-15 21:18:55 -07001459 if (!nm->polling_threshold_vector_length)
1460 nm->polling_threshold_vector_length = 10;
1461 if (!nm->interrupt_threshold_vector_length)
1462 nm->interrupt_threshold_vector_length = 5;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001463
Ed Warnickecb9cada2015-12-08 15:45:58 -07001464 /* Start all processes. */
Damjan Marione9d52d52017-03-09 15:42:26 +01001465 if (is_main)
1466 {
1467 uword i;
Stevenf3b53642017-05-01 14:03:02 -07001468 nm->current_process_index = ~0;
Damjan Marione9d52d52017-03-09 15:42:26 +01001469 for (i = 0; i < vec_len (nm->processes); i++)
1470 cpu_time_now = dispatch_process (vm, nm->processes[i], /* frame */ 0,
1471 cpu_time_now);
1472 }
Ed Warnickecb9cada2015-12-08 15:45:58 -07001473
1474 while (1)
1475 {
Dave Barach9b8ffd92016-07-08 08:13:45 -04001476 vlib_node_runtime_t *n;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001477
Damjan Marione9d52d52017-03-09 15:42:26 +01001478 if (!is_main)
1479 {
1480 vlib_worker_thread_barrier_check ();
1481 vec_foreach (fqm, tm->frame_queue_mains)
1482 vlib_frame_queue_dequeue (vm, fqm);
1483 }
1484
Ed Warnickecb9cada2015-12-08 15:45:58 -07001485 /* Process pre-input nodes. */
Damjan Marion20e272c2017-03-14 11:10:00 +01001486 if (is_main)
1487 vec_foreach (n, nm->nodes_by_type[VLIB_NODE_TYPE_PRE_INPUT])
1488 cpu_time_now = dispatch_node (vm, n,
1489 VLIB_NODE_TYPE_PRE_INPUT,
1490 VLIB_NODE_STATE_POLLING,
1491 /* frame */ 0,
1492 cpu_time_now);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001493
1494 /* Next process input nodes. */
1495 vec_foreach (n, nm->nodes_by_type[VLIB_NODE_TYPE_INPUT])
1496 cpu_time_now = dispatch_node (vm, n,
1497 VLIB_NODE_TYPE_INPUT,
1498 VLIB_NODE_STATE_POLLING,
1499 /* frame */ 0,
1500 cpu_time_now);
1501
Damjan Marione9d52d52017-03-09 15:42:26 +01001502 if (PREDICT_TRUE (is_main && vm->queue_signal_pending == 0))
Dave Barach9b8ffd92016-07-08 08:13:45 -04001503 vm->queue_signal_callback (vm);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001504
1505 /* Next handle interrupts. */
1506 {
1507 uword l = _vec_len (nm->pending_interrupt_node_runtime_indices);
1508 uword i;
1509 if (l > 0)
1510 {
Damjan Marion2c2b6402017-03-28 14:16:15 +02001511 u32 *tmp;
1512 if (!is_main)
1513 clib_spinlock_lock (&nm->pending_interrupt_lock);
1514 tmp = nm->pending_interrupt_node_runtime_indices;
1515 nm->pending_interrupt_node_runtime_indices =
1516 last_node_runtime_indices;
1517 last_node_runtime_indices = tmp;
1518 _vec_len (last_node_runtime_indices) = 0;
1519 if (!is_main)
1520 clib_spinlock_unlock (&nm->pending_interrupt_lock);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001521 for (i = 0; i < l; i++)
1522 {
1523 n = vec_elt_at_index (nm->nodes_by_type[VLIB_NODE_TYPE_INPUT],
Damjan Marion2c2b6402017-03-28 14:16:15 +02001524 last_node_runtime_indices[i]);
Dave Barach9b8ffd92016-07-08 08:13:45 -04001525 cpu_time_now =
1526 dispatch_node (vm, n, VLIB_NODE_TYPE_INPUT,
1527 VLIB_NODE_STATE_INTERRUPT,
1528 /* frame */ 0,
1529 cpu_time_now);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001530 }
1531 }
1532 }
1533
Damjan Marione9d52d52017-03-09 15:42:26 +01001534 if (is_main)
Ed Warnickecb9cada2015-12-08 15:45:58 -07001535 {
Damjan Marione9d52d52017-03-09 15:42:26 +01001536 /* Check if process nodes have expired from timing wheel. */
Dave Barach5c20a012017-06-13 08:48:31 -04001537 ASSERT (nm->data_from_advancing_timing_wheel != 0);
1538
1539 nm->data_from_advancing_timing_wheel =
1540 TW (tw_timer_expire_timers_vec)
1541 ((TWT (tw_timer_wheel) *) nm->timing_wheel, vlib_time_now (vm),
1542 nm->data_from_advancing_timing_wheel);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001543
Damjan Marione9d52d52017-03-09 15:42:26 +01001544 ASSERT (nm->data_from_advancing_timing_wheel != 0);
Dave Barach5c20a012017-06-13 08:48:31 -04001545
Damjan Marione9d52d52017-03-09 15:42:26 +01001546 if (PREDICT_FALSE
1547 (_vec_len (nm->data_from_advancing_timing_wheel) > 0))
Ed Warnickecb9cada2015-12-08 15:45:58 -07001548 {
Damjan Marione9d52d52017-03-09 15:42:26 +01001549 uword i;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001550
Damjan Marione9d52d52017-03-09 15:42:26 +01001551 processes_timing_wheel_data:
1552 for (i = 0; i < _vec_len (nm->data_from_advancing_timing_wheel);
1553 i++)
Ed Warnickecb9cada2015-12-08 15:45:58 -07001554 {
Damjan Marione9d52d52017-03-09 15:42:26 +01001555 u32 d = nm->data_from_advancing_timing_wheel[i];
1556 u32 di = vlib_timing_wheel_data_get_index (d);
1557
1558 if (vlib_timing_wheel_data_is_timed_event (d))
1559 {
1560 vlib_signal_timed_event_data_t *te =
1561 pool_elt_at_index (nm->signal_timed_event_data_pool,
1562 di);
1563 vlib_node_t *n =
1564 vlib_get_node (vm, te->process_node_index);
1565 vlib_process_t *p =
1566 vec_elt (nm->processes, n->runtime_index);
1567 void *data;
1568 data =
1569 vlib_process_signal_event_helper (nm, n, p,
1570 te->event_type_index,
1571 te->n_data_elts,
1572 te->n_data_elt_bytes);
1573 if (te->n_data_bytes < sizeof (te->inline_event_data))
1574 clib_memcpy (data, te->inline_event_data,
1575 te->n_data_bytes);
1576 else
1577 {
1578 clib_memcpy (data, te->event_data_as_vector,
1579 te->n_data_bytes);
1580 vec_free (te->event_data_as_vector);
1581 }
1582 pool_put (nm->signal_timed_event_data_pool, te);
1583 }
Ed Warnickecb9cada2015-12-08 15:45:58 -07001584 else
1585 {
Damjan Marione9d52d52017-03-09 15:42:26 +01001586 cpu_time_now = clib_cpu_time_now ();
1587 cpu_time_now =
1588 dispatch_suspended_process (vm, di, cpu_time_now);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001589 }
Ed Warnickecb9cada2015-12-08 15:45:58 -07001590 }
Damjan Marione9d52d52017-03-09 15:42:26 +01001591 _vec_len (nm->data_from_advancing_timing_wheel) = 0;
1592 }
Ed Warnickecb9cada2015-12-08 15:45:58 -07001593 }
1594
1595 /* Input nodes may have added work to the pending vector.
1596 Process pending vector until there is nothing left.
1597 All pending vectors will be processed from input -> output. */
1598 for (i = 0; i < _vec_len (nm->pending_frames); i++)
Dave Baracha6269992017-06-07 08:18:49 -04001599 cpu_time_now = dispatch_pending_node (vm, i, cpu_time_now);
Ed Warnickecb9cada2015-12-08 15:45:58 -07001600 /* Reset pending vector for next iteration. */
1601 _vec_len (nm->pending_frames) = 0;
Dave Barach9b8ffd92016-07-08 08:13:45 -04001602
Ed Warnickecb9cada2015-12-08 15:45:58 -07001603 /* Pending internal nodes may resume processes. */
Damjan Marione9d52d52017-03-09 15:42:26 +01001604 if (is_main && _vec_len (nm->data_from_advancing_timing_wheel) > 0)
Ed Warnickecb9cada2015-12-08 15:45:58 -07001605 goto processes_timing_wheel_data;
1606
1607 vlib_increment_main_loop_counter (vm);
1608
1609 /* Record time stamp in case there are no enabled nodes and above
Dave Barach9b8ffd92016-07-08 08:13:45 -04001610 calls do not update time stamp. */
Ed Warnickecb9cada2015-12-08 15:45:58 -07001611 cpu_time_now = clib_cpu_time_now ();
1612 }
1613}
Dave Barach9b8ffd92016-07-08 08:13:45 -04001614
Damjan Marione9d52d52017-03-09 15:42:26 +01001615static void
1616vlib_main_loop (vlib_main_t * vm)
1617{
1618 vlib_main_or_worker_loop (vm, /* is_main */ 1);
1619}
1620
1621void
1622vlib_worker_loop (vlib_main_t * vm)
1623{
1624 vlib_main_or_worker_loop (vm, /* is_main */ 0);
1625}
1626
/* File-scope vlib_main_t instance; defined without `static', so it has
   external linkage and is visible to other translation units. */
Ed Warnickecb9cada2015-12-08 15:45:58 -07001627vlib_main_t vlib_global_main;
1628
1629static clib_error_t *
1630vlib_main_configure (vlib_main_t * vm, unformat_input_t * input)
1631{
1632 int turn_on_mem_trace = 0;
1633
1634 while (unformat_check_input (input) != UNFORMAT_END_OF_INPUT)
1635 {
1636 if (unformat (input, "memory-trace"))
1637 turn_on_mem_trace = 1;
1638
1639 else if (unformat (input, "elog-events %d",
1640 &vm->elog_main.event_ring_size))
1641 ;
Dave Barach81481312017-05-16 09:08:14 -04001642 else if (unformat (input, "elog-post-mortem-dump"))
1643 vm->elog_post_mortem_dump = 1;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001644 else
1645 return unformat_parse_error (input);
1646 }
1647
1648 unformat_free (input);
1649
1650 /* Enable memory trace as early as possible. */
1651 if (turn_on_mem_trace)
1652 clib_mem_trace (1);
1653
1654 return 0;
1655}
1656
1657VLIB_EARLY_CONFIG_FUNCTION (vlib_main_configure, "vlib");
1658
Dave Barach9b8ffd92016-07-08 08:13:45 -04001659static void
1660dummy_queue_signal_callback (vlib_main_t * vm)
1661{
1662}
Dave Barach16c75df2016-05-31 14:05:46 -04001663
Ed Warnickecb9cada2015-12-08 15:45:58 -07001664/* Main function. */
Dave Barach9b8ffd92016-07-08 08:13:45 -04001665int
Eyal Barid334a6b2016-09-19 10:23:39 +03001666vlib_main (vlib_main_t * volatile vm, unformat_input_t * input)
Ed Warnickecb9cada2015-12-08 15:45:58 -07001667{
Eyal Barid334a6b2016-09-19 10:23:39 +03001668 clib_error_t *volatile error;
Dave Barach5c20a012017-06-13 08:48:31 -04001669 vlib_node_main_t *nm = &vm->node_main;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001670
Dave Barach16c75df2016-05-31 14:05:46 -04001671 vm->queue_signal_callback = dummy_queue_signal_callback;
1672
Ed Warnickecb9cada2015-12-08 15:45:58 -07001673 clib_time_init (&vm->clib_time);
1674
1675 /* Turn on event log. */
Dave Barach9b8ffd92016-07-08 08:13:45 -04001676 if (!vm->elog_main.event_ring_size)
Ed Warnickecb9cada2015-12-08 15:45:58 -07001677 vm->elog_main.event_ring_size = 128 << 10;
1678 elog_init (&vm->elog_main, vm->elog_main.event_ring_size);
1679 elog_enable_disable (&vm->elog_main, 1);
1680
1681 /* Default name. */
Dave Barach9b8ffd92016-07-08 08:13:45 -04001682 if (!vm->name)
Ed Warnickecb9cada2015-12-08 15:45:58 -07001683 vm->name = "VLIB";
1684
Damjan Marion49d66f12017-07-20 18:10:35 +02001685 if ((error = unix_physmem_init (vm)))
Damjan Marion04a7f052017-07-10 15:06:17 +02001686 {
Damjan Marion49d66f12017-07-20 18:10:35 +02001687 clib_error_report (error);
1688 goto done;
Damjan Marion04a7f052017-07-10 15:06:17 +02001689 }
Damjan Marion49d66f12017-07-20 18:10:35 +02001690
1691 if ((error = vlib_buffer_main_init (vm)))
Damjan Marion04a7f052017-07-10 15:06:17 +02001692 {
Damjan Marion49d66f12017-07-20 18:10:35 +02001693 clib_error_report (error);
1694 goto done;
Damjan Marion04a7f052017-07-10 15:06:17 +02001695 }
Ed Warnickecb9cada2015-12-08 15:45:58 -07001696
1697 if ((error = vlib_thread_init (vm)))
1698 {
1699 clib_error_report (error);
1700 goto done;
1701 }
1702
1703 /* Register static nodes so that init functions may use them. */
1704 vlib_register_all_static_nodes (vm);
1705
1706 /* Set seed for random number generator.
1707 Allow user to specify seed to make random sequence deterministic. */
Dave Barach9b8ffd92016-07-08 08:13:45 -04001708 if (!unformat (input, "seed %wd", &vm->random_seed))
Ed Warnickecb9cada2015-12-08 15:45:58 -07001709 vm->random_seed = clib_cpu_time_now ();
1710 clib_random_buffer_init (&vm->random_buffer, vm->random_seed);
1711
Ed Warnickecb9cada2015-12-08 15:45:58 -07001712 /* Initialize node graph. */
1713 if ((error = vlib_node_main_init (vm)))
1714 {
1715 /* Arrange for graph hook up error to not be fatal when debugging. */
1716 if (CLIB_DEBUG > 0)
1717 clib_error_report (error);
1718 else
1719 goto done;
1720 }
1721
Ole Troan964f93e2016-06-10 13:22:36 +02001722 /* See unix/main.c; most likely already set up */
1723 if (vm->init_functions_called == 0)
Dave Barach9b8ffd92016-07-08 08:13:45 -04001724 vm->init_functions_called = hash_create (0, /* value bytes */ 0);
Ole Troan964f93e2016-06-10 13:22:36 +02001725 if ((error = vlib_call_all_init_functions (vm)))
1726 goto done;
1727
Ed Warnickecb9cada2015-12-08 15:45:58 -07001728 /* Create default buffer free list. */
Dave Barach9b8ffd92016-07-08 08:13:45 -04001729 vlib_buffer_get_or_create_free_list (vm,
1730 VLIB_BUFFER_DEFAULT_FREE_LIST_BYTES,
Ed Warnickecb9cada2015-12-08 15:45:58 -07001731 "default");
1732
Dave Barach5c20a012017-06-13 08:48:31 -04001733 nm->timing_wheel = clib_mem_alloc_aligned (sizeof (TWT (tw_timer_wheel)),
1734 CLIB_CACHE_LINE_BYTES);
1735
1736 vec_validate (nm->data_from_advancing_timing_wheel, 10);
1737 _vec_len (nm->data_from_advancing_timing_wheel) = 0;
1738
1739 /* Create the process timing wheel */
1740 TW (tw_timer_wheel_init) ((TWT (tw_timer_wheel) *) nm->timing_wheel,
1741 0 /* no callback */ ,
1742 10e-6 /* timer period 10us */ ,
1743 ~0 /* max expirations per call */ );
1744
Ed Warnickecb9cada2015-12-08 15:45:58 -07001745 switch (clib_setjmp (&vm->main_loop_exit, VLIB_MAIN_LOOP_EXIT_NONE))
1746 {
1747 case VLIB_MAIN_LOOP_EXIT_NONE:
1748 vm->main_loop_exit_set = 1;
1749 break;
1750
1751 case VLIB_MAIN_LOOP_EXIT_CLI:
1752 goto done;
1753
1754 default:
1755 error = vm->main_loop_error;
1756 goto done;
1757 }
1758
Dave Barach9b8ffd92016-07-08 08:13:45 -04001759 if ((error = vlib_call_all_config_functions (vm, input, 0 /* is_early */ )))
Ed Warnickecb9cada2015-12-08 15:45:58 -07001760 goto done;
1761
1762 /* Call all main loop enter functions. */
1763 {
Dave Barach9b8ffd92016-07-08 08:13:45 -04001764 clib_error_t *sub_error;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001765 sub_error = vlib_call_all_main_loop_enter_functions (vm);
1766 if (sub_error)
1767 clib_error_report (sub_error);
1768 }
1769
1770 vlib_main_loop (vm);
1771
Dave Barach9b8ffd92016-07-08 08:13:45 -04001772done:
Ed Warnickecb9cada2015-12-08 15:45:58 -07001773 /* Call all exit functions. */
1774 {
Dave Barach9b8ffd92016-07-08 08:13:45 -04001775 clib_error_t *sub_error;
Ed Warnickecb9cada2015-12-08 15:45:58 -07001776 sub_error = vlib_call_all_main_loop_exit_functions (vm);
1777 if (sub_error)
1778 clib_error_report (sub_error);
1779 }
1780
1781 if (error)
1782 clib_error_report (error);
1783
1784 return 0;
1785}
Dave Barach9b8ffd92016-07-08 08:13:45 -04001786
1787/*
1788 * fd.io coding-style-patch-verification: ON
1789 *
1790 * Local Variables:
1791 * eval: (c-set-style "gnu")
1792 * End:
1793 */