blob: 0fdca0bf13c25091eededf3922e3dac21fdd962c [file] [log] [blame]
/*
 * replication.c : packet replication
 *
 * Copyright (c) 2013 Cisco and/or its affiliates.
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at:
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
17
18#include <vlib/vlib.h>
19#include <vnet/vnet.h>
20#include <vppinfra/error.h>
21#include <vnet/ip/ip4_packet.h>
22#include <vnet/replication.h>
23
24
/*
 * Global replication state. Every function in this file reaches it through
 * &replication_main; the context pools it holds are indexed by thread_index.
 */
replication_main_t replication_main;
26
27
28replication_context_t *
29replication_prep (vlib_main_t * vm,
Dave Barachba868bb2016-08-08 09:51:21 -040030 vlib_buffer_t * b0, u32 recycle_node_index, u32 l2_packet)
Ed Warnickecb9cada2015-12-08 15:45:58 -070031{
Dave Barachba868bb2016-08-08 09:51:21 -040032 replication_main_t *rm = &replication_main;
33 replication_context_t *ctx;
Damjan Marion586afd72017-04-05 19:18:20 +020034 uword thread_index = vm->thread_index;
Dave Barachba868bb2016-08-08 09:51:21 -040035 ip4_header_t *ip;
Ed Warnickecb9cada2015-12-08 15:45:58 -070036 u32 ctx_id;
37
Dave Barachba868bb2016-08-08 09:51:21 -040038 /* Allocate a context, reserve context 0 */
Damjan Marion586afd72017-04-05 19:18:20 +020039 if (PREDICT_FALSE (rm->contexts[thread_index] == 0))
40 pool_get_aligned (rm->contexts[thread_index], ctx, CLIB_CACHE_LINE_BYTES);
Dave Barachba868bb2016-08-08 09:51:21 -040041
Damjan Marion586afd72017-04-05 19:18:20 +020042 pool_get_aligned (rm->contexts[thread_index], ctx, CLIB_CACHE_LINE_BYTES);
43 ctx_id = ctx - rm->contexts[thread_index];
Ed Warnickecb9cada2015-12-08 15:45:58 -070044
Dave Barachba868bb2016-08-08 09:51:21 -040045 /* Save state from vlib buffer */
Damjan Marion072401e2017-07-13 18:53:27 +020046 ctx->saved_free_list_index = vlib_buffer_get_free_list_index (b0);
Ed Warnickecb9cada2015-12-08 15:45:58 -070047 ctx->current_data = b0->current_data;
48
Dave Barachba868bb2016-08-08 09:51:21 -040049 /* Set up vlib buffer hooks */
Dave Barachb5adaea2016-06-17 14:09:56 -040050 b0->recycle_count = ctx_id;
Damjan Marion072401e2017-07-13 18:53:27 +020051 vlib_buffer_set_free_list_index (b0, rm->recycle_list_index);
Dave Barachb5adaea2016-06-17 14:09:56 -040052 b0->flags |= VLIB_BUFFER_RECYCLE;
Ed Warnickecb9cada2015-12-08 15:45:58 -070053
Dave Barachba868bb2016-08-08 09:51:21 -040054 /* Save feature state */
Ed Warnickecb9cada2015-12-08 15:45:58 -070055 ctx->recycle_node_index = recycle_node_index;
56
Dave Barachba868bb2016-08-08 09:51:21 -040057 /* Save vnet state */
58 clib_memcpy (ctx->vnet_buffer, vnet_buffer (b0),
59 sizeof (vnet_buffer_opaque_t));
Ed Warnickecb9cada2015-12-08 15:45:58 -070060
Dave Barachba868bb2016-08-08 09:51:21 -040061 /* Save packet contents */
Ed Warnickecb9cada2015-12-08 15:45:58 -070062 ctx->l2_packet = l2_packet;
Dave Barachba868bb2016-08-08 09:51:21 -040063 ip = (ip4_header_t *) vlib_buffer_get_current (b0);
64 if (l2_packet)
65 {
66 /* Save ethernet header */
67 ctx->l2_header[0] = ((u64 *) ip)[0];
68 ctx->l2_header[1] = ((u64 *) ip)[1];
69 ctx->l2_header[2] = ((u64 *) ip)[2];
70 /* set ip to the true ip header */
71 ip = (ip4_header_t *) (((u8 *) ip) + vnet_buffer (b0)->l2.l2_len);
72 }
Ed Warnickecb9cada2015-12-08 15:45:58 -070073
Dave Barachba868bb2016-08-08 09:51:21 -040074 /*
75 * Copy L3 fields.
76 * We need to save TOS for ip4 and ip6 packets.
77 * Fortunately the TOS field is
78 * in the first two bytes of both the ip4 and ip6 headers.
79 */
80 ctx->ip_tos = *((u16 *) (ip));
Ed Warnickecb9cada2015-12-08 15:45:58 -070081
Dave Barachba868bb2016-08-08 09:51:21 -040082 /*
83 * Save the ip4 checksum as well. We just blindly save the corresponding two
84 * bytes even for ip6 packets.
85 */
Ed Warnickecb9cada2015-12-08 15:45:58 -070086 ctx->ip4_checksum = ip->checksum;
87
88 return ctx;
89}
90
91
92replication_context_t *
Dave Barachba868bb2016-08-08 09:51:21 -040093replication_recycle (vlib_main_t * vm, vlib_buffer_t * b0, u32 is_last)
Ed Warnickecb9cada2015-12-08 15:45:58 -070094{
Dave Barachba868bb2016-08-08 09:51:21 -040095 replication_main_t *rm = &replication_main;
96 replication_context_t *ctx;
Damjan Marion586afd72017-04-05 19:18:20 +020097 uword thread_index = vm->thread_index;
Dave Barachba868bb2016-08-08 09:51:21 -040098 ip4_header_t *ip;
Ed Warnickecb9cada2015-12-08 15:45:58 -070099
Dave Barachba868bb2016-08-08 09:51:21 -0400100 /* Get access to the replication context */
Damjan Marion586afd72017-04-05 19:18:20 +0200101 ctx = pool_elt_at_index (rm->contexts[thread_index], b0->recycle_count);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700102
Dave Barachba868bb2016-08-08 09:51:21 -0400103 /* Restore vnet buffer state */
104 clib_memcpy (vnet_buffer (b0), ctx->vnet_buffer,
105 sizeof (vnet_buffer_opaque_t));
Ed Warnickecb9cada2015-12-08 15:45:58 -0700106
Dave Barachba868bb2016-08-08 09:51:21 -0400107 /* Restore the packet start (current_data) and length */
108 vlib_buffer_advance (b0, ctx->current_data - b0->current_data);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700109
Dave Barachba868bb2016-08-08 09:51:21 -0400110 /* Restore packet contents */
111 ip = (ip4_header_t *) vlib_buffer_get_current (b0);
112 if (ctx->l2_packet)
113 {
114 /* Restore ethernet header */
115 ((u64 *) ip)[0] = ctx->l2_header[0];
116 ((u64 *) ip)[1] = ctx->l2_header[1];
117 ((u64 *) ip)[2] = ctx->l2_header[2];
118 /* set ip to the true ip header */
119 ip = (ip4_header_t *) (((u8 *) ip) + vnet_buffer (b0)->l2.l2_len);
120 }
Ed Warnickecb9cada2015-12-08 15:45:58 -0700121
122 // Restore L3 fields
Dave Barachba868bb2016-08-08 09:51:21 -0400123 *((u16 *) (ip)) = ctx->ip_tos;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700124 ip->checksum = ctx->ip4_checksum;
125
Dave Barachba868bb2016-08-08 09:51:21 -0400126 if (is_last)
127 {
128 /*
129 * This is the last replication in the list.
130 * Restore original buffer free functionality.
131 */
Damjan Marion072401e2017-07-13 18:53:27 +0200132 vlib_buffer_set_free_list_index (b0, ctx->saved_free_list_index);
Dave Barachba868bb2016-08-08 09:51:21 -0400133 b0->flags &= ~VLIB_BUFFER_RECYCLE;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700134
Dave Barachba868bb2016-08-08 09:51:21 -0400135 /* Free context back to its pool */
Damjan Marion586afd72017-04-05 19:18:20 +0200136 pool_put (rm->contexts[thread_index], ctx);
Dave Barachba868bb2016-08-08 09:51:21 -0400137 }
Ed Warnickecb9cada2015-12-08 15:45:58 -0700138
139 return ctx;
140}
141
142
143
144/*
145 * fish pkts back from the recycle queue/freelist
146 * un-flatten the context chains
147 */
Dave Barachba868bb2016-08-08 09:51:21 -0400148static void
149replication_recycle_callback (vlib_main_t * vm, vlib_buffer_free_list_t * fl)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700150{
Dave Barachba868bb2016-08-08 09:51:21 -0400151 vlib_frame_t *f = 0;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700152 u32 n_left_from;
153 u32 n_left_to_next = 0;
154 u32 n_this_frame = 0;
Dave Barachba868bb2016-08-08 09:51:21 -0400155 u32 *from;
156 u32 *to_next = 0;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700157 u32 bi0, pi0;
158 vlib_buffer_t *b0;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700159 int i;
Dave Barachba868bb2016-08-08 09:51:21 -0400160 replication_main_t *rm = &replication_main;
161 replication_context_t *ctx;
162 u32 feature_node_index = 0;
Damjan Marion586afd72017-04-05 19:18:20 +0200163 uword thread_index = vm->thread_index;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700164
Dave Barachba868bb2016-08-08 09:51:21 -0400165 /*
166 * All buffers in the list are destined to the same recycle node.
167 * Pull the recycle node index from the first buffer.
168 * Note: this could be sped up if the node index were stuffed into
169 * the freelist itself.
170 */
Damjan Marionbd69a5f2017-02-05 23:44:42 +0100171 if (vec_len (fl->buffers) > 0)
Dave Barachba868bb2016-08-08 09:51:21 -0400172 {
Damjan Marionbd69a5f2017-02-05 23:44:42 +0100173 bi0 = fl->buffers[0];
Dave Barachba868bb2016-08-08 09:51:21 -0400174 b0 = vlib_get_buffer (vm, bi0);
Damjan Marion586afd72017-04-05 19:18:20 +0200175 ctx = pool_elt_at_index (rm->contexts[thread_index], b0->recycle_count);
Dave Barachba868bb2016-08-08 09:51:21 -0400176 feature_node_index = ctx->recycle_node_index;
177 }
Ed Warnickecb9cada2015-12-08 15:45:58 -0700178
Damjan Marionbd69a5f2017-02-05 23:44:42 +0100179 /* buffers */
Dave Barachba868bb2016-08-08 09:51:21 -0400180 for (i = 0; i < 2; i++)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700181 {
182 if (i == 0)
Dave Barachba868bb2016-08-08 09:51:21 -0400183 {
Damjan Marionbd69a5f2017-02-05 23:44:42 +0100184 from = fl->buffers;
Dave Barachba868bb2016-08-08 09:51:21 -0400185 n_left_from = vec_len (from);
186 }
187
Ed Warnickecb9cada2015-12-08 15:45:58 -0700188 while (n_left_from > 0)
Dave Barachba868bb2016-08-08 09:51:21 -0400189 {
190 if (PREDICT_FALSE (n_left_to_next == 0))
191 {
192 if (f)
193 {
194 f->n_vectors = n_this_frame;
195 vlib_put_frame_to_node (vm, feature_node_index, f);
196 }
197
198 f = vlib_get_frame_to_node (vm, feature_node_index);
199 to_next = vlib_frame_vector_args (f);
200 n_left_to_next = VLIB_FRAME_SIZE;
201 n_this_frame = 0;
202 }
203
204 bi0 = from[0];
205 if (PREDICT_TRUE (n_left_from > 1))
206 {
207 pi0 = from[1];
208 vlib_prefetch_buffer_with_index (vm, pi0, LOAD);
209 }
John Lo17f17cb2016-05-31 16:25:13 -0400210
211 b0 = vlib_get_buffer (vm, bi0);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700212
Dave Barachba868bb2016-08-08 09:51:21 -0400213 /* Mark that this buffer was just recycled */
214 b0->flags |= VLIB_BUFFER_IS_RECYCLED;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700215
Neale Rannsb80c5362016-10-08 13:03:40 +0100216#if (CLIB_DEBUG > 0)
Damjan Marion04a7f052017-07-10 15:06:17 +0200217 if (vm->buffer_main->callbacks_registered == 0)
Damjan Marionc3a814b2017-02-28 19:22:22 +0100218 vlib_buffer_set_known_state (vm, bi0,
219 VLIB_BUFFER_KNOWN_ALLOCATED);
Neale Rannsb80c5362016-10-08 13:03:40 +0100220#endif
221
Dave Barachba868bb2016-08-08 09:51:21 -0400222 /* If buffer is traced, mark frame as traced */
223 if (PREDICT_FALSE (b0->flags & VLIB_BUFFER_IS_TRACED))
224 f->flags |= VLIB_FRAME_TRACE;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700225
Dave Barachba868bb2016-08-08 09:51:21 -0400226 to_next[0] = bi0;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700227
Dave Barachba868bb2016-08-08 09:51:21 -0400228 from++;
229 to_next++;
230 n_this_frame++;
231 n_left_to_next--;
232 n_left_from--;
233 }
Ed Warnickecb9cada2015-12-08 15:45:58 -0700234 }
Dave Barachba868bb2016-08-08 09:51:21 -0400235
Damjan Marionbd69a5f2017-02-05 23:44:42 +0100236 vec_reset_length (fl->buffers);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700237
238 if (f)
239 {
Dave Barachba868bb2016-08-08 09:51:21 -0400240 ASSERT (n_this_frame);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700241 f->n_vectors = n_this_frame;
242 vlib_put_frame_to_node (vm, feature_node_index, f);
243 }
244}
245
Dave Barachba868bb2016-08-08 09:51:21 -0400246clib_error_t *
247replication_init (vlib_main_t * vm)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700248{
Dave Barachba868bb2016-08-08 09:51:21 -0400249 replication_main_t *rm = &replication_main;
250 vlib_buffer_main_t *bm = vm->buffer_main;
251 vlib_buffer_free_list_t *fl;
252 __attribute__ ((unused)) replication_context_t *ctx;
253 vlib_thread_main_t *tm = vlib_get_thread_main ();
Ed Warnickecb9cada2015-12-08 15:45:58 -0700254
Dave Barachba868bb2016-08-08 09:51:21 -0400255 rm->vlib_main = vm;
256 rm->vnet_main = vnet_get_main ();
257 rm->recycle_list_index =
258 vlib_buffer_create_free_list (vm, 1024 /* fictional */ ,
259 "replication-recycle");
260
261 fl = pool_elt_at_index (bm->buffer_free_list_pool, rm->recycle_list_index);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700262
263 fl->buffers_added_to_freelist_function = replication_recycle_callback;
264
Dave Barachba868bb2016-08-08 09:51:21 -0400265 /* Verify the replication context is the expected size */
266 ASSERT (sizeof (replication_context_t) == 128); /* 2 cache lines */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700267
268 vec_validate (rm->contexts, tm->n_vlib_mains - 1);
269 return 0;
270}
271
272VLIB_INIT_FUNCTION (replication_init);
/*
 * fd.io coding-style-patch-verification: ON
 *
 * Local Variables:
 * eval: (c-set-style "gnu")
 * End:
 */