blob: d94ddf8950570875b881175f6b3a7f5b5c8281c2 [file] [log] [blame]
/*
* Copyright (c) 2015 Cisco and/or its affiliates.
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at:
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#include <stdio.h>
#include <time.h>
#include <sys/types.h>
#include <signal.h>
#include <sys/stat.h>
#include <unistd.h>
#include <vppinfra/clib.h>
#include <vppinfra/vec.h>
#include <vppinfra/hash.h>
#include <svmdb.h>
#include <vppinfra/format.h>
#include <vppinfra/error.h>
#include <vppinfra/time.h>
#include <vppinfra/macros.h>
/* Polling budgets used while waiting on vpp. */
enum
{
  VPP_STARTUP_POLL_MS = 10,	/* step 1: poll interval */
  VPP_STARTUP_POLLS = 1000,	/* step 1: 1000 * 10 ms = 10 seconds */
  VPP_RESTART_POLL_MS = 100,	/* steps 5 and 7: poll interval */
  VPP_RESTART_POLLS = 150,	/* steps 5 and 7: 150 * 100 ms = 15 seconds */
};

/*
 * Sleep for the given number of milliseconds.
 * When nanosleep() reports failure, the sleep is resumed with the remaining
 * time it handed back (the failure is assumed to be a signal interruption,
 * which is the only case in which the remainder is filled in).
 */
static void
restart_sleep_ms (long ms)
{
  struct timespec req, rem;

  req.tv_sec = ms / 1000;
  req.tv_nsec = (ms % 1000) * 1000000L;
  while (nanosleep (&req, &rem) < 0)
    req = rem;
}

/*
 * Restart vpp by sending it SIGTERM and waiting for a new incarnation.
 *
 * Recognized input: "verbose" | "v" (progress messages on stdout) and
 * "chroot <path>" (handed to svmdb_map_chroot).
 *
 * The sequence is: read the current pid from the "vpp_pid" svm variable,
 * check that the process exists, remember the inode of /dev/shm/vpe-api,
 * send SIGTERM, wait for a different inode to appear, remap the svm
 * database and wait for a different pid to be published there.
 *
 * Returns 0 on success; otherwise:
 *   1  unknown input
 *   2  "vpp_pid" variable missing, or the recorded pid is not running
 *   3  no pid published within 10 seconds, or SIGTERM could not be sent
 *   4  stat() of the API segment failed, or no new pid within 15 seconds
 *   5  no new API segment inode within 15 seconds
 *
 * NOTE(review): clib_error / clib_unix_error may not return at all, in
 * which case the return statements following them are never reached.
 */
int restart_main_fn (unformat_input_t * i)
{
  const char *api_segment_path = "/dev/shm/vpe-api";
  int verbose = 0;
  int old_pid;
  pid_t new_pid;
  int wait;
  u8 *chroot_path = 0;
  svmdb_client_t *svmdb_client;
  volatile pid_t *pidp;
  struct stat statb;
  ino_t old_inode;
  int sleeps;

  if (geteuid ())
    clib_error ("vpp_restart: must be root...");

  while (unformat_check_input (i) != UNFORMAT_END_OF_INPUT)
    {
      if (unformat (i, "verbose") || unformat (i, "v"))
	verbose = 1;
      else if (unformat (i, "chroot %s", &chroot_path))
	;
      else
	{
	  clib_error ("unknown input `%U'", format_unformat_error, i);
	  return 1;
	}
    }

  /*
   * Step 1: look up the current VPP pid in the shared-memory database
   */
  svmdb_client = svmdb_map_chroot ((char *) chroot_path);

  pidp = svmdb_local_get_variable_reference (svmdb_client,
					     SVMDB_NAMESPACE_VEC,
					     "vpp_pid");
  if (pidp == 0)
    {
      svmdb_unmap (svmdb_client);
      clib_error ("'vpp_pid' svm variable not found, vpp has never run?");
      return 2;
    }

  /* Poll for up to 10 seconds for vpp to publish a pid */
  for (wait = 0; wait < VPP_STARTUP_POLLS; wait++)
    {
      if (*pidp)
	break;
      restart_sleep_ms (VPP_STARTUP_POLL_MS);
    }

  /* Read the shared variable once, so the value tested is the value used */
  old_pid = *pidp;
  if (old_pid == 0)
    {
      svmdb_unmap (svmdb_client);
      clib_error ("VPP not running...");
      return 3;
    }

  /*
   * Step 2: sanity check the pid we discovered
   */
  if (verbose)
    fformat (stdout, "Sanity check current vpp pid %d\n", old_pid);

  /* Signal 0 delivers nothing; it only checks that the pid can be signalled */
  if (kill (old_pid, 0) < 0)
    {
      svmdb_unmap (svmdb_client);
      clib_error ("vpp current pid %d not running...", old_pid);
      return 2;
    }

  if (verbose)
    fformat (stdout, "Sanity check vpp pid %d OK\n", old_pid);

  /*
   * Step 3: figure out the current vpp <--> client shared-VM file
   * inode number
   */
  if (stat (api_segment_path, &statb) < 0)
    {
      /* Report first, so that errno still belongs to the failed stat() */
      clib_unix_error ("stat fail");
      svmdb_unmap (svmdb_client);
      return 4;
    }

  old_inode = statb.st_ino;

  /* ino_t may be wider than unsigned int: print it as unsigned long long */
  if (verbose)
    fformat (stdout, "Old inode %llu\n", (unsigned long long) old_inode);

  /* Note: restart wipes out the shared VM database */
  svmdb_unmap (svmdb_client);

  /*
   * Step 4: send SIGTERM to vpp.
   * systemd et al. will restart vpp after wiping out the shared-VM
   * database and (crucially) the shared API messaging segment
   */
  if (kill (old_pid, SIGTERM) < 0)
    {
      clib_unix_error ("SIGTERM fail");
      return 3;
    }

  /*
   * Step 5: wait up to 15 seconds for a new incarnation of
   * the shared-VM API segment to appear.
   */
  sleeps = 0;
  for (wait = 0; wait < VPP_RESTART_POLLS; wait++)
    {
      /* A missing file and an unchanged inode both mean "not yet" */
      if (stat (api_segment_path, &statb) == 0
	  && statb.st_ino != old_inode)
	break;
      restart_sleep_ms (VPP_RESTART_POLL_MS);
      sleeps++;
    }

  if (wait == VPP_RESTART_POLLS)
    {
      clib_error ("Timeout waiting for new inode to appear...");
      return 5;
    }

  if (verbose && sleeps > 0)
    fformat (stdout, "Inode sleeps %d\n", sleeps);

  if (verbose)
    fformat (stdout, "New inode %llu\n", (unsigned long long) statb.st_ino);

  /*
   * Step 6: remap the SVM database
   */
  svmdb_client = svmdb_map_chroot ((char *) chroot_path);

  pidp = svmdb_local_get_variable_reference (svmdb_client,
					     SVMDB_NAMESPACE_VEC,
					     "vpp_pid");
  if (pidp == 0)
    {
      svmdb_unmap (svmdb_client);
      clib_error ("post_restart: 'vpp_pid' svm variable not found, "
		  "vpp did not restart?");
      return 2;
    }

  /*
   * Step 7: wait up to 15 seconds for vpp to publish its new PID
   */
  sleeps = 0;
  new_pid = 0;
  for (wait = 0; wait < VPP_RESTART_POLLS; wait++)
    {
      new_pid = *pidp;
      if (new_pid && new_pid != old_pid)
	break;
      restart_sleep_ms (VPP_RESTART_POLL_MS);
      sleeps++;
    }

  if (wait == VPP_RESTART_POLLS)
    {
      svmdb_unmap (svmdb_client);
      clib_error ("Timeout waiting for vpp to publish pid after restart...");
      return 4;
    }

  /* Done... */
  if (verbose && sleeps)
    fformat (stdout, "pid sleeps %d\n", sleeps);

  if (verbose)
    fformat (stdout, "New PID %d... Restarted...\n", new_pid);

  svmdb_unmap (svmdb_client);
  return 0;
}
/*
 * Program entry point.
 *
 * Calls clib_mem_init (0, 64 << 20) (presumably base address and heap
 * size; confirm against vppinfra), wraps argv in an unformat input, runs
 * restart_main_fn on it and uses that function's result as the exit status.
 * argc is not used.
 */
int main (int argc, char **argv)
{
  unformat_input_t cmdline;
  int status;

  clib_mem_init (0, 64ULL << 20);

  unformat_init_command_line (&cmdline, argv);
  status = restart_main_fn (&cmdline);
  unformat_free (&cmdline);

  return status;
}