blob: 3377828bbc5c171d8a9eea65dbffee2315c2804d [file] [log] [blame]
Ed Warnickecb9cada2015-12-08 15:45:58 -07001/*
2 * Copyright (c) 2015 Cisco and/or its affiliates.
3 * Licensed under the Apache License, Version 2.0 (the "License");
4 * you may not use this file except in compliance with the License.
5 * You may obtain a copy of the License at:
6 *
7 * http://www.apache.org/licenses/LICENSE-2.0
8 *
9 * Unless required by applicable law or agreed to in writing, software
10 * distributed under the License is distributed on an "AS IS" BASIS,
11 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 * See the License for the specific language governing permissions and
13 * limitations under the License.
14 */
15/*
16 Copyright (c) 2005 Eliot Dresselhaus
17
18 Permission is hereby granted, free of charge, to any person obtaining
19 a copy of this software and associated documentation files (the
20 "Software"), to deal in the Software without restriction, including
21 without limitation the rights to use, copy, modify, merge, publish,
22 distribute, sublicense, and/or sell copies of the Software, and to
23 permit persons to whom the Software is furnished to do so, subject to
24 the following conditions:
25
26 The above copyright notice and this permission notice shall be
27 included in all copies or substantial portions of the Software.
28
29 THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
30 EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
31 MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
32 NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
33 LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
34 OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
35 WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
36*/
37
38#include <vppinfra/os.h>
39#include <vppinfra/time.h>
40#include <vppinfra/format.h>
Damjan Marionc0e939b2016-11-12 11:50:01 +010041#include <vppinfra/cpu.h>
Dave Barachc25048b2020-01-29 18:05:24 -050042#include <math.h>
Ed Warnickecb9cada2015-12-08 15:45:58 -070043
44#ifdef CLIB_UNIX
45
46#include <math.h>
47#include <sys/time.h>
48#include <fcntl.h>
49
Dave Barachc3799992016-08-15 11:12:27 -040050/* Not very accurate way of determining cpu clock frequency
Ed Warnickecb9cada2015-12-08 15:45:58 -070051 for unix. Better to use /proc/cpuinfo on linux. */
Dave Barachc3799992016-08-15 11:12:27 -040052static f64
53estimate_clock_frequency (f64 sample_time)
Ed Warnickecb9cada2015-12-08 15:45:58 -070054{
Ed Warnickecb9cada2015-12-08 15:45:58 -070055 f64 time_now, time_start, time_limit, freq;
Dave Barachc25048b2020-01-29 18:05:24 -050056 u64 t[2];
Ed Warnickecb9cada2015-12-08 15:45:58 -070057
58 time_start = time_now = unix_time_now ();
59 time_limit = time_now + sample_time;
60 t[0] = clib_cpu_time_now ();
61 while (time_now < time_limit)
62 time_now = unix_time_now ();
63 t[1] = clib_cpu_time_now ();
64
65 freq = (t[1] - t[0]) / (time_now - time_start);
Ed Warnickecb9cada2015-12-08 15:45:58 -070066
67 return freq;
68}
69
70/* Fetch cpu frequency via parseing /proc/cpuinfo.
Dave Barachc3799992016-08-15 11:12:27 -040071 Only works for Linux. */
72static f64
73clock_frequency_from_proc_filesystem (void)
Ed Warnickecb9cada2015-12-08 15:45:58 -070074{
Dave Barachc3799992016-08-15 11:12:27 -040075 f64 cpu_freq = 1e9; /* better than 40... */
76 f64 ppc_timebase = 0; /* warnings be gone */
Ed Warnickecb9cada2015-12-08 15:45:58 -070077 int fd;
78 unformat_input_t input;
79
Dave Barach61efa142016-01-22 08:23:09 -050080/* $$$$ aarch64 kernel doesn't report "cpu MHz" */
81#if defined(__aarch64__)
82 return 0.0;
83#endif
Dave Barachc3799992016-08-15 11:12:27 -040084
Ed Warnickecb9cada2015-12-08 15:45:58 -070085 cpu_freq = 0;
86 fd = open ("/proc/cpuinfo", 0);
87 if (fd < 0)
88 return cpu_freq;
89
Dave Barach59b25652017-09-10 15:04:27 -040090 unformat_init_clib_file (&input, fd);
Ed Warnickecb9cada2015-12-08 15:45:58 -070091
92 ppc_timebase = 0;
93 while (unformat_check_input (&input) != UNFORMAT_END_OF_INPUT)
94 {
95 if (unformat (&input, "cpu MHz : %f", &cpu_freq))
96 cpu_freq *= 1e6;
97 else if (unformat (&input, "timebase : %f", &ppc_timebase))
98 ;
99 else
100 unformat_skip_line (&input);
101 }
102
103 unformat_free (&input);
104
105 close (fd);
106
107 /* Override CPU frequency with time base for PPC. */
108 if (ppc_timebase != 0)
109 cpu_freq = ppc_timebase;
110
111 return cpu_freq;
112}
113
114/* Fetch cpu frequency via reading /sys/devices/system/cpu/cpu0/cpufreq/cpuinfo_max_freq
Dave Barachc3799992016-08-15 11:12:27 -0400115 Only works for Linux. */
116static f64
117clock_frequency_from_sys_filesystem (void)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700118{
Dave Barach96e2d442018-11-14 11:42:03 -0500119 f64 cpu_freq = 0.0;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700120 int fd;
121 unformat_input_t input;
122
123 /* Time stamp always runs at max frequency. */
124 cpu_freq = 0;
125 fd = open ("/sys/devices/system/cpu/cpu0/cpufreq/cpuinfo_max_freq", 0);
126 if (fd < 0)
127 goto done;
128
Dave Barach59b25652017-09-10 15:04:27 -0400129 unformat_init_clib_file (&input, fd);
Dave Barach96e2d442018-11-14 11:42:03 -0500130 (void) unformat (&input, "%f", &cpu_freq);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700131 cpu_freq *= 1e3; /* measured in kHz */
132 unformat_free (&input);
133 close (fd);
Dave Barachc3799992016-08-15 11:12:27 -0400134done:
Ed Warnickecb9cada2015-12-08 15:45:58 -0700135 return cpu_freq;
136}
137
Damjan Mariondae1c7e2020-10-17 13:32:25 +0200138__clib_export f64
Dave Barachc3799992016-08-15 11:12:27 -0400139os_cpu_clock_frequency (void)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700140{
Brian Brooksc0379ae2018-01-09 16:39:07 -0600141#if defined (__aarch64__)
142 /* The system counter increments at a fixed frequency. It is distributed
143 * to each core which has registers for reading the current counter value
144 * as well as the clock frequency. The system counter is not clocked at
145 * the same frequency as the core. */
Sirshak Das40c6e1d2018-05-29 21:21:02 -0500146 u64 hz;
Brian Brooksc0379ae2018-01-09 16:39:07 -0600147 asm volatile ("mrs %0, cntfrq_el0":"=r" (hz));
148 return (f64) hz;
149#endif
Ed Warnickecb9cada2015-12-08 15:45:58 -0700150 f64 cpu_freq;
151
Damjan Marion12e3e312019-12-18 18:45:19 +0100152#ifdef __x86_64__
153 u32 __clib_unused eax = 0, ebx = 0, ecx = 0, edx = 0;
154 clib_get_cpuid (0x00, &eax, &ebx, &ecx, &edx);
155 if (eax >= 0x15)
156 {
157 u32 max_leaf = eax;
158 /*
159 CPUID Leaf 0x15 - Time Stamp Counter and Nominal Core Crystal Clock Info
160 eax - denominator of the TSC/”core crystal clock” ratio
161 ebx - numerator of the TSC/”core crystal clock” ratio
162 ecx - nominal frequency of the core crystal clock in Hz
163 edx - reseved
164 */
165
166 clib_get_cpuid (0x15, &eax, &ebx, &ecx, &edx);
167 if (ebx && ecx)
Damjan Marionfa958422020-03-04 20:06:06 +0100168 return (u64) ecx *ebx / eax;
Damjan Marion12e3e312019-12-18 18:45:19 +0100169
170 if (max_leaf >= 0x16)
171 {
172 /*
173 CPUID Leaf 0x16 - Processor Frequency Information Leaf
174 eax - Bits 15 - 00: Processor Base Frequency (in MHz).
175 */
176
177 clib_get_cpuid (0x16, &eax, &ebx, &ecx, &edx);
178 if (eax)
179 return 1e6 * (eax & 0xffff);
180 }
181 }
182#endif
183
Dave Barachc25048b2020-01-29 18:05:24 -0500184 /* If we have an invariant TSC, use it to estimate the clock frequency */
Damjan Marionc0e939b2016-11-12 11:50:01 +0100185 if (clib_cpu_supports_invariant_tsc ())
186 return estimate_clock_frequency (1e-3);
187
Dave Barachc25048b2020-01-29 18:05:24 -0500188 /* Next, try /sys version. */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700189 cpu_freq = clock_frequency_from_sys_filesystem ();
190 if (cpu_freq != 0)
191 return cpu_freq;
192
193 /* Next try /proc version. */
194 cpu_freq = clock_frequency_from_proc_filesystem ();
195 if (cpu_freq != 0)
196 return cpu_freq;
197
198 /* If /proc/cpuinfo fails (e.g. not running on Linux) fall back to
199 gettimeofday based estimated clock frequency. */
200 return estimate_clock_frequency (1e-3);
201}
202
203#endif /* CLIB_UNIX */
204
205/* Initialize time. */
Damjan Mariondae1c7e2020-10-17 13:32:25 +0200206__clib_export void
Dave Barachc3799992016-08-15 11:12:27 -0400207clib_time_init (clib_time_t * c)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700208{
Dave Barachb7b92992018-10-17 10:38:51 -0400209 clib_memset (c, 0, sizeof (c[0]));
Ed Warnickecb9cada2015-12-08 15:45:58 -0700210 c->clocks_per_second = os_cpu_clock_frequency ();
Dave Barach51cabf22020-02-04 16:10:17 -0500211 /*
212 * Sporadic reports of os_cpu_clock_frequency() returning 0.0
213 * in highly parallel container environments.
214 * To avoid immediate division by zero:
215 * Step 1: try estimate_clock_frequency().
216 * Step 2: give up. Pretend we have a 2gHz clock.
217 */
218 if (PREDICT_FALSE (c->clocks_per_second == 0.0))
219 {
220 c->clocks_per_second = estimate_clock_frequency (1e-3);
221 if (c->clocks_per_second == 0.0)
222 {
223 clib_warning ("os_cpu_clock_frequency() returned 0.0, use 2e9...");
224 c->clocks_per_second = 2e9;
225 }
226 }
Ed Warnickecb9cada2015-12-08 15:45:58 -0700227 c->seconds_per_clock = 1 / c->clocks_per_second;
228 c->log2_clocks_per_second = min_log2_u64 ((u64) c->clocks_per_second);
229
Dave Barachc25048b2020-01-29 18:05:24 -0500230 /* Verify frequency every 16 sec */
231 c->log2_clocks_per_frequency_verify = c->log2_clocks_per_second + 4;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700232
233 c->last_verify_reference_time = unix_time_now ();
Dave Barachc25048b2020-01-29 18:05:24 -0500234 c->init_reference_time = c->last_verify_reference_time;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700235 c->last_cpu_time = clib_cpu_time_now ();
236 c->init_cpu_time = c->last_verify_cpu_time = c->last_cpu_time;
Dave Barachc25048b2020-01-29 18:05:24 -0500237 c->total_cpu_time = 0ULL;
238
239 /*
240 * Use exponential smoothing, with a half-life of 1 minute
241 * reported_rate(t) = reported_rate(t-1) * K + rate(t)*(1-K)
242 * where K = e**(-1.0/3.75);
243 * 15 samples in 4 minutes
244 * 7.5 samples in 2 minutes,
245 * 3.75 samples in 1 minute, etc.
246 */
247 c->damping_constant = exp (-1.0 / 3.75);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700248}
249
Damjan Mariondae1c7e2020-10-17 13:32:25 +0200250__clib_export void
Dave Barachc3799992016-08-15 11:12:27 -0400251clib_time_verify_frequency (clib_time_t * c)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700252{
Dave Barachc25048b2020-01-29 18:05:24 -0500253 f64 now_reference, delta_reference, delta_reference_max;
Dave Barach66441c42020-03-10 09:01:02 -0400254 f64 delta_clock_in_seconds;
255 u64 now_clock, delta_clock;
Dave Barach36feebb2018-09-07 11:12:27 -0400256 f64 new_clocks_per_second, delta;
Dave Barachc25048b2020-01-29 18:05:24 -0500257
258 /* Ask the kernel and the CPU what time it is... */
259 now_reference = unix_time_now ();
Dave Barach66441c42020-03-10 09:01:02 -0400260 now_clock = clib_cpu_time_now ();
261
262 /* Compute change in the reference clock */
263 delta_reference = now_reference - c->last_verify_reference_time;
264
265 /* And change in the CPU clock */
266 delta_clock_in_seconds = (f64) (now_clock - c->last_verify_cpu_time) *
267 c->seconds_per_clock;
268
269 /*
270 * Recompute vpp start time reference, and total clocks
271 * using the current clock rate
272 */
273 c->init_reference_time += (delta_reference - delta_clock_in_seconds);
274 c->total_cpu_time = (now_reference - c->init_reference_time)
275 * c->clocks_per_second;
276
277 c->last_cpu_time = now_clock;
Dave Barachc25048b2020-01-29 18:05:24 -0500278
279 /* Calculate a new clock rate sample */
Dave Barachc25048b2020-01-29 18:05:24 -0500280 delta_clock = c->last_cpu_time - c->last_verify_cpu_time;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700281
282 c->last_verify_cpu_time = c->last_cpu_time;
283 c->last_verify_reference_time = now_reference;
284
Dave Barachc3799992016-08-15 11:12:27 -0400285 /*
286 * Is the reported reference interval non-positive,
287 * or off by a factor of two - or 8 seconds - whichever is larger?
Ed Warnickecb9cada2015-12-08 15:45:58 -0700288 * Someone reset the clock behind our back.
289 */
Dave Barachc25048b2020-01-29 18:05:24 -0500290 delta_reference_max = (f64) (2ULL << c->log2_clocks_per_frequency_verify) /
Dave Barachc3799992016-08-15 11:12:27 -0400291 (f64) (1ULL << c->log2_clocks_per_second);
Dave Barachc25048b2020-01-29 18:05:24 -0500292 delta_reference_max = delta_reference_max > 8.0 ? delta_reference_max : 8.0;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700293
Dave Barachc25048b2020-01-29 18:05:24 -0500294 /* Ignore this sample */
295 if (delta_reference <= 0.0 || delta_reference > delta_reference_max)
296 return;
Dave Barachba603ba2018-11-07 17:40:19 -0500297
Dave Barach36feebb2018-09-07 11:12:27 -0400298 /*
299 * Reject large frequency changes, another consequence of
300 * system clock changes particularly with old kernels.
301 */
Dave Barachc25048b2020-01-29 18:05:24 -0500302 new_clocks_per_second = ((f64) delta_clock) / delta_reference;
Dave Barach36feebb2018-09-07 11:12:27 -0400303
Dave Barache52d8d82019-12-01 08:59:03 -0500304 /* Compute abs(rate change) */
Dave Barach36feebb2018-09-07 11:12:27 -0400305 delta = new_clocks_per_second - c->clocks_per_second;
306 if (delta < 0.0)
307 delta = -delta;
308
Dave Barachc25048b2020-01-29 18:05:24 -0500309 /* If rate change > 1%, reject this sample */
Dave Barach36feebb2018-09-07 11:12:27 -0400310 if (PREDICT_FALSE ((delta / c->clocks_per_second) > .01))
311 {
312 clib_warning ("Rejecting large frequency change of %.2f%%",
313 (delta / c->clocks_per_second) * 100.0);
Dave Barach36feebb2018-09-07 11:12:27 -0400314 return;
315 }
316
Dave Barachc25048b2020-01-29 18:05:24 -0500317 /* Add sample to the exponentially-smoothed rate */
318 c->clocks_per_second = c->clocks_per_second * c->damping_constant +
319 (1.0 - c->damping_constant) * new_clocks_per_second;
320 c->seconds_per_clock = 1.0 / c->clocks_per_second;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700321
Dave Barache52d8d82019-12-01 08:59:03 -0500322 /*
Dave Barachc25048b2020-01-29 18:05:24 -0500323 * Recalculate total_cpu_time based on the kernel timebase, and
324 * the calculated clock rate
Dave Barache52d8d82019-12-01 08:59:03 -0500325 */
Dave Barachc25048b2020-01-29 18:05:24 -0500326 c->total_cpu_time =
327 (now_reference - c->init_reference_time) * c->clocks_per_second;
328}
Dave Barache52d8d82019-12-01 08:59:03 -0500329
Dave Barachc25048b2020-01-29 18:05:24 -0500330
Damjan Mariondae1c7e2020-10-17 13:32:25 +0200331__clib_export u8 *
Dave Barachc25048b2020-01-29 18:05:24 -0500332format_clib_time (u8 * s, va_list * args)
333{
334 clib_time_t *c = va_arg (*args, clib_time_t *);
335 int verbose = va_arg (*args, int);
336 f64 now, reftime, delta_reftime_in_seconds, error;
337
338 /* Compute vpp elapsed time from the CPU clock */
339 reftime = unix_time_now ();
340 now = clib_time_now (c);
341
342 s = format (s, "Time now %.6f", now);
343 if (verbose == 0)
344 return s;
345
346 /* And also from the kernel */
347 delta_reftime_in_seconds = reftime - c->init_reference_time;
348
349 error = now - delta_reftime_in_seconds;
350
351 s = format (s, ", reftime %.6f, error %.6f, clocks/sec %.6f",
352 delta_reftime_in_seconds, error, c->clocks_per_second);
353 return (s);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700354}
Dave Barachc3799992016-08-15 11:12:27 -0400355
356/*
357 * fd.io coding-style-patch-verification: ON
358 *
359 * Local Variables:
360 * eval: (c-set-style "gnu")
361 * End:
362 */