blob: 27758dc7534e4b78a40871a6a699b96811cff852 [file] [log] [blame]
Ed Warnickecb9cada2015-12-08 15:45:58 -07001/*
2 * Copyright (c) 2015 Cisco and/or its affiliates.
3 * Licensed under the Apache License, Version 2.0 (the "License");
4 * you may not use this file except in compliance with the License.
5 * You may obtain a copy of the License at:
6 *
7 * http://www.apache.org/licenses/LICENSE-2.0
8 *
9 * Unless required by applicable law or agreed to in writing, software
10 * distributed under the License is distributed on an "AS IS" BASIS,
11 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 * See the License for the specific language governing permissions and
13 * limitations under the License.
14 */
15/*
16 Copyright (c) 2005 Eliot Dresselhaus
17
18 Permission is hereby granted, free of charge, to any person obtaining
19 a copy of this software and associated documentation files (the
20 "Software"), to deal in the Software without restriction, including
21 without limitation the rights to use, copy, modify, merge, publish,
22 distribute, sublicense, and/or sell copies of the Software, and to
23 permit persons to whom the Software is furnished to do so, subject to
24 the following conditions:
25
26 The above copyright notice and this permission notice shall be
27 included in all copies or substantial portions of the Software.
28
29 THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
30 EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
31 MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
32 NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
33 LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
34 OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
35 WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
36*/
37
38#include <vppinfra/os.h>
39#include <vppinfra/time.h>
40#include <vppinfra/format.h>
Damjan Marionc0e939b2016-11-12 11:50:01 +010041#include <vppinfra/cpu.h>
Dave Barachc25048b2020-01-29 18:05:24 -050042#include <math.h>
Ed Warnickecb9cada2015-12-08 15:45:58 -070043
44#ifdef CLIB_UNIX
45
46#include <math.h>
47#include <sys/time.h>
48#include <fcntl.h>
49
Dave Barachc3799992016-08-15 11:12:27 -040050/* Not very accurate way of determining cpu clock frequency
Ed Warnickecb9cada2015-12-08 15:45:58 -070051 for unix. Better to use /proc/cpuinfo on linux. */
Dave Barachc3799992016-08-15 11:12:27 -040052static f64
53estimate_clock_frequency (f64 sample_time)
Ed Warnickecb9cada2015-12-08 15:45:58 -070054{
Ed Warnickecb9cada2015-12-08 15:45:58 -070055 f64 time_now, time_start, time_limit, freq;
Dave Barachc25048b2020-01-29 18:05:24 -050056 u64 t[2];
Ed Warnickecb9cada2015-12-08 15:45:58 -070057
58 time_start = time_now = unix_time_now ();
59 time_limit = time_now + sample_time;
60 t[0] = clib_cpu_time_now ();
61 while (time_now < time_limit)
62 time_now = unix_time_now ();
63 t[1] = clib_cpu_time_now ();
64
65 freq = (t[1] - t[0]) / (time_now - time_start);
Ed Warnickecb9cada2015-12-08 15:45:58 -070066
67 return freq;
68}
69
70/* Fetch cpu frequency via parseing /proc/cpuinfo.
Dave Barachc3799992016-08-15 11:12:27 -040071 Only works for Linux. */
72static f64
73clock_frequency_from_proc_filesystem (void)
Ed Warnickecb9cada2015-12-08 15:45:58 -070074{
Dave Barachc3799992016-08-15 11:12:27 -040075 f64 cpu_freq = 1e9; /* better than 40... */
76 f64 ppc_timebase = 0; /* warnings be gone */
Ed Warnickecb9cada2015-12-08 15:45:58 -070077 int fd;
78 unformat_input_t input;
79
Dave Barach61efa142016-01-22 08:23:09 -050080/* $$$$ aarch64 kernel doesn't report "cpu MHz" */
81#if defined(__aarch64__)
82 return 0.0;
83#endif
Dave Barachc3799992016-08-15 11:12:27 -040084
Ed Warnickecb9cada2015-12-08 15:45:58 -070085 cpu_freq = 0;
86 fd = open ("/proc/cpuinfo", 0);
87 if (fd < 0)
88 return cpu_freq;
89
Dave Barach59b25652017-09-10 15:04:27 -040090 unformat_init_clib_file (&input, fd);
Ed Warnickecb9cada2015-12-08 15:45:58 -070091
92 ppc_timebase = 0;
93 while (unformat_check_input (&input) != UNFORMAT_END_OF_INPUT)
94 {
95 if (unformat (&input, "cpu MHz : %f", &cpu_freq))
96 cpu_freq *= 1e6;
97 else if (unformat (&input, "timebase : %f", &ppc_timebase))
98 ;
99 else
100 unformat_skip_line (&input);
101 }
102
103 unformat_free (&input);
104
105 close (fd);
106
107 /* Override CPU frequency with time base for PPC. */
108 if (ppc_timebase != 0)
109 cpu_freq = ppc_timebase;
110
111 return cpu_freq;
112}
113
114/* Fetch cpu frequency via reading /sys/devices/system/cpu/cpu0/cpufreq/cpuinfo_max_freq
Dave Barachc3799992016-08-15 11:12:27 -0400115 Only works for Linux. */
116static f64
117clock_frequency_from_sys_filesystem (void)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700118{
Dave Barach96e2d442018-11-14 11:42:03 -0500119 f64 cpu_freq = 0.0;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700120 int fd;
121 unformat_input_t input;
122
123 /* Time stamp always runs at max frequency. */
124 cpu_freq = 0;
125 fd = open ("/sys/devices/system/cpu/cpu0/cpufreq/cpuinfo_max_freq", 0);
126 if (fd < 0)
127 goto done;
128
Dave Barach59b25652017-09-10 15:04:27 -0400129 unformat_init_clib_file (&input, fd);
Dave Barach96e2d442018-11-14 11:42:03 -0500130 (void) unformat (&input, "%f", &cpu_freq);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700131 cpu_freq *= 1e3; /* measured in kHz */
132 unformat_free (&input);
133 close (fd);
Dave Barachc3799992016-08-15 11:12:27 -0400134done:
Ed Warnickecb9cada2015-12-08 15:45:58 -0700135 return cpu_freq;
136}
137
Dave Barachc3799992016-08-15 11:12:27 -0400138f64
139os_cpu_clock_frequency (void)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700140{
Brian Brooksc0379ae2018-01-09 16:39:07 -0600141#if defined (__aarch64__)
142 /* The system counter increments at a fixed frequency. It is distributed
143 * to each core which has registers for reading the current counter value
144 * as well as the clock frequency. The system counter is not clocked at
145 * the same frequency as the core. */
Sirshak Das40c6e1d2018-05-29 21:21:02 -0500146 u64 hz;
Brian Brooksc0379ae2018-01-09 16:39:07 -0600147 asm volatile ("mrs %0, cntfrq_el0":"=r" (hz));
148 return (f64) hz;
149#endif
Ed Warnickecb9cada2015-12-08 15:45:58 -0700150 f64 cpu_freq;
151
Damjan Marion12e3e312019-12-18 18:45:19 +0100152#ifdef __x86_64__
153 u32 __clib_unused eax = 0, ebx = 0, ecx = 0, edx = 0;
154 clib_get_cpuid (0x00, &eax, &ebx, &ecx, &edx);
155 if (eax >= 0x15)
156 {
157 u32 max_leaf = eax;
158 /*
159 CPUID Leaf 0x15 - Time Stamp Counter and Nominal Core Crystal Clock Info
160 eax - denominator of the TSC/”core crystal clock” ratio
161 ebx - numerator of the TSC/”core crystal clock” ratio
162 ecx - nominal frequency of the core crystal clock in Hz
163 edx - reseved
164 */
165
166 clib_get_cpuid (0x15, &eax, &ebx, &ecx, &edx);
167 if (ebx && ecx)
168 return ecx * ebx / eax;
169
170 if (max_leaf >= 0x16)
171 {
172 /*
173 CPUID Leaf 0x16 - Processor Frequency Information Leaf
174 eax - Bits 15 - 00: Processor Base Frequency (in MHz).
175 */
176
177 clib_get_cpuid (0x16, &eax, &ebx, &ecx, &edx);
178 if (eax)
179 return 1e6 * (eax & 0xffff);
180 }
181 }
182#endif
183
Dave Barachc25048b2020-01-29 18:05:24 -0500184 /* If we have an invariant TSC, use it to estimate the clock frequency */
Damjan Marionc0e939b2016-11-12 11:50:01 +0100185 if (clib_cpu_supports_invariant_tsc ())
186 return estimate_clock_frequency (1e-3);
187
Dave Barachc25048b2020-01-29 18:05:24 -0500188 /* Next, try /sys version. */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700189 cpu_freq = clock_frequency_from_sys_filesystem ();
190 if (cpu_freq != 0)
191 return cpu_freq;
192
193 /* Next try /proc version. */
194 cpu_freq = clock_frequency_from_proc_filesystem ();
195 if (cpu_freq != 0)
196 return cpu_freq;
197
198 /* If /proc/cpuinfo fails (e.g. not running on Linux) fall back to
199 gettimeofday based estimated clock frequency. */
200 return estimate_clock_frequency (1e-3);
201}
202
203#endif /* CLIB_UNIX */
204
205/* Initialize time. */
Dave Barachc3799992016-08-15 11:12:27 -0400206void
207clib_time_init (clib_time_t * c)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700208{
Dave Barachb7b92992018-10-17 10:38:51 -0400209 clib_memset (c, 0, sizeof (c[0]));
Ed Warnickecb9cada2015-12-08 15:45:58 -0700210 c->clocks_per_second = os_cpu_clock_frequency ();
Dave Barach51cabf22020-02-04 16:10:17 -0500211 /*
212 * Sporadic reports of os_cpu_clock_frequency() returning 0.0
213 * in highly parallel container environments.
214 * To avoid immediate division by zero:
215 * Step 1: try estimate_clock_frequency().
216 * Step 2: give up. Pretend we have a 2gHz clock.
217 */
218 if (PREDICT_FALSE (c->clocks_per_second == 0.0))
219 {
220 c->clocks_per_second = estimate_clock_frequency (1e-3);
221 if (c->clocks_per_second == 0.0)
222 {
223 clib_warning ("os_cpu_clock_frequency() returned 0.0, use 2e9...");
224 c->clocks_per_second = 2e9;
225 }
226 }
Ed Warnickecb9cada2015-12-08 15:45:58 -0700227 c->seconds_per_clock = 1 / c->clocks_per_second;
228 c->log2_clocks_per_second = min_log2_u64 ((u64) c->clocks_per_second);
229
Dave Barachc25048b2020-01-29 18:05:24 -0500230 /* Verify frequency every 16 sec */
231 c->log2_clocks_per_frequency_verify = c->log2_clocks_per_second + 4;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700232
233 c->last_verify_reference_time = unix_time_now ();
Dave Barachc25048b2020-01-29 18:05:24 -0500234 c->init_reference_time = c->last_verify_reference_time;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700235 c->last_cpu_time = clib_cpu_time_now ();
236 c->init_cpu_time = c->last_verify_cpu_time = c->last_cpu_time;
Dave Barachc25048b2020-01-29 18:05:24 -0500237 c->total_cpu_time = 0ULL;
238
239 /*
240 * Use exponential smoothing, with a half-life of 1 minute
241 * reported_rate(t) = reported_rate(t-1) * K + rate(t)*(1-K)
242 * where K = e**(-1.0/3.75);
243 * 15 samples in 4 minutes
244 * 7.5 samples in 2 minutes,
245 * 3.75 samples in 1 minute, etc.
246 */
247 c->damping_constant = exp (-1.0 / 3.75);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700248}
249
Dave Barachc3799992016-08-15 11:12:27 -0400250void
251clib_time_verify_frequency (clib_time_t * c)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700252{
Dave Barachc25048b2020-01-29 18:05:24 -0500253 f64 now_reference, delta_reference, delta_reference_max;
254 u64 delta_clock;
Dave Barach36feebb2018-09-07 11:12:27 -0400255 f64 new_clocks_per_second, delta;
Dave Barachc25048b2020-01-29 18:05:24 -0500256
257 /* Ask the kernel and the CPU what time it is... */
258 now_reference = unix_time_now ();
259 c->last_cpu_time = clib_cpu_time_now ();
260
261 /* Calculate a new clock rate sample */
262 delta_reference = now_reference - c->last_verify_reference_time;
263 delta_clock = c->last_cpu_time - c->last_verify_cpu_time;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700264
265 c->last_verify_cpu_time = c->last_cpu_time;
266 c->last_verify_reference_time = now_reference;
267
Dave Barachc3799992016-08-15 11:12:27 -0400268 /*
269 * Is the reported reference interval non-positive,
270 * or off by a factor of two - or 8 seconds - whichever is larger?
Ed Warnickecb9cada2015-12-08 15:45:58 -0700271 * Someone reset the clock behind our back.
272 */
Dave Barachc25048b2020-01-29 18:05:24 -0500273 delta_reference_max = (f64) (2ULL << c->log2_clocks_per_frequency_verify) /
Dave Barachc3799992016-08-15 11:12:27 -0400274 (f64) (1ULL << c->log2_clocks_per_second);
Dave Barachc25048b2020-01-29 18:05:24 -0500275 delta_reference_max = delta_reference_max > 8.0 ? delta_reference_max : 8.0;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700276
Dave Barachc25048b2020-01-29 18:05:24 -0500277 /* Ignore this sample */
278 if (delta_reference <= 0.0 || delta_reference > delta_reference_max)
279 return;
Dave Barachba603ba2018-11-07 17:40:19 -0500280
Dave Barach36feebb2018-09-07 11:12:27 -0400281 /*
282 * Reject large frequency changes, another consequence of
283 * system clock changes particularly with old kernels.
284 */
Dave Barachc25048b2020-01-29 18:05:24 -0500285 new_clocks_per_second = ((f64) delta_clock) / delta_reference;
Dave Barach36feebb2018-09-07 11:12:27 -0400286
Dave Barache52d8d82019-12-01 08:59:03 -0500287 /* Compute abs(rate change) */
Dave Barach36feebb2018-09-07 11:12:27 -0400288 delta = new_clocks_per_second - c->clocks_per_second;
289 if (delta < 0.0)
290 delta = -delta;
291
Dave Barachc25048b2020-01-29 18:05:24 -0500292 /* If rate change > 1%, reject this sample */
Dave Barach36feebb2018-09-07 11:12:27 -0400293 if (PREDICT_FALSE ((delta / c->clocks_per_second) > .01))
294 {
295 clib_warning ("Rejecting large frequency change of %.2f%%",
296 (delta / c->clocks_per_second) * 100.0);
Dave Barach36feebb2018-09-07 11:12:27 -0400297 return;
298 }
299
Dave Barachc25048b2020-01-29 18:05:24 -0500300 /* Add sample to the exponentially-smoothed rate */
301 c->clocks_per_second = c->clocks_per_second * c->damping_constant +
302 (1.0 - c->damping_constant) * new_clocks_per_second;
303 c->seconds_per_clock = 1.0 / c->clocks_per_second;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700304
Dave Barache52d8d82019-12-01 08:59:03 -0500305 /*
Dave Barachc25048b2020-01-29 18:05:24 -0500306 * Recalculate total_cpu_time based on the kernel timebase, and
307 * the calculated clock rate
Dave Barache52d8d82019-12-01 08:59:03 -0500308 */
Dave Barachc25048b2020-01-29 18:05:24 -0500309 c->total_cpu_time =
310 (now_reference - c->init_reference_time) * c->clocks_per_second;
311}
Dave Barache52d8d82019-12-01 08:59:03 -0500312
Dave Barachc25048b2020-01-29 18:05:24 -0500313
314u8 *
315format_clib_time (u8 * s, va_list * args)
316{
317 clib_time_t *c = va_arg (*args, clib_time_t *);
318 int verbose = va_arg (*args, int);
319 f64 now, reftime, delta_reftime_in_seconds, error;
320
321 /* Compute vpp elapsed time from the CPU clock */
322 reftime = unix_time_now ();
323 now = clib_time_now (c);
324
325 s = format (s, "Time now %.6f", now);
326 if (verbose == 0)
327 return s;
328
329 /* And also from the kernel */
330 delta_reftime_in_seconds = reftime - c->init_reference_time;
331
332 error = now - delta_reftime_in_seconds;
333
334 s = format (s, ", reftime %.6f, error %.6f, clocks/sec %.6f",
335 delta_reftime_in_seconds, error, c->clocks_per_second);
336 return (s);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700337}
Dave Barachc3799992016-08-15 11:12:27 -0400338
339/*
340 * fd.io coding-style-patch-verification: ON
341 *
342 * Local Variables:
343 * eval: (c-set-style "gnu")
344 * End:
345 */