blob: 3b3acfa3d1b7afd5f75fa891015273acd4250ac8 [file] [log] [blame]
Ed Warnickecb9cada2015-12-08 15:45:58 -07001/*
2 * Copyright (c) 2015 Cisco and/or its affiliates.
3 * Licensed under the Apache License, Version 2.0 (the "License");
4 * you may not use this file except in compliance with the License.
5 * You may obtain a copy of the License at:
6 *
7 * http://www.apache.org/licenses/LICENSE-2.0
8 *
9 * Unless required by applicable law or agreed to in writing, software
10 * distributed under the License is distributed on an "AS IS" BASIS,
11 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 * See the License for the specific language governing permissions and
13 * limitations under the License.
14 */
15/*
16 Copyright (c) 2005 Eliot Dresselhaus
17
18 Permission is hereby granted, free of charge, to any person obtaining
19 a copy of this software and associated documentation files (the
20 "Software"), to deal in the Software without restriction, including
21 without limitation the rights to use, copy, modify, merge, publish,
22 distribute, sublicense, and/or sell copies of the Software, and to
23 permit persons to whom the Software is furnished to do so, subject to
24 the following conditions:
25
26 The above copyright notice and this permission notice shall be
27 included in all copies or substantial portions of the Software.
28
29 THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
30 EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
31 MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
32 NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
33 LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
34 OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
35 WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
36*/
37
38#include <vppinfra/os.h>
39#include <vppinfra/time.h>
40#include <vppinfra/format.h>
Damjan Marionc0e939b2016-11-12 11:50:01 +010041#include <vppinfra/cpu.h>
Dave Barachc25048b2020-01-29 18:05:24 -050042#include <math.h>
Ed Warnickecb9cada2015-12-08 15:45:58 -070043
44#ifdef CLIB_UNIX
45
46#include <math.h>
47#include <sys/time.h>
48#include <fcntl.h>
49
Dave Barachc3799992016-08-15 11:12:27 -040050/* Not very accurate way of determining cpu clock frequency
Ed Warnickecb9cada2015-12-08 15:45:58 -070051 for unix. Better to use /proc/cpuinfo on linux. */
Dave Barachc3799992016-08-15 11:12:27 -040052static f64
53estimate_clock_frequency (f64 sample_time)
Ed Warnickecb9cada2015-12-08 15:45:58 -070054{
Ed Warnickecb9cada2015-12-08 15:45:58 -070055 f64 time_now, time_start, time_limit, freq;
Dave Barachc25048b2020-01-29 18:05:24 -050056 u64 t[2];
Ed Warnickecb9cada2015-12-08 15:45:58 -070057
58 time_start = time_now = unix_time_now ();
59 time_limit = time_now + sample_time;
60 t[0] = clib_cpu_time_now ();
61 while (time_now < time_limit)
62 time_now = unix_time_now ();
63 t[1] = clib_cpu_time_now ();
64
65 freq = (t[1] - t[0]) / (time_now - time_start);
Ed Warnickecb9cada2015-12-08 15:45:58 -070066
67 return freq;
68}
69
70/* Fetch cpu frequency via parseing /proc/cpuinfo.
Dave Barachc3799992016-08-15 11:12:27 -040071 Only works for Linux. */
72static f64
73clock_frequency_from_proc_filesystem (void)
Ed Warnickecb9cada2015-12-08 15:45:58 -070074{
Dave Barachc3799992016-08-15 11:12:27 -040075 f64 cpu_freq = 1e9; /* better than 40... */
76 f64 ppc_timebase = 0; /* warnings be gone */
Ed Warnickecb9cada2015-12-08 15:45:58 -070077 int fd;
78 unformat_input_t input;
79
Dave Barach61efa142016-01-22 08:23:09 -050080/* $$$$ aarch64 kernel doesn't report "cpu MHz" */
81#if defined(__aarch64__)
82 return 0.0;
83#endif
Dave Barachc3799992016-08-15 11:12:27 -040084
Ed Warnickecb9cada2015-12-08 15:45:58 -070085 cpu_freq = 0;
86 fd = open ("/proc/cpuinfo", 0);
87 if (fd < 0)
88 return cpu_freq;
89
Dave Barach59b25652017-09-10 15:04:27 -040090 unformat_init_clib_file (&input, fd);
Ed Warnickecb9cada2015-12-08 15:45:58 -070091
92 ppc_timebase = 0;
93 while (unformat_check_input (&input) != UNFORMAT_END_OF_INPUT)
94 {
95 if (unformat (&input, "cpu MHz : %f", &cpu_freq))
96 cpu_freq *= 1e6;
97 else if (unformat (&input, "timebase : %f", &ppc_timebase))
98 ;
99 else
100 unformat_skip_line (&input);
101 }
102
103 unformat_free (&input);
104
105 close (fd);
106
107 /* Override CPU frequency with time base for PPC. */
108 if (ppc_timebase != 0)
109 cpu_freq = ppc_timebase;
110
111 return cpu_freq;
112}
113
114/* Fetch cpu frequency via reading /sys/devices/system/cpu/cpu0/cpufreq/cpuinfo_max_freq
Dave Barachc3799992016-08-15 11:12:27 -0400115 Only works for Linux. */
116static f64
117clock_frequency_from_sys_filesystem (void)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700118{
Dave Barach96e2d442018-11-14 11:42:03 -0500119 f64 cpu_freq = 0.0;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700120 int fd;
121 unformat_input_t input;
122
123 /* Time stamp always runs at max frequency. */
124 cpu_freq = 0;
125 fd = open ("/sys/devices/system/cpu/cpu0/cpufreq/cpuinfo_max_freq", 0);
126 if (fd < 0)
127 goto done;
128
Dave Barach59b25652017-09-10 15:04:27 -0400129 unformat_init_clib_file (&input, fd);
Dave Barach96e2d442018-11-14 11:42:03 -0500130 (void) unformat (&input, "%f", &cpu_freq);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700131 cpu_freq *= 1e3; /* measured in kHz */
132 unformat_free (&input);
133 close (fd);
Dave Barachc3799992016-08-15 11:12:27 -0400134done:
Ed Warnickecb9cada2015-12-08 15:45:58 -0700135 return cpu_freq;
136}
137
Dave Barachc3799992016-08-15 11:12:27 -0400138f64
139os_cpu_clock_frequency (void)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700140{
Brian Brooksc0379ae2018-01-09 16:39:07 -0600141#if defined (__aarch64__)
142 /* The system counter increments at a fixed frequency. It is distributed
143 * to each core which has registers for reading the current counter value
144 * as well as the clock frequency. The system counter is not clocked at
145 * the same frequency as the core. */
Sirshak Das40c6e1d2018-05-29 21:21:02 -0500146 u64 hz;
Brian Brooksc0379ae2018-01-09 16:39:07 -0600147 asm volatile ("mrs %0, cntfrq_el0":"=r" (hz));
148 return (f64) hz;
149#endif
Ed Warnickecb9cada2015-12-08 15:45:58 -0700150 f64 cpu_freq;
151
Damjan Marion12e3e312019-12-18 18:45:19 +0100152#ifdef __x86_64__
153 u32 __clib_unused eax = 0, ebx = 0, ecx = 0, edx = 0;
154 clib_get_cpuid (0x00, &eax, &ebx, &ecx, &edx);
155 if (eax >= 0x15)
156 {
157 u32 max_leaf = eax;
158 /*
159 CPUID Leaf 0x15 - Time Stamp Counter and Nominal Core Crystal Clock Info
160 eax - denominator of the TSC/”core crystal clock” ratio
161 ebx - numerator of the TSC/”core crystal clock” ratio
162 ecx - nominal frequency of the core crystal clock in Hz
163 edx - reseved
164 */
165
166 clib_get_cpuid (0x15, &eax, &ebx, &ecx, &edx);
167 if (ebx && ecx)
168 return ecx * ebx / eax;
169
170 if (max_leaf >= 0x16)
171 {
172 /*
173 CPUID Leaf 0x16 - Processor Frequency Information Leaf
174 eax - Bits 15 - 00: Processor Base Frequency (in MHz).
175 */
176
177 clib_get_cpuid (0x16, &eax, &ebx, &ecx, &edx);
178 if (eax)
179 return 1e6 * (eax & 0xffff);
180 }
181 }
182#endif
183
Dave Barachc25048b2020-01-29 18:05:24 -0500184 /* If we have an invariant TSC, use it to estimate the clock frequency */
Damjan Marionc0e939b2016-11-12 11:50:01 +0100185 if (clib_cpu_supports_invariant_tsc ())
186 return estimate_clock_frequency (1e-3);
187
Dave Barachc25048b2020-01-29 18:05:24 -0500188 /* Next, try /sys version. */
Ed Warnickecb9cada2015-12-08 15:45:58 -0700189 cpu_freq = clock_frequency_from_sys_filesystem ();
190 if (cpu_freq != 0)
191 return cpu_freq;
192
193 /* Next try /proc version. */
194 cpu_freq = clock_frequency_from_proc_filesystem ();
195 if (cpu_freq != 0)
196 return cpu_freq;
197
198 /* If /proc/cpuinfo fails (e.g. not running on Linux) fall back to
199 gettimeofday based estimated clock frequency. */
200 return estimate_clock_frequency (1e-3);
201}
202
203#endif /* CLIB_UNIX */
204
205/* Initialize time. */
Dave Barachc3799992016-08-15 11:12:27 -0400206void
207clib_time_init (clib_time_t * c)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700208{
Dave Barachb7b92992018-10-17 10:38:51 -0400209 clib_memset (c, 0, sizeof (c[0]));
Ed Warnickecb9cada2015-12-08 15:45:58 -0700210 c->clocks_per_second = os_cpu_clock_frequency ();
211 c->seconds_per_clock = 1 / c->clocks_per_second;
212 c->log2_clocks_per_second = min_log2_u64 ((u64) c->clocks_per_second);
213
Dave Barachc25048b2020-01-29 18:05:24 -0500214 /* Verify frequency every 16 sec */
215 c->log2_clocks_per_frequency_verify = c->log2_clocks_per_second + 4;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700216
217 c->last_verify_reference_time = unix_time_now ();
Dave Barachc25048b2020-01-29 18:05:24 -0500218 c->init_reference_time = c->last_verify_reference_time;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700219 c->last_cpu_time = clib_cpu_time_now ();
220 c->init_cpu_time = c->last_verify_cpu_time = c->last_cpu_time;
Dave Barachc25048b2020-01-29 18:05:24 -0500221 c->total_cpu_time = 0ULL;
222
223 /*
224 * Use exponential smoothing, with a half-life of 1 minute
225 * reported_rate(t) = reported_rate(t-1) * K + rate(t)*(1-K)
226 * where K = e**(-1.0/3.75);
227 * 15 samples in 4 minutes
228 * 7.5 samples in 2 minutes,
229 * 3.75 samples in 1 minute, etc.
230 */
231 c->damping_constant = exp (-1.0 / 3.75);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700232}
233
Dave Barachc3799992016-08-15 11:12:27 -0400234void
235clib_time_verify_frequency (clib_time_t * c)
Ed Warnickecb9cada2015-12-08 15:45:58 -0700236{
Dave Barachc25048b2020-01-29 18:05:24 -0500237 f64 now_reference, delta_reference, delta_reference_max;
238 u64 delta_clock;
Dave Barach36feebb2018-09-07 11:12:27 -0400239 f64 new_clocks_per_second, delta;
Dave Barachc25048b2020-01-29 18:05:24 -0500240
241 /* Ask the kernel and the CPU what time it is... */
242 now_reference = unix_time_now ();
243 c->last_cpu_time = clib_cpu_time_now ();
244
245 /* Calculate a new clock rate sample */
246 delta_reference = now_reference - c->last_verify_reference_time;
247 delta_clock = c->last_cpu_time - c->last_verify_cpu_time;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700248
249 c->last_verify_cpu_time = c->last_cpu_time;
250 c->last_verify_reference_time = now_reference;
251
Dave Barachc3799992016-08-15 11:12:27 -0400252 /*
253 * Is the reported reference interval non-positive,
254 * or off by a factor of two - or 8 seconds - whichever is larger?
Ed Warnickecb9cada2015-12-08 15:45:58 -0700255 * Someone reset the clock behind our back.
256 */
Dave Barachc25048b2020-01-29 18:05:24 -0500257 delta_reference_max = (f64) (2ULL << c->log2_clocks_per_frequency_verify) /
Dave Barachc3799992016-08-15 11:12:27 -0400258 (f64) (1ULL << c->log2_clocks_per_second);
Dave Barachc25048b2020-01-29 18:05:24 -0500259 delta_reference_max = delta_reference_max > 8.0 ? delta_reference_max : 8.0;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700260
Dave Barachc25048b2020-01-29 18:05:24 -0500261 /* Ignore this sample */
262 if (delta_reference <= 0.0 || delta_reference > delta_reference_max)
263 return;
Dave Barachba603ba2018-11-07 17:40:19 -0500264
Dave Barach36feebb2018-09-07 11:12:27 -0400265 /*
266 * Reject large frequency changes, another consequence of
267 * system clock changes particularly with old kernels.
268 */
Dave Barachc25048b2020-01-29 18:05:24 -0500269 new_clocks_per_second = ((f64) delta_clock) / delta_reference;
Dave Barach36feebb2018-09-07 11:12:27 -0400270
Dave Barache52d8d82019-12-01 08:59:03 -0500271 /* Compute abs(rate change) */
Dave Barach36feebb2018-09-07 11:12:27 -0400272 delta = new_clocks_per_second - c->clocks_per_second;
273 if (delta < 0.0)
274 delta = -delta;
275
Dave Barachc25048b2020-01-29 18:05:24 -0500276 /* If rate change > 1%, reject this sample */
Dave Barach36feebb2018-09-07 11:12:27 -0400277 if (PREDICT_FALSE ((delta / c->clocks_per_second) > .01))
278 {
279 clib_warning ("Rejecting large frequency change of %.2f%%",
280 (delta / c->clocks_per_second) * 100.0);
Dave Barach36feebb2018-09-07 11:12:27 -0400281 return;
282 }
283
Dave Barachc25048b2020-01-29 18:05:24 -0500284 /* Add sample to the exponentially-smoothed rate */
285 c->clocks_per_second = c->clocks_per_second * c->damping_constant +
286 (1.0 - c->damping_constant) * new_clocks_per_second;
287 c->seconds_per_clock = 1.0 / c->clocks_per_second;
Ed Warnickecb9cada2015-12-08 15:45:58 -0700288
Dave Barache52d8d82019-12-01 08:59:03 -0500289 /*
Dave Barachc25048b2020-01-29 18:05:24 -0500290 * Recalculate total_cpu_time based on the kernel timebase, and
291 * the calculated clock rate
Dave Barache52d8d82019-12-01 08:59:03 -0500292 */
Dave Barachc25048b2020-01-29 18:05:24 -0500293 c->total_cpu_time =
294 (now_reference - c->init_reference_time) * c->clocks_per_second;
295}
Dave Barache52d8d82019-12-01 08:59:03 -0500296
Dave Barachc25048b2020-01-29 18:05:24 -0500297
298u8 *
299format_clib_time (u8 * s, va_list * args)
300{
301 clib_time_t *c = va_arg (*args, clib_time_t *);
302 int verbose = va_arg (*args, int);
303 f64 now, reftime, delta_reftime_in_seconds, error;
304
305 /* Compute vpp elapsed time from the CPU clock */
306 reftime = unix_time_now ();
307 now = clib_time_now (c);
308
309 s = format (s, "Time now %.6f", now);
310 if (verbose == 0)
311 return s;
312
313 /* And also from the kernel */
314 delta_reftime_in_seconds = reftime - c->init_reference_time;
315
316 error = now - delta_reftime_in_seconds;
317
318 s = format (s, ", reftime %.6f, error %.6f, clocks/sec %.6f",
319 delta_reftime_in_seconds, error, c->clocks_per_second);
320 return (s);
Ed Warnickecb9cada2015-12-08 15:45:58 -0700321}
Dave Barachc3799992016-08-15 11:12:27 -0400322
323/*
324 * fd.io coding-style-patch-verification: ON
325 *
326 * Local Variables:
327 * eval: (c-set-style "gnu")
328 * End:
329 */