/*
 * sched_clock() for unstable CPU clocks
 *
 * Copyright (C) 2008 Red Hat, Inc., Peter Zijlstra
 *
 * Updates and enhancements:
 *   Copyright (C) 2008 Red Hat, Inc. Steven Rostedt <srostedt@redhat.com>
 *
 * Based on code by:
 *   Ingo Molnar <mingo@redhat.com>
 *   Guillaume Chazarain <guichaz@gmail.com>
 *
 *
 * What this file implements:
 *
 * cpu_clock(i) provides a fast (execution time) high resolution
 * clock with bounded drift between CPUs. The value of cpu_clock(i)
 * is monotonic for constant i. The timestamp returned is in nanoseconds.
 *
 * ######################### BIG FAT WARNING ##########################
 * # when comparing cpu_clock(i) to cpu_clock(j) for i != j, time can #
 * # go backwards !!                                                  #
 * ####################################################################
 *
 * There is no strict promise about the base, although it tends to start
 * at 0 on boot (but people really shouldn't rely on that).
 *
 * cpu_clock(i)       -- can be used from any context, including NMI.
 * local_clock()      -- is cpu_clock() on the current CPU.
 *
 * sched_clock_cpu(i)
 *
 * How it is implemented:
 *
 * When !CONFIG_HAVE_UNSTABLE_SCHED_CLOCK, the implementation simply uses
 * sched_clock(), which is then assumed to provide these properties
 * (mostly it means the architecture provides a globally synchronized
 * highres time source).
 *
 * Otherwise it tries to create a semi-stable clock from a mixture of other
 * clocks, including:
 *
 *  - GTOD (clock monotonic)
 *  - sched_clock()
 *  - explicit idle events
 *
 * We use GTOD as base and use sched_clock() deltas to improve resolution. The
 * deltas are filtered to provide monotonicity and keep it within an
 * expected window.
 *
 * Furthermore, explicit sleep and wakeup hooks allow us to account for time
 * that is otherwise invisible (TSC gets stopped).
 *
 */
#include "sched.h"
#include <linux/sched_clock.h>

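/*
 * Illustrative usage sketch, not part of this file: timing a short section
 * with local_clock().  Per the BIG FAT WARNING above, only deltas between
 * timestamps taken on the same CPU are meaningful, hence the preemption
 * disable around the measurement.  example_time_section() and
 * do_some_work() are hypothetical names.
 */
#if 0
static void example_time_section(void)
{
	u64 t0, t1;

	preempt_disable();
	t0 = local_clock();
	do_some_work();			/* the (hypothetical) work being timed */
	t1 = local_clock();
	preempt_enable();

	pr_debug("section took %llu ns\n", (unsigned long long)(t1 - t0));
}
#endif
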
/*
 * Scheduler clock - returns current time in nanosec units.
 * This is the default implementation.
 * Architectures and sub-architectures can override this.
 */
unsigned long long __weak sched_clock(void)
{
	return (unsigned long long)(jiffies - INITIAL_JIFFIES)
					* (NSEC_PER_SEC / HZ);
}
EXPORT_SYMBOL_GPL(sched_clock);
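
/*
 * Worked numbers for the default above (illustrative, not a code path):
 * it advances in steps of NSEC_PER_SEC / HZ, e.g. 1,000,000,000 / 250 =
 * 4,000,000 ns (4 ms) per jiffy with HZ=250, which is why architectures
 * with a finer clocksource are expected to override it.
 */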

static DEFINE_STATIC_KEY_FALSE(sched_clock_running);

#ifdef CONFIG_HAVE_UNSTABLE_SCHED_CLOCK
/*
 * We must start with !__sched_clock_stable because the unstable -> stable
 * transition is accurate, while the stable -> unstable transition is not.
 *
 * Similarly we start with __sched_clock_stable_early, thereby assuming we
 * will become stable, such that there's only a single 1 -> 0 transition.
 */
static DEFINE_STATIC_KEY_FALSE(__sched_clock_stable);
static int __sched_clock_stable_early = 1;

/*
 * We want: ktime_get_ns() + __gtod_offset == sched_clock() + __sched_clock_offset
 */
__read_mostly u64 __sched_clock_offset;
static __read_mostly u64 __gtod_offset;
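
/*
 * Illustrative rearrangement of the identity above, matching the formulas
 * used later in this file when tick_raw and tick_gtod are sampled at one
 * instant:
 *
 *	__sched_clock_offset = (tick_gtod + __gtod_offset) - tick_raw
 *		(solved for in __set_sched_clock_stable())
 *
 *	__gtod_offset = (tick_raw + __sched_clock_offset) - tick_gtod
 *		(solved for in __sched_clock_gtod_offset())
 */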

struct sched_clock_data {
	u64			tick_raw;
	u64			tick_gtod;
	u64			clock;
};

static DEFINE_PER_CPU_SHARED_ALIGNED(struct sched_clock_data, sched_clock_data);

static inline struct sched_clock_data *this_scd(void)
{
	return this_cpu_ptr(&sched_clock_data);
}

static inline struct sched_clock_data *cpu_sdc(int cpu)
{
	return &per_cpu(sched_clock_data, cpu);
}

int sched_clock_stable(void)
{
	return static_branch_likely(&__sched_clock_stable);
}

static void __scd_stamp(struct sched_clock_data *scd)
{
	scd->tick_gtod = ktime_get_ns();
	scd->tick_raw = sched_clock();
}

static void __set_sched_clock_stable(void)
{
	struct sched_clock_data *scd;

	/*
	 * Since we're still unstable and the tick is already running, we have
	 * to disable IRQs in order to get a consistent scd->tick* reading.
	 */
	local_irq_disable();
	scd = this_scd();
	/*
	 * Attempt to make the (initial) unstable->stable transition continuous.
	 */
	__sched_clock_offset = (scd->tick_gtod + __gtod_offset) - (scd->tick_raw);
	local_irq_enable();

	printk(KERN_INFO "sched_clock: Marking stable (%lld, %lld)->(%lld, %lld)\n",
			scd->tick_gtod, __gtod_offset,
			scd->tick_raw,  __sched_clock_offset);

	static_branch_enable(&__sched_clock_stable);
	tick_dep_clear(TICK_DEP_BIT_CLOCK_UNSTABLE);
}

/*
 * If we ever get here, we're screwed, because we found out -- typically after
 * the fact -- that TSC wasn't good. This means all our clocksources (including
 * ktime) could have reported wrong values.
 *
 * What we do here is an attempt to fix up and continue sort of where we left
 * off in a coherent manner.
 *
 * The only way to fully avoid random clock jumps is to boot with:
 * "tsc=unstable".
 */
static void __sched_clock_work(struct work_struct *work)
{
	struct sched_clock_data *scd;
	int cpu;

	/* take a current timestamp and set 'now' */
	preempt_disable();
	scd = this_scd();
	__scd_stamp(scd);
	scd->clock = scd->tick_gtod + __gtod_offset;
	preempt_enable();

	/* clone to all CPUs */
	for_each_possible_cpu(cpu)
		per_cpu(sched_clock_data, cpu) = *scd;

	printk(KERN_WARNING "TSC found unstable after boot, most likely due to broken BIOS. Use 'tsc=unstable'.\n");
	printk(KERN_INFO "sched_clock: Marking unstable (%lld, %lld)<-(%lld, %lld)\n",
			scd->tick_gtod, __gtod_offset,
			scd->tick_raw,  __sched_clock_offset);

	static_branch_disable(&__sched_clock_stable);
}

static DECLARE_WORK(sched_clock_work, __sched_clock_work);

static void __clear_sched_clock_stable(void)
{
	if (!sched_clock_stable())
		return;

	tick_dep_set(TICK_DEP_BIT_CLOCK_UNSTABLE);
	schedule_work(&sched_clock_work);
}

void clear_sched_clock_stable(void)
{
	__sched_clock_stable_early = 0;

	smp_mb(); /* matches sched_clock_init_late() */

	if (static_key_count(&sched_clock_running.key) == 2)
		__clear_sched_clock_stable();
}

static void __sched_clock_gtod_offset(void)
{
	struct sched_clock_data *scd = this_scd();

	__scd_stamp(scd);
	__gtod_offset = (scd->tick_raw + __sched_clock_offset) - scd->tick_gtod;
}

void __init sched_clock_init(void)
{
	/*
	 * Set __gtod_offset such that once we mark sched_clock_running,
	 * sched_clock_tick() continues where sched_clock() left off.
	 *
	 * Even if TSC is buggered, we're still UP at this point so it
	 * can't really be out of sync.
	 */
	local_irq_disable();
	__sched_clock_gtod_offset();
	local_irq_enable();

	static_branch_inc(&sched_clock_running);
}

/*
 * We run this as late_initcall() such that it runs after all built-in drivers,
 * notably: acpi_processor and intel_idle, which can mark the TSC as unstable.
 */
static int __init sched_clock_init_late(void)
{
	static_branch_inc(&sched_clock_running);
	/*
	 * Ensure that it is impossible to not do a static_key update.
	 *
	 * Either {set,clear}_sched_clock_stable() must see sched_clock_running
	 * and do the update, or we must see their __sched_clock_stable_early
	 * and do the update, or both.
	 */
	smp_mb(); /* matches {set,clear}_sched_clock_stable() */

	if (__sched_clock_stable_early)
		__set_sched_clock_stable();

	return 0;
}
late_initcall(sched_clock_init_late);

/*
 * min, max except they take wrapping into account
 */

static inline u64 wrap_min(u64 x, u64 y)
{
	return (s64)(x - y) < 0 ? x : y;
}

static inline u64 wrap_max(u64 x, u64 y)
{
	return (s64)(x - y) > 0 ? x : y;
}
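
/*
 * Worked example of the wrap-aware comparison (illustrative values): in
 * u64 arithmetic, wrap_max(1, U64_MAX) computes (s64)(1 - U64_MAX) == 2,
 * which is > 0, so it returns 1 -- a value that has just wrapped past zero
 * is still treated as "later" than one just below the wrap point, provided
 * the two are within 2^63 of each other.
 */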

/*
 * update the percpu scd from the raw @now value
 *
 *  - filter out backward motion
 *  - use the GTOD tick value to create a window to filter crazy TSC values
 */
static u64 sched_clock_local(struct sched_clock_data *scd)
{
	u64 now, clock, old_clock, min_clock, max_clock, gtod;
	s64 delta;

again:
	now = sched_clock();
	delta = now - scd->tick_raw;
	if (unlikely(delta < 0))
		delta = 0;

	old_clock = scd->clock;

	/*
	 * scd->clock = clamp(scd->tick_gtod + delta,
	 *		      max(scd->tick_gtod, scd->clock),
	 *		      scd->tick_gtod + TICK_NSEC);
	 */
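	/*
	 * Worked example of the clamp (illustrative numbers, HZ=1000 so
	 * TICK_NSEC is about 1,000,000): with gtod == 10,000,000,
	 * old_clock == 10,000,300 and a crazy delta of 5,000,000 the raw
	 * result would be 15,000,000, but the window is
	 * [10,000,300, 11,000,000], so it is clamped to 11,000,000.
	 * A delta of 0 lands below the window and is pulled up to
	 * old_clock, which preserves monotonicity.
	 */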

	gtod = scd->tick_gtod + __gtod_offset;
	clock = gtod + delta;
	min_clock = wrap_max(gtod, old_clock);
	max_clock = wrap_max(old_clock, gtod + TICK_NSEC);

	clock = wrap_max(clock, min_clock);
	clock = wrap_min(clock, max_clock);

	if (cmpxchg64(&scd->clock, old_clock, clock) != old_clock)
		goto again;

	return clock;
}

static u64 sched_clock_remote(struct sched_clock_data *scd)
{
	struct sched_clock_data *my_scd = this_scd();
	u64 this_clock, remote_clock;
	u64 *ptr, old_val, val;

#if BITS_PER_LONG != 64
again:
	/*
	 * Careful here: The local and the remote clock values need to
	 * be read out atomically as we need to compare the values and
	 * then update either the local or the remote side. So the
	 * cmpxchg64 below only protects one readout.
	 *
	 * We must reread via sched_clock_local() in the retry case on
	 * 32-bit kernels as an NMI could use sched_clock_local() via the
	 * tracer and hit between the readout of
	 * the low 32-bit and the high 32-bit portion.
	 */
	this_clock = sched_clock_local(my_scd);
	/*
	 * We must enforce atomic readout on 32-bit, otherwise the
	 * update on the remote CPU can hit in between the readout of
	 * the low 32-bit and the high 32-bit portion.
	 */
	remote_clock = cmpxchg64(&scd->clock, 0, 0);
#else
	/*
	 * On 64-bit kernels the read of [my]scd->clock is atomic versus the
	 * update, so we can avoid the above 32-bit dance.
	 */
	sched_clock_local(my_scd);
again:
	this_clock = my_scd->clock;
	remote_clock = scd->clock;
#endif

	/*
	 * Use the opportunity that we have both locks
	 * taken to couple the two clocks: we take the
	 * larger time as the latest time for both
	 * runqueues. (this creates monotonic movement)
	 */
	if (likely((s64)(remote_clock - this_clock) < 0)) {
		ptr = &scd->clock;
		old_val = remote_clock;
		val = this_clock;
	} else {
		/*
		 * Should be rare, but possible:
		 */
		ptr = &my_scd->clock;
		old_val = this_clock;
		val = remote_clock;
	}

	if (cmpxchg64(ptr, old_val, val) != old_val)
		goto again;

	return val;
}

/*
 * Similar to cpu_clock(), but requires local IRQs to be disabled.
 *
 * See cpu_clock().
 */
u64 sched_clock_cpu(int cpu)
{
	struct sched_clock_data *scd;
	u64 clock;

	if (sched_clock_stable())
		return sched_clock() + __sched_clock_offset;

	if (!static_branch_unlikely(&sched_clock_running))
		return sched_clock();

	preempt_disable_notrace();
	scd = cpu_sdc(cpu);

	if (cpu != smp_processor_id())
		clock = sched_clock_remote(scd);
	else
		clock = sched_clock_local(scd);
	preempt_enable_notrace();

	return clock;
}
EXPORT_SYMBOL_GPL(sched_clock_cpu);

void sched_clock_tick(void)
{
	struct sched_clock_data *scd;

	if (sched_clock_stable())
		return;

	if (!static_branch_unlikely(&sched_clock_running))
		return;

	lockdep_assert_irqs_disabled();

	scd = this_scd();
	__scd_stamp(scd);
	sched_clock_local(scd);
}

void sched_clock_tick_stable(void)
{
	if (!sched_clock_stable())
		return;

	/*
	 * Called under watchdog_lock.
	 *
	 * The watchdog just found this TSC to (still) be stable, so now is a
	 * good moment to update our __gtod_offset. Because once we find the
	 * TSC to be unstable, any computation will be computing crap.
	 */
	local_irq_disable();
	__sched_clock_gtod_offset();
	local_irq_enable();
}

/*
 * We are going deep-idle (irqs are disabled):
 */
void sched_clock_idle_sleep_event(void)
{
	sched_clock_cpu(smp_processor_id());
}
EXPORT_SYMBOL_GPL(sched_clock_idle_sleep_event);

/*
 * We just idled; resync with ktime.
 */
void sched_clock_idle_wakeup_event(void)
{
	unsigned long flags;

	if (sched_clock_stable())
		return;

	if (unlikely(timekeeping_suspended))
		return;

	local_irq_save(flags);
	sched_clock_tick();
	local_irq_restore(flags);
}
EXPORT_SYMBOL_GPL(sched_clock_idle_wakeup_event);

#else /* CONFIG_HAVE_UNSTABLE_SCHED_CLOCK */

void __init sched_clock_init(void)
{
	static_branch_inc(&sched_clock_running);
	local_irq_disable();
	generic_sched_clock_init();
	local_irq_enable();
}

u64 sched_clock_cpu(int cpu)
{
	if (!static_branch_unlikely(&sched_clock_running))
		return 0;

	return sched_clock();
}

#endif /* CONFIG_HAVE_UNSTABLE_SCHED_CLOCK */

/*
 * Running clock - returns the time that has elapsed while a guest has been
 * running.
 * On a guest this value should be local_clock() minus the time the guest was
 * suspended by the hypervisor (for any reason).
 * On bare metal this function should return the same as local_clock().
 * Architectures and sub-architectures can override this.
 */
u64 __weak running_clock(void)
{
	return local_clock();
}