xref: /openbmc/qemu/util/qemu-timer.c (revision 5e437d3c)
1 /*
2  * QEMU System Emulator
3  *
4  * Copyright (c) 2003-2008 Fabrice Bellard
5  *
6  * Permission is hereby granted, free of charge, to any person obtaining a copy
7  * of this software and associated documentation files (the "Software"), to deal
8  * in the Software without restriction, including without limitation the rights
9  * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10  * copies of the Software, and to permit persons to whom the Software is
11  * furnished to do so, subject to the following conditions:
12  *
13  * The above copyright notice and this permission notice shall be included in
14  * all copies or substantial portions of the Software.
15  *
16  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
22  * THE SOFTWARE.
23  */
24 
25 #include "qemu/osdep.h"
26 #include "qemu/main-loop.h"
27 #include "qemu/timer.h"
28 #include "qemu/lockable.h"
29 #include "sysemu/cpu-timers.h"
30 #include "sysemu/replay.h"
31 #include "sysemu/cpus.h"
32 
33 #ifdef CONFIG_POSIX
34 #include <pthread.h>
35 #endif
36 
37 #ifdef CONFIG_PPOLL
38 #include <poll.h>
39 #endif
40 
41 #ifdef CONFIG_PRCTL_PR_SET_TIMERSLACK
42 #include <sys/prctl.h>
43 #endif
44 
45 /***********************************************************/
46 /* timers */
47 
48 typedef struct QEMUClock {
49     /* We rely on BQL to protect the timerlists */
50     QLIST_HEAD(, QEMUTimerList) timerlists;
51 
52     QEMUClockType type;
53     bool enabled;
54 } QEMUClock;
55 
56 QEMUTimerListGroup main_loop_tlg;
57 static QEMUClock qemu_clocks[QEMU_CLOCK_MAX];
58 
59 /* A QEMUTimerList is a list of timers attached to a clock. More
60  * than one QEMUTimerList can be attached to each clock, for instance
61  * used by different AioContexts / threads. Each clock also has
62  * a list of the QEMUTimerLists associated with it, in order that
63  * reenabling the clock can call all the notifiers.
64  */
65 
66 struct QEMUTimerList {
67     QEMUClock *clock;
68     QemuMutex active_timers_lock;
69     QEMUTimer *active_timers;
70     QLIST_ENTRY(QEMUTimerList) list;
71     QEMUTimerListNotifyCB *notify_cb;
72     void *notify_opaque;
73 
74     /* lightweight method to mark the end of timerlist's running */
75     QemuEvent timers_done_ev;
76 };
77 
78 /**
79  * qemu_clock_ptr:
80  * @type: type of clock
81  *
82  * Translate a clock type into a pointer to QEMUClock object.
83  *
84  * Returns: a pointer to the QEMUClock object
85  */
86 static inline QEMUClock *qemu_clock_ptr(QEMUClockType type)
87 {
88     return &qemu_clocks[type];
89 }
90 
91 static bool timer_expired_ns(QEMUTimer *timer_head, int64_t current_time)
92 {
93     return timer_head && (timer_head->expire_time <= current_time);
94 }
95 
96 QEMUTimerList *timerlist_new(QEMUClockType type,
97                              QEMUTimerListNotifyCB *cb,
98                              void *opaque)
99 {
100     QEMUTimerList *timer_list;
101     QEMUClock *clock = qemu_clock_ptr(type);
102 
103     timer_list = g_malloc0(sizeof(QEMUTimerList));
104     qemu_event_init(&timer_list->timers_done_ev, true);
105     timer_list->clock = clock;
106     timer_list->notify_cb = cb;
107     timer_list->notify_opaque = opaque;
108     qemu_mutex_init(&timer_list->active_timers_lock);
109     QLIST_INSERT_HEAD(&clock->timerlists, timer_list, list);
110     return timer_list;
111 }
112 
113 void timerlist_free(QEMUTimerList *timer_list)
114 {
115     assert(!timerlist_has_timers(timer_list));
116     if (timer_list->clock) {
117         QLIST_REMOVE(timer_list, list);
118     }
119     qemu_mutex_destroy(&timer_list->active_timers_lock);
120     g_free(timer_list);
121 }
122 
123 static void qemu_clock_init(QEMUClockType type, QEMUTimerListNotifyCB *notify_cb)
124 {
125     QEMUClock *clock = qemu_clock_ptr(type);
126 
127     /* Assert that the clock of type TYPE has not been initialized yet. */
128     assert(main_loop_tlg.tl[type] == NULL);
129 
130     clock->type = type;
131     clock->enabled = (type == QEMU_CLOCK_VIRTUAL ? false : true);
132     QLIST_INIT(&clock->timerlists);
133     main_loop_tlg.tl[type] = timerlist_new(type, notify_cb, NULL);
134 }
135 
136 bool qemu_clock_use_for_deadline(QEMUClockType type)
137 {
138     return !(icount_enabled() && (type == QEMU_CLOCK_VIRTUAL));
139 }
140 
141 void qemu_clock_notify(QEMUClockType type)
142 {
143     QEMUTimerList *timer_list;
144     QEMUClock *clock = qemu_clock_ptr(type);
145     QLIST_FOREACH(timer_list, &clock->timerlists, list) {
146         timerlist_notify(timer_list);
147     }
148 }
149 
150 /* Disabling the clock will wait for related timerlists to stop
151  * executing qemu_run_timers.  Thus, this functions should not
152  * be used from the callback of a timer that is based on @clock.
153  * Doing so would cause a deadlock.
154  *
155  * Caller should hold BQL.
156  */
157 void qemu_clock_enable(QEMUClockType type, bool enabled)
158 {
159     QEMUClock *clock = qemu_clock_ptr(type);
160     QEMUTimerList *tl;
161     bool old = clock->enabled;
162     clock->enabled = enabled;
163     if (enabled && !old) {
164         qemu_clock_notify(type);
165     } else if (!enabled && old) {
166         QLIST_FOREACH(tl, &clock->timerlists, list) {
167             qemu_event_wait(&tl->timers_done_ev);
168         }
169     }
170 }
171 
172 bool timerlist_has_timers(QEMUTimerList *timer_list)
173 {
174     return !!qatomic_read(&timer_list->active_timers);
175 }
176 
177 bool qemu_clock_has_timers(QEMUClockType type)
178 {
179     return timerlist_has_timers(
180         main_loop_tlg.tl[type]);
181 }
182 
183 bool timerlist_expired(QEMUTimerList *timer_list)
184 {
185     int64_t expire_time;
186 
187     if (!qatomic_read(&timer_list->active_timers)) {
188         return false;
189     }
190 
191     WITH_QEMU_LOCK_GUARD(&timer_list->active_timers_lock) {
192         if (!timer_list->active_timers) {
193             return false;
194         }
195         expire_time = timer_list->active_timers->expire_time;
196     }
197 
198     return expire_time <= qemu_clock_get_ns(timer_list->clock->type);
199 }
200 
201 bool qemu_clock_expired(QEMUClockType type)
202 {
203     return timerlist_expired(
204         main_loop_tlg.tl[type]);
205 }
206 
207 /*
208  * As above, but return -1 for no deadline, and do not cap to 2^32
209  * as we know the result is always positive.
210  */
211 
212 int64_t timerlist_deadline_ns(QEMUTimerList *timer_list)
213 {
214     int64_t delta;
215     int64_t expire_time;
216 
217     if (!qatomic_read(&timer_list->active_timers)) {
218         return -1;
219     }
220 
221     if (!timer_list->clock->enabled) {
222         return -1;
223     }
224 
225     /* The active timers list may be modified before the caller uses our return
226      * value but ->notify_cb() is called when the deadline changes.  Therefore
227      * the caller should notice the change and there is no race condition.
228      */
229     WITH_QEMU_LOCK_GUARD(&timer_list->active_timers_lock) {
230         if (!timer_list->active_timers) {
231             return -1;
232         }
233         expire_time = timer_list->active_timers->expire_time;
234     }
235 
236     delta = expire_time - qemu_clock_get_ns(timer_list->clock->type);
237 
238     if (delta <= 0) {
239         return 0;
240     }
241 
242     return delta;
243 }
244 
245 /*
246  * Returns the time remaining for the deadline, in ms.
247  */
248 int64_t timer_deadline_ms(QEMUTimer *timer)
249 {
250     if (timer_pending(timer)) {
251         return qemu_timeout_ns_to_ms(timer->expire_time) -
252                qemu_clock_get_ms(timer->timer_list->clock->type);
253     }
254 
255     return 0;
256 }
257 
258 /* Calculate the soonest deadline across all timerlists attached
259  * to the clock. This is used for the icount timeout so we
260  * ignore whether or not the clock should be used in deadline
261  * calculations.
262  */
263 int64_t qemu_clock_deadline_ns_all(QEMUClockType type, int attr_mask)
264 {
265     int64_t deadline = -1;
266     int64_t delta;
267     int64_t expire_time;
268     QEMUTimer *ts;
269     QEMUTimerList *timer_list;
270     QEMUClock *clock = qemu_clock_ptr(type);
271 
272     if (!clock->enabled) {
273         return -1;
274     }
275 
276     QLIST_FOREACH(timer_list, &clock->timerlists, list) {
277         qemu_mutex_lock(&timer_list->active_timers_lock);
278         ts = timer_list->active_timers;
279         /* Skip all external timers */
280         while (ts && (ts->attributes & ~attr_mask)) {
281             ts = ts->next;
282         }
283         if (!ts) {
284             qemu_mutex_unlock(&timer_list->active_timers_lock);
285             continue;
286         }
287         expire_time = ts->expire_time;
288         qemu_mutex_unlock(&timer_list->active_timers_lock);
289 
290         delta = expire_time - qemu_clock_get_ns(type);
291         if (delta <= 0) {
292             delta = 0;
293         }
294         deadline = qemu_soonest_timeout(deadline, delta);
295     }
296     return deadline;
297 }
298 
299 QEMUClockType timerlist_get_clock(QEMUTimerList *timer_list)
300 {
301     return timer_list->clock->type;
302 }
303 
304 QEMUTimerList *qemu_clock_get_main_loop_timerlist(QEMUClockType type)
305 {
306     return main_loop_tlg.tl[type];
307 }
308 
309 void timerlist_notify(QEMUTimerList *timer_list)
310 {
311     if (timer_list->notify_cb) {
312         timer_list->notify_cb(timer_list->notify_opaque, timer_list->clock->type);
313     } else {
314         qemu_notify_event();
315     }
316 }
317 
318 /* Transition function to convert a nanosecond timeout to ms
319  * This is used where a system does not support ppoll
320  */
321 int qemu_timeout_ns_to_ms(int64_t ns)
322 {
323     int64_t ms;
324     if (ns < 0) {
325         return -1;
326     }
327 
328     if (!ns) {
329         return 0;
330     }
331 
332     /* Always round up, because it's better to wait too long than to wait too
333      * little and effectively busy-wait
334      */
335     ms = DIV_ROUND_UP(ns, SCALE_MS);
336 
337     /* To avoid overflow problems, limit this to 2^31, i.e. approx 25 days */
338     return MIN(ms, INT32_MAX);
339 }
340 
341 
342 /* qemu implementation of g_poll which uses a nanosecond timeout but is
343  * otherwise identical to g_poll
344  */
345 int qemu_poll_ns(GPollFD *fds, guint nfds, int64_t timeout)
346 {
347 #ifdef CONFIG_PPOLL
348     if (timeout < 0) {
349         return ppoll((struct pollfd *)fds, nfds, NULL, NULL);
350     } else {
351         struct timespec ts;
352         int64_t tvsec = timeout / 1000000000LL;
353         /* Avoid possibly overflowing and specifying a negative number of
354          * seconds, which would turn a very long timeout into a busy-wait.
355          */
356         if (tvsec > (int64_t)INT32_MAX) {
357             tvsec = INT32_MAX;
358         }
359         ts.tv_sec = tvsec;
360         ts.tv_nsec = timeout % 1000000000LL;
361         return ppoll((struct pollfd *)fds, nfds, &ts, NULL);
362     }
363 #else
364     return g_poll(fds, nfds, qemu_timeout_ns_to_ms(timeout));
365 #endif
366 }
367 
368 
369 void timer_init_full(QEMUTimer *ts,
370                      QEMUTimerListGroup *timer_list_group, QEMUClockType type,
371                      int scale, int attributes,
372                      QEMUTimerCB *cb, void *opaque)
373 {
374     if (!timer_list_group) {
375         timer_list_group = &main_loop_tlg;
376     }
377     ts->timer_list = timer_list_group->tl[type];
378     ts->cb = cb;
379     ts->opaque = opaque;
380     ts->scale = scale;
381     ts->attributes = attributes;
382     ts->expire_time = -1;
383 }
384 
385 void timer_deinit(QEMUTimer *ts)
386 {
387     assert(ts->expire_time == -1);
388     ts->timer_list = NULL;
389 }
390 
391 static void timer_del_locked(QEMUTimerList *timer_list, QEMUTimer *ts)
392 {
393     QEMUTimer **pt, *t;
394 
395     ts->expire_time = -1;
396     pt = &timer_list->active_timers;
397     for(;;) {
398         t = *pt;
399         if (!t)
400             break;
401         if (t == ts) {
402             qatomic_set(pt, t->next);
403             break;
404         }
405         pt = &t->next;
406     }
407 }
408 
409 static bool timer_mod_ns_locked(QEMUTimerList *timer_list,
410                                 QEMUTimer *ts, int64_t expire_time)
411 {
412     QEMUTimer **pt, *t;
413 
414     /* add the timer in the sorted list */
415     pt = &timer_list->active_timers;
416     for (;;) {
417         t = *pt;
418         if (!timer_expired_ns(t, expire_time)) {
419             break;
420         }
421         pt = &t->next;
422     }
423     ts->expire_time = MAX(expire_time, 0);
424     ts->next = *pt;
425     qatomic_set(pt, ts);
426 
427     return pt == &timer_list->active_timers;
428 }
429 
430 static void timerlist_rearm(QEMUTimerList *timer_list)
431 {
432     /* Interrupt execution to force deadline recalculation.  */
433     if (icount_enabled() && timer_list->clock->type == QEMU_CLOCK_VIRTUAL) {
434         icount_start_warp_timer();
435     }
436     timerlist_notify(timer_list);
437 }
438 
439 /* stop a timer, but do not dealloc it */
440 void timer_del(QEMUTimer *ts)
441 {
442     QEMUTimerList *timer_list = ts->timer_list;
443 
444     if (timer_list) {
445         qemu_mutex_lock(&timer_list->active_timers_lock);
446         timer_del_locked(timer_list, ts);
447         qemu_mutex_unlock(&timer_list->active_timers_lock);
448     }
449 }
450 
451 /* modify the current timer so that it will be fired when current_time
452    >= expire_time. The corresponding callback will be called. */
453 void timer_mod_ns(QEMUTimer *ts, int64_t expire_time)
454 {
455     QEMUTimerList *timer_list = ts->timer_list;
456     bool rearm;
457 
458     qemu_mutex_lock(&timer_list->active_timers_lock);
459     timer_del_locked(timer_list, ts);
460     rearm = timer_mod_ns_locked(timer_list, ts, expire_time);
461     qemu_mutex_unlock(&timer_list->active_timers_lock);
462 
463     if (rearm) {
464         timerlist_rearm(timer_list);
465     }
466 }
467 
468 /* modify the current timer so that it will be fired when current_time
469    >= expire_time or the current deadline, whichever comes earlier.
470    The corresponding callback will be called. */
471 void timer_mod_anticipate_ns(QEMUTimer *ts, int64_t expire_time)
472 {
473     QEMUTimerList *timer_list = ts->timer_list;
474     bool rearm;
475 
476     WITH_QEMU_LOCK_GUARD(&timer_list->active_timers_lock) {
477         if (ts->expire_time == -1 || ts->expire_time > expire_time) {
478             if (ts->expire_time != -1) {
479                 timer_del_locked(timer_list, ts);
480             }
481             rearm = timer_mod_ns_locked(timer_list, ts, expire_time);
482         } else {
483             rearm = false;
484         }
485     }
486     if (rearm) {
487         timerlist_rearm(timer_list);
488     }
489 }
490 
491 void timer_mod(QEMUTimer *ts, int64_t expire_time)
492 {
493     timer_mod_ns(ts, expire_time * ts->scale);
494 }
495 
496 void timer_mod_anticipate(QEMUTimer *ts, int64_t expire_time)
497 {
498     timer_mod_anticipate_ns(ts, expire_time * ts->scale);
499 }
500 
501 bool timer_pending(QEMUTimer *ts)
502 {
503     return ts->expire_time >= 0;
504 }
505 
506 bool timer_expired(QEMUTimer *timer_head, int64_t current_time)
507 {
508     return timer_expired_ns(timer_head, current_time * timer_head->scale);
509 }
510 
511 bool timerlist_run_timers(QEMUTimerList *timer_list)
512 {
513     QEMUTimer *ts;
514     int64_t current_time;
515     bool progress = false;
516     QEMUTimerCB *cb;
517     void *opaque;
518 
519     if (!qatomic_read(&timer_list->active_timers)) {
520         return false;
521     }
522 
523     qemu_event_reset(&timer_list->timers_done_ev);
524     if (!timer_list->clock->enabled) {
525         goto out;
526     }
527 
528     switch (timer_list->clock->type) {
529     case QEMU_CLOCK_REALTIME:
530         break;
531     default:
532     case QEMU_CLOCK_VIRTUAL:
533         break;
534     case QEMU_CLOCK_HOST:
535         if (!replay_checkpoint(CHECKPOINT_CLOCK_HOST)) {
536             goto out;
537         }
538         break;
539     case QEMU_CLOCK_VIRTUAL_RT:
540         if (!replay_checkpoint(CHECKPOINT_CLOCK_VIRTUAL_RT)) {
541             goto out;
542         }
543         break;
544     }
545 
546     /*
547      * Extract expired timers from active timers list and process them.
548      *
549      * In rr mode we need "filtered" checkpointing for virtual clock.  The
550      * checkpoint must be recorded/replayed before processing any non-EXTERNAL timer,
551      * and that must only be done once since the clock value stays the same. Because
552      * non-EXTERNAL timers may appear in the timers list while it being processed,
553      * the checkpoint can be issued at a time until no timers are left and we are
554      * done".
555      */
556     current_time = qemu_clock_get_ns(timer_list->clock->type);
557     qemu_mutex_lock(&timer_list->active_timers_lock);
558     while ((ts = timer_list->active_timers)) {
559         if (!timer_expired_ns(ts, current_time)) {
560             /* No expired timers left.  The checkpoint can be skipped
561              * if no timers fired or they were all external.
562              */
563             break;
564         }
565         /* Checkpoint for virtual clock is redundant in cases where
566          * it's being triggered with only non-EXTERNAL timers, because
567          * these timers don't change guest state directly.
568          */
569         if (replay_mode != REPLAY_MODE_NONE
570             && timer_list->clock->type == QEMU_CLOCK_VIRTUAL
571             && !(ts->attributes & QEMU_TIMER_ATTR_EXTERNAL)
572             && !replay_checkpoint(CHECKPOINT_CLOCK_VIRTUAL)) {
573             qemu_mutex_unlock(&timer_list->active_timers_lock);
574             goto out;
575         }
576 
577         /* remove timer from the list before calling the callback */
578         timer_list->active_timers = ts->next;
579         ts->next = NULL;
580         ts->expire_time = -1;
581         cb = ts->cb;
582         opaque = ts->opaque;
583 
584         /* run the callback (the timer list can be modified) */
585         qemu_mutex_unlock(&timer_list->active_timers_lock);
586         cb(opaque);
587         qemu_mutex_lock(&timer_list->active_timers_lock);
588 
589         progress = true;
590     }
591     qemu_mutex_unlock(&timer_list->active_timers_lock);
592 
593 out:
594     qemu_event_set(&timer_list->timers_done_ev);
595     return progress;
596 }
597 
598 bool qemu_clock_run_timers(QEMUClockType type)
599 {
600     return timerlist_run_timers(main_loop_tlg.tl[type]);
601 }
602 
603 void timerlistgroup_init(QEMUTimerListGroup *tlg,
604                          QEMUTimerListNotifyCB *cb, void *opaque)
605 {
606     QEMUClockType type;
607     for (type = 0; type < QEMU_CLOCK_MAX; type++) {
608         tlg->tl[type] = timerlist_new(type, cb, opaque);
609     }
610 }
611 
612 void timerlistgroup_deinit(QEMUTimerListGroup *tlg)
613 {
614     QEMUClockType type;
615     for (type = 0; type < QEMU_CLOCK_MAX; type++) {
616         timerlist_free(tlg->tl[type]);
617     }
618 }
619 
620 bool timerlistgroup_run_timers(QEMUTimerListGroup *tlg)
621 {
622     QEMUClockType type;
623     bool progress = false;
624     for (type = 0; type < QEMU_CLOCK_MAX; type++) {
625         progress |= timerlist_run_timers(tlg->tl[type]);
626     }
627     return progress;
628 }
629 
630 int64_t timerlistgroup_deadline_ns(QEMUTimerListGroup *tlg)
631 {
632     int64_t deadline = -1;
633     QEMUClockType type;
634     for (type = 0; type < QEMU_CLOCK_MAX; type++) {
635         if (qemu_clock_use_for_deadline(type)) {
636             deadline = qemu_soonest_timeout(deadline,
637                                             timerlist_deadline_ns(tlg->tl[type]));
638         }
639     }
640     return deadline;
641 }
642 
643 int64_t qemu_clock_get_ns(QEMUClockType type)
644 {
645     switch (type) {
646     case QEMU_CLOCK_REALTIME:
647         return get_clock();
648     default:
649     case QEMU_CLOCK_VIRTUAL:
650         return cpus_get_virtual_clock();
651     case QEMU_CLOCK_HOST:
652         return REPLAY_CLOCK(REPLAY_CLOCK_HOST, get_clock_realtime());
653     case QEMU_CLOCK_VIRTUAL_RT:
654         return REPLAY_CLOCK(REPLAY_CLOCK_VIRTUAL_RT, cpu_get_clock());
655     }
656 }
657 
658 void init_clocks(QEMUTimerListNotifyCB *notify_cb)
659 {
660     QEMUClockType type;
661     for (type = 0; type < QEMU_CLOCK_MAX; type++) {
662         qemu_clock_init(type, notify_cb);
663     }
664 
665 #ifdef CONFIG_PRCTL_PR_SET_TIMERSLACK
666     prctl(PR_SET_TIMERSLACK, 1, 0, 0, 0);
667 #endif
668 }
669 
670 uint64_t timer_expire_time_ns(QEMUTimer *ts)
671 {
672     return timer_pending(ts) ? ts->expire_time : -1;
673 }
674 
675 bool qemu_clock_run_all_timers(void)
676 {
677     bool progress = false;
678     QEMUClockType type;
679 
680     for (type = 0; type < QEMU_CLOCK_MAX; type++) {
681         if (qemu_clock_use_for_deadline(type)) {
682             progress |= qemu_clock_run_timers(type);
683         }
684     }
685 
686     return progress;
687 }
688