1 // SPDX-License-Identifier: GPL-2.0
2 /*
3 * Copyright (C) 2015 Anton Ivanov (aivanov@{brocade.com,kot-begemot.co.uk})
4 * Copyright (C) 2015 Thomas Meyer (thomas@m3y3r.de)
5 * Copyright (C) 2012-2014 Cisco Systems
6 * Copyright (C) 2000 - 2007 Jeff Dike (jdike@{addtoit,linux.intel}.com)
7 * Copyright (C) 2019 Intel Corporation
8 */
9
10 #include <linux/clockchips.h>
11 #include <linux/init.h>
12 #include <linux/interrupt.h>
13 #include <linux/jiffies.h>
14 #include <linux/mm.h>
15 #include <linux/sched.h>
16 #include <linux/spinlock.h>
17 #include <linux/threads.h>
18 #include <asm/irq.h>
19 #include <asm/param.h>
20 #include <kern_util.h>
21 #include <os.h>
22 #include <linux/time-internal.h>
23 #include <linux/um_timetravel.h>
24 #include <shared/init.h>
25
26 #ifdef CONFIG_UML_TIME_TRAVEL_SUPPORT
27 enum time_travel_mode time_travel_mode;
28 EXPORT_SYMBOL_GPL(time_travel_mode);
29
30 static bool time_travel_start_set;
31 static unsigned long long time_travel_start;
32 static unsigned long long time_travel_time;
33 static LIST_HEAD(time_travel_events);
34 static LIST_HEAD(time_travel_irqs);
35 static unsigned long long time_travel_timer_interval;
36 static unsigned long long time_travel_next_event;
37 static struct time_travel_event time_travel_timer_event;
38 static int time_travel_ext_fd = -1;
39 static unsigned int time_travel_ext_waiting;
40 static bool time_travel_ext_prev_request_valid;
41 static unsigned long long time_travel_ext_prev_request;
42 static bool time_travel_ext_free_until_valid;
43 static unsigned long long time_travel_ext_free_until;
44
time_travel_set_time(unsigned long long ns)45 static void time_travel_set_time(unsigned long long ns)
46 {
47 if (unlikely(ns < time_travel_time))
48 panic("time-travel: time goes backwards %lld -> %lld\n",
49 time_travel_time, ns);
50 else if (unlikely(ns >= S64_MAX))
51 panic("The system was going to sleep forever, aborting");
52
53 time_travel_time = ns;
54 }
55
56 enum time_travel_message_handling {
57 TTMH_IDLE,
58 TTMH_POLL,
59 TTMH_READ,
60 };
61
time_travel_handle_message(struct um_timetravel_msg * msg,enum time_travel_message_handling mode)62 static void time_travel_handle_message(struct um_timetravel_msg *msg,
63 enum time_travel_message_handling mode)
64 {
65 struct um_timetravel_msg resp = {
66 .op = UM_TIMETRAVEL_ACK,
67 };
68 int ret;
69
70 /*
71 * We can't unlock here, but interrupt signals with a timetravel_handler
72 * (see um_request_irq_tt) get to the timetravel_handler anyway.
73 */
74 if (mode != TTMH_READ) {
75 BUG_ON(mode == TTMH_IDLE && !irqs_disabled());
76
77 while (os_poll(1, &time_travel_ext_fd) != 0) {
78 /* nothing */
79 }
80 }
81
82 ret = os_read_file(time_travel_ext_fd, msg, sizeof(*msg));
83
84 if (ret == 0)
85 panic("time-travel external link is broken\n");
86 if (ret != sizeof(*msg))
87 panic("invalid time-travel message - %d bytes\n", ret);
88
89 switch (msg->op) {
90 default:
91 WARN_ONCE(1, "time-travel: unexpected message %lld\n",
92 (unsigned long long)msg->op);
93 break;
94 case UM_TIMETRAVEL_ACK:
95 return;
96 case UM_TIMETRAVEL_RUN:
97 time_travel_set_time(msg->time);
98 break;
99 case UM_TIMETRAVEL_FREE_UNTIL:
100 time_travel_ext_free_until_valid = true;
101 time_travel_ext_free_until = msg->time;
102 break;
103 }
104
105 resp.seq = msg->seq;
106 os_write_file(time_travel_ext_fd, &resp, sizeof(resp));
107 }
108
time_travel_ext_req(u32 op,u64 time)109 static u64 time_travel_ext_req(u32 op, u64 time)
110 {
111 static int seq;
112 int mseq = ++seq;
113 struct um_timetravel_msg msg = {
114 .op = op,
115 .time = time,
116 .seq = mseq,
117 };
118
119 /*
120 * We need to block even the timetravel handlers of SIGIO here and
121 * only restore their use when we got the ACK - otherwise we may
122 * (will) get interrupted by that, try to queue the IRQ for future
123 * processing and thus send another request while we're still waiting
124 * for an ACK, but the peer doesn't know we got interrupted and will
125 * send the ACKs in the same order as the message, but we'd need to
126 * see them in the opposite order ...
127 *
128 * This wouldn't matter *too* much, but some ACKs carry the
129 * current time (for UM_TIMETRAVEL_GET) and getting another
130 * ACK without a time would confuse us a lot!
131 *
132 * The sequence number assignment that happens here lets us
133 * debug such message handling issues more easily.
134 */
135 block_signals_hard();
136 os_write_file(time_travel_ext_fd, &msg, sizeof(msg));
137
138 while (msg.op != UM_TIMETRAVEL_ACK)
139 time_travel_handle_message(&msg, TTMH_READ);
140
141 if (msg.seq != mseq)
142 panic("time-travel: ACK message has different seqno! op=%d, seq=%d != %d time=%lld\n",
143 msg.op, msg.seq, mseq, msg.time);
144
145 if (op == UM_TIMETRAVEL_GET)
146 time_travel_set_time(msg.time);
147 unblock_signals_hard();
148
149 return msg.time;
150 }
151
__time_travel_wait_readable(int fd)152 void __time_travel_wait_readable(int fd)
153 {
154 int fds[2] = { fd, time_travel_ext_fd };
155 int ret;
156
157 if (time_travel_mode != TT_MODE_EXTERNAL)
158 return;
159
160 while ((ret = os_poll(2, fds))) {
161 struct um_timetravel_msg msg;
162
163 if (ret == 1)
164 time_travel_handle_message(&msg, TTMH_READ);
165 }
166 }
167 EXPORT_SYMBOL_GPL(__time_travel_wait_readable);
168
time_travel_ext_update_request(unsigned long long time)169 static void time_travel_ext_update_request(unsigned long long time)
170 {
171 if (time_travel_mode != TT_MODE_EXTERNAL)
172 return;
173
174 /* asked for exactly this time previously */
175 if (time_travel_ext_prev_request_valid &&
176 time == time_travel_ext_prev_request)
177 return;
178
179 /*
180 * if we're running and are allowed to run past the request
181 * then we don't need to update it either
182 */
183 if (!time_travel_ext_waiting && time_travel_ext_free_until_valid &&
184 time < time_travel_ext_free_until)
185 return;
186
187 time_travel_ext_prev_request = time;
188 time_travel_ext_prev_request_valid = true;
189 time_travel_ext_req(UM_TIMETRAVEL_REQUEST, time);
190 }
191
__time_travel_propagate_time(void)192 void __time_travel_propagate_time(void)
193 {
194 static unsigned long long last_propagated;
195
196 if (last_propagated == time_travel_time)
197 return;
198
199 time_travel_ext_req(UM_TIMETRAVEL_UPDATE, time_travel_time);
200 last_propagated = time_travel_time;
201 }
202 EXPORT_SYMBOL_GPL(__time_travel_propagate_time);
203
204 /* returns true if we must do a wait to the simtime device */
time_travel_ext_request(unsigned long long time)205 static bool time_travel_ext_request(unsigned long long time)
206 {
207 /*
208 * If we received an external sync point ("free until") then we
209 * don't have to request/wait for anything until then, unless
210 * we're already waiting.
211 */
212 if (!time_travel_ext_waiting && time_travel_ext_free_until_valid &&
213 time < time_travel_ext_free_until)
214 return false;
215
216 time_travel_ext_update_request(time);
217 return true;
218 }
219
time_travel_ext_wait(bool idle)220 static void time_travel_ext_wait(bool idle)
221 {
222 struct um_timetravel_msg msg = {
223 .op = UM_TIMETRAVEL_ACK,
224 };
225
226 time_travel_ext_prev_request_valid = false;
227 time_travel_ext_free_until_valid = false;
228 time_travel_ext_waiting++;
229
230 time_travel_ext_req(UM_TIMETRAVEL_WAIT, -1);
231
232 /*
233 * Here we are deep in the idle loop, so we have to break out of the
234 * kernel abstraction in a sense and implement this in terms of the
235 * UML system waiting on the VQ interrupt while sleeping, when we get
236 * the signal it'll call time_travel_ext_vq_notify_done() completing the
237 * call.
238 */
239 while (msg.op != UM_TIMETRAVEL_RUN)
240 time_travel_handle_message(&msg, idle ? TTMH_IDLE : TTMH_POLL);
241
242 time_travel_ext_waiting--;
243
244 /* we might request more stuff while polling - reset when we run */
245 time_travel_ext_prev_request_valid = false;
246 }
247
time_travel_ext_get_time(void)248 static void time_travel_ext_get_time(void)
249 {
250 time_travel_ext_req(UM_TIMETRAVEL_GET, -1);
251 }
252
__time_travel_update_time(unsigned long long ns,bool idle)253 static void __time_travel_update_time(unsigned long long ns, bool idle)
254 {
255 if (time_travel_mode == TT_MODE_EXTERNAL && time_travel_ext_request(ns))
256 time_travel_ext_wait(idle);
257 else
258 time_travel_set_time(ns);
259 }
260
time_travel_first_event(void)261 static struct time_travel_event *time_travel_first_event(void)
262 {
263 return list_first_entry_or_null(&time_travel_events,
264 struct time_travel_event,
265 list);
266 }
267
__time_travel_add_event(struct time_travel_event * e,unsigned long long time)268 static void __time_travel_add_event(struct time_travel_event *e,
269 unsigned long long time)
270 {
271 struct time_travel_event *tmp;
272 bool inserted = false;
273 unsigned long flags;
274
275 if (e->pending)
276 return;
277
278 e->pending = true;
279 e->time = time;
280
281 local_irq_save(flags);
282 list_for_each_entry(tmp, &time_travel_events, list) {
283 /*
284 * Add the new entry before one with higher time,
285 * or if they're equal and both on stack, because
286 * in that case we need to unwind the stack in the
287 * right order, and the later event (timer sleep
288 * or such) must be dequeued first.
289 */
290 if ((tmp->time > e->time) ||
291 (tmp->time == e->time && tmp->onstack && e->onstack)) {
292 list_add_tail(&e->list, &tmp->list);
293 inserted = true;
294 break;
295 }
296 }
297
298 if (!inserted)
299 list_add_tail(&e->list, &time_travel_events);
300
301 tmp = time_travel_first_event();
302 time_travel_ext_update_request(tmp->time);
303 time_travel_next_event = tmp->time;
304 local_irq_restore(flags);
305 }
306
time_travel_add_event(struct time_travel_event * e,unsigned long long time)307 static void time_travel_add_event(struct time_travel_event *e,
308 unsigned long long time)
309 {
310 if (WARN_ON(!e->fn))
311 return;
312
313 __time_travel_add_event(e, time);
314 }
315
time_travel_add_event_rel(struct time_travel_event * e,unsigned long long delay_ns)316 void time_travel_add_event_rel(struct time_travel_event *e,
317 unsigned long long delay_ns)
318 {
319 time_travel_add_event(e, time_travel_time + delay_ns);
320 }
321
time_travel_periodic_timer(struct time_travel_event * e)322 void time_travel_periodic_timer(struct time_travel_event *e)
323 {
324 time_travel_add_event(&time_travel_timer_event,
325 time_travel_time + time_travel_timer_interval);
326 deliver_alarm();
327 }
328
deliver_time_travel_irqs(void)329 void deliver_time_travel_irqs(void)
330 {
331 struct time_travel_event *e;
332 unsigned long flags;
333
334 /*
335 * Don't do anything for most cases. Note that because here we have
336 * to disable IRQs (and re-enable later) we'll actually recurse at
337 * the end of the function, so this is strictly necessary.
338 */
339 if (likely(list_empty(&time_travel_irqs)))
340 return;
341
342 local_irq_save(flags);
343 irq_enter();
344 while ((e = list_first_entry_or_null(&time_travel_irqs,
345 struct time_travel_event,
346 list))) {
347 list_del(&e->list);
348 e->pending = false;
349 e->fn(e);
350 }
351 irq_exit();
352 local_irq_restore(flags);
353 }
354
time_travel_deliver_event(struct time_travel_event * e)355 static void time_travel_deliver_event(struct time_travel_event *e)
356 {
357 if (e == &time_travel_timer_event) {
358 /*
359 * deliver_alarm() does the irq_enter/irq_exit
360 * by itself, so must handle it specially here
361 */
362 e->fn(e);
363 } else if (irqs_disabled()) {
364 list_add_tail(&e->list, &time_travel_irqs);
365 /*
366 * set pending again, it was set to false when the
367 * event was deleted from the original list, but
368 * now it's still pending until we deliver the IRQ.
369 */
370 e->pending = true;
371 } else {
372 unsigned long flags;
373
374 local_irq_save(flags);
375 irq_enter();
376 e->fn(e);
377 irq_exit();
378 local_irq_restore(flags);
379 }
380 }
381
time_travel_del_event(struct time_travel_event * e)382 bool time_travel_del_event(struct time_travel_event *e)
383 {
384 unsigned long flags;
385
386 if (!e->pending)
387 return false;
388 local_irq_save(flags);
389 list_del(&e->list);
390 e->pending = false;
391 local_irq_restore(flags);
392 return true;
393 }
394
time_travel_update_time(unsigned long long next,bool idle)395 static void time_travel_update_time(unsigned long long next, bool idle)
396 {
397 struct time_travel_event ne = {
398 .onstack = true,
399 };
400 struct time_travel_event *e;
401 bool finished = idle;
402
403 /* add it without a handler - we deal with that specifically below */
404 __time_travel_add_event(&ne, next);
405
406 do {
407 e = time_travel_first_event();
408
409 BUG_ON(!e);
410 __time_travel_update_time(e->time, idle);
411
412 /* new events may have been inserted while we were waiting */
413 if (e == time_travel_first_event()) {
414 BUG_ON(!time_travel_del_event(e));
415 BUG_ON(time_travel_time != e->time);
416
417 if (e == &ne) {
418 finished = true;
419 } else {
420 if (e->onstack)
421 panic("On-stack event dequeued outside of the stack! time=%lld, event time=%lld, event=%pS\n",
422 time_travel_time, e->time, e);
423 time_travel_deliver_event(e);
424 }
425 }
426
427 e = time_travel_first_event();
428 if (e)
429 time_travel_ext_update_request(e->time);
430 } while (ne.pending && !finished);
431
432 time_travel_del_event(&ne);
433 }
434
time_travel_update_time_rel(unsigned long long offs)435 static void time_travel_update_time_rel(unsigned long long offs)
436 {
437 unsigned long flags;
438
439 /*
440 * Disable interrupts before calculating the new time so
441 * that a real timer interrupt (signal) can't happen at
442 * a bad time e.g. after we read time_travel_time but
443 * before we've completed updating the time.
444 */
445 local_irq_save(flags);
446 time_travel_update_time(time_travel_time + offs, false);
447 local_irq_restore(flags);
448 }
449
time_travel_ndelay(unsigned long nsec)450 void time_travel_ndelay(unsigned long nsec)
451 {
452 /*
453 * Not strictly needed to use _rel() version since this is
454 * only used in INFCPU/EXT modes, but it doesn't hurt and
455 * is more readable too.
456 */
457 time_travel_update_time_rel(nsec);
458 }
459 EXPORT_SYMBOL(time_travel_ndelay);
460
time_travel_add_irq_event(struct time_travel_event * e)461 void time_travel_add_irq_event(struct time_travel_event *e)
462 {
463 BUG_ON(time_travel_mode != TT_MODE_EXTERNAL);
464
465 time_travel_ext_get_time();
466 /*
467 * We could model interrupt latency here, for now just
468 * don't have any latency at all and request the exact
469 * same time (again) to run the interrupt...
470 */
471 time_travel_add_event(e, time_travel_time);
472 }
473 EXPORT_SYMBOL_GPL(time_travel_add_irq_event);
474
time_travel_oneshot_timer(struct time_travel_event * e)475 static void time_travel_oneshot_timer(struct time_travel_event *e)
476 {
477 deliver_alarm();
478 }
479
time_travel_sleep(void)480 void time_travel_sleep(void)
481 {
482 /*
483 * Wait "forever" (using S64_MAX because there are some potential
484 * wrapping issues, especially with the current TT_MODE_EXTERNAL
485 * controller application.
486 */
487 unsigned long long next = S64_MAX;
488
489 if (time_travel_mode == TT_MODE_BASIC)
490 os_timer_disable();
491
492 time_travel_update_time(next, true);
493
494 if (time_travel_mode == TT_MODE_BASIC &&
495 time_travel_timer_event.pending) {
496 if (time_travel_timer_event.fn == time_travel_periodic_timer) {
497 /*
498 * This is somewhat wrong - we should get the first
499 * one sooner like the os_timer_one_shot() below...
500 */
501 os_timer_set_interval(time_travel_timer_interval);
502 } else {
503 os_timer_one_shot(time_travel_timer_event.time - next);
504 }
505 }
506 }
507
time_travel_handle_real_alarm(void)508 static void time_travel_handle_real_alarm(void)
509 {
510 time_travel_set_time(time_travel_next_event);
511
512 time_travel_del_event(&time_travel_timer_event);
513
514 if (time_travel_timer_event.fn == time_travel_periodic_timer)
515 time_travel_add_event(&time_travel_timer_event,
516 time_travel_time +
517 time_travel_timer_interval);
518 }
519
time_travel_set_interval(unsigned long long interval)520 static void time_travel_set_interval(unsigned long long interval)
521 {
522 time_travel_timer_interval = interval;
523 }
524
time_travel_connect_external(const char * socket)525 static int time_travel_connect_external(const char *socket)
526 {
527 const char *sep;
528 unsigned long long id = (unsigned long long)-1;
529 int rc;
530
531 if ((sep = strchr(socket, ':'))) {
532 char buf[25] = {};
533 if (sep - socket > sizeof(buf) - 1)
534 goto invalid_number;
535
536 memcpy(buf, socket, sep - socket);
537 if (kstrtoull(buf, 0, &id)) {
538 invalid_number:
539 panic("time-travel: invalid external ID in string '%s'\n",
540 socket);
541 return -EINVAL;
542 }
543
544 socket = sep + 1;
545 }
546
547 rc = os_connect_socket(socket);
548 if (rc < 0) {
549 panic("time-travel: failed to connect to external socket %s\n",
550 socket);
551 return rc;
552 }
553
554 time_travel_ext_fd = rc;
555
556 time_travel_ext_req(UM_TIMETRAVEL_START, id);
557
558 return 1;
559 }
560
time_travel_set_start(void)561 static void time_travel_set_start(void)
562 {
563 if (time_travel_start_set)
564 return;
565
566 switch (time_travel_mode) {
567 case TT_MODE_EXTERNAL:
568 time_travel_start = time_travel_ext_req(UM_TIMETRAVEL_GET_TOD, -1);
569 /* controller gave us the *current* time, so adjust by that */
570 time_travel_ext_get_time();
571 time_travel_start -= time_travel_time;
572 break;
573 case TT_MODE_INFCPU:
574 case TT_MODE_BASIC:
575 if (!time_travel_start_set)
576 time_travel_start = os_persistent_clock_emulation();
577 break;
578 case TT_MODE_OFF:
579 /* we just read the host clock with os_persistent_clock_emulation() */
580 break;
581 }
582
583 time_travel_start_set = true;
584 }
585 #else /* CONFIG_UML_TIME_TRAVEL_SUPPORT */
586 #define time_travel_start_set 0
587 #define time_travel_start 0
588 #define time_travel_time 0
589 #define time_travel_ext_waiting 0
590
time_travel_update_time(unsigned long long ns,bool idle)591 static inline void time_travel_update_time(unsigned long long ns, bool idle)
592 {
593 }
594
time_travel_update_time_rel(unsigned long long offs)595 static inline void time_travel_update_time_rel(unsigned long long offs)
596 {
597 }
598
time_travel_handle_real_alarm(void)599 static inline void time_travel_handle_real_alarm(void)
600 {
601 }
602
time_travel_set_interval(unsigned long long interval)603 static void time_travel_set_interval(unsigned long long interval)
604 {
605 }
606
time_travel_set_start(void)607 static inline void time_travel_set_start(void)
608 {
609 }
610
611 /* fail link if this actually gets used */
612 extern u64 time_travel_ext_req(u32 op, u64 time);
613
614 /* these are empty macros so the struct/fn need not exist */
615 #define time_travel_add_event(e, time) do { } while (0)
616 /* externally not usable - redefine here so we can */
617 #undef time_travel_del_event
618 #define time_travel_del_event(e) do { } while (0)
619 #endif
620
timer_handler(int sig,struct siginfo * unused_si,struct uml_pt_regs * regs)621 void timer_handler(int sig, struct siginfo *unused_si, struct uml_pt_regs *regs)
622 {
623 unsigned long flags;
624
625 /*
626 * In basic time-travel mode we still get real interrupts
627 * (signals) but since we don't read time from the OS, we
628 * must update the simulated time here to the expiry when
629 * we get a signal.
630 * This is not the case in inf-cpu mode, since there we
631 * never get any real signals from the OS.
632 */
633 if (time_travel_mode == TT_MODE_BASIC)
634 time_travel_handle_real_alarm();
635
636 local_irq_save(flags);
637 do_IRQ(TIMER_IRQ, regs);
638 local_irq_restore(flags);
639 }
640
itimer_shutdown(struct clock_event_device * evt)641 static int itimer_shutdown(struct clock_event_device *evt)
642 {
643 if (time_travel_mode != TT_MODE_OFF)
644 time_travel_del_event(&time_travel_timer_event);
645
646 if (time_travel_mode != TT_MODE_INFCPU &&
647 time_travel_mode != TT_MODE_EXTERNAL)
648 os_timer_disable();
649
650 return 0;
651 }
652
itimer_set_periodic(struct clock_event_device * evt)653 static int itimer_set_periodic(struct clock_event_device *evt)
654 {
655 unsigned long long interval = NSEC_PER_SEC / HZ;
656
657 if (time_travel_mode != TT_MODE_OFF) {
658 time_travel_del_event(&time_travel_timer_event);
659 time_travel_set_event_fn(&time_travel_timer_event,
660 time_travel_periodic_timer);
661 time_travel_set_interval(interval);
662 time_travel_add_event(&time_travel_timer_event,
663 time_travel_time + interval);
664 }
665
666 if (time_travel_mode != TT_MODE_INFCPU &&
667 time_travel_mode != TT_MODE_EXTERNAL)
668 os_timer_set_interval(interval);
669
670 return 0;
671 }
672
itimer_next_event(unsigned long delta,struct clock_event_device * evt)673 static int itimer_next_event(unsigned long delta,
674 struct clock_event_device *evt)
675 {
676 delta += 1;
677
678 if (time_travel_mode != TT_MODE_OFF) {
679 time_travel_del_event(&time_travel_timer_event);
680 time_travel_set_event_fn(&time_travel_timer_event,
681 time_travel_oneshot_timer);
682 time_travel_add_event(&time_travel_timer_event,
683 time_travel_time + delta);
684 }
685
686 if (time_travel_mode != TT_MODE_INFCPU &&
687 time_travel_mode != TT_MODE_EXTERNAL)
688 return os_timer_one_shot(delta);
689
690 return 0;
691 }
692
itimer_one_shot(struct clock_event_device * evt)693 static int itimer_one_shot(struct clock_event_device *evt)
694 {
695 return itimer_next_event(0, evt);
696 }
697
698 static struct clock_event_device timer_clockevent = {
699 .name = "posix-timer",
700 .rating = 250,
701 .cpumask = cpu_possible_mask,
702 .features = CLOCK_EVT_FEAT_PERIODIC |
703 CLOCK_EVT_FEAT_ONESHOT,
704 .set_state_shutdown = itimer_shutdown,
705 .set_state_periodic = itimer_set_periodic,
706 .set_state_oneshot = itimer_one_shot,
707 .set_next_event = itimer_next_event,
708 .shift = 0,
709 .max_delta_ns = 0xffffffff,
710 .max_delta_ticks = 0xffffffff,
711 .min_delta_ns = TIMER_MIN_DELTA,
712 .min_delta_ticks = TIMER_MIN_DELTA, // microsecond resolution should be enough for anyone, same as 640K RAM
713 .irq = 0,
714 .mult = 1,
715 };
716
um_timer(int irq,void * dev)717 static irqreturn_t um_timer(int irq, void *dev)
718 {
719 if (get_current()->mm != NULL)
720 {
721 /* userspace - relay signal, results in correct userspace timers */
722 os_alarm_process(get_current()->mm->context.id.u.pid);
723 }
724
725 (*timer_clockevent.event_handler)(&timer_clockevent);
726
727 return IRQ_HANDLED;
728 }
729
timer_read(struct clocksource * cs)730 static u64 timer_read(struct clocksource *cs)
731 {
732 if (time_travel_mode != TT_MODE_OFF) {
733 /*
734 * We make reading the timer cost a bit so that we don't get
735 * stuck in loops that expect time to move more than the
736 * exact requested sleep amount, e.g. python's socket server,
737 * see https://bugs.python.org/issue37026.
738 *
739 * However, don't do that when we're in interrupt or such as
740 * then we might recurse into our own processing, and get to
741 * even more waiting, and that's not good - it messes up the
742 * "what do I do next" and onstack event we use to know when
743 * to return from time_travel_update_time().
744 */
745 if (!irqs_disabled() && !in_interrupt() && !in_softirq() &&
746 !time_travel_ext_waiting)
747 time_travel_update_time_rel(TIMER_MULTIPLIER);
748 return time_travel_time / TIMER_MULTIPLIER;
749 }
750
751 return os_nsecs() / TIMER_MULTIPLIER;
752 }
753
754 static struct clocksource timer_clocksource = {
755 .name = "timer",
756 .rating = 300,
757 .read = timer_read,
758 .mask = CLOCKSOURCE_MASK(64),
759 .flags = CLOCK_SOURCE_IS_CONTINUOUS,
760 };
761
um_timer_setup(void)762 static void __init um_timer_setup(void)
763 {
764 int err;
765
766 err = request_irq(TIMER_IRQ, um_timer, IRQF_TIMER, "hr timer", NULL);
767 if (err != 0)
768 printk(KERN_ERR "register_timer : request_irq failed - "
769 "errno = %d\n", -err);
770
771 err = os_timer_create();
772 if (err != 0) {
773 printk(KERN_ERR "creation of timer failed - errno = %d\n", -err);
774 return;
775 }
776
777 err = clocksource_register_hz(&timer_clocksource, NSEC_PER_SEC/TIMER_MULTIPLIER);
778 if (err) {
779 printk(KERN_ERR "clocksource_register_hz returned %d\n", err);
780 return;
781 }
782 clockevents_register_device(&timer_clockevent);
783 }
784
read_persistent_clock64(struct timespec64 * ts)785 void read_persistent_clock64(struct timespec64 *ts)
786 {
787 long long nsecs;
788
789 time_travel_set_start();
790
791 if (time_travel_mode != TT_MODE_OFF)
792 nsecs = time_travel_start + time_travel_time;
793 else
794 nsecs = os_persistent_clock_emulation();
795
796 set_normalized_timespec64(ts, nsecs / NSEC_PER_SEC,
797 nsecs % NSEC_PER_SEC);
798 }
799
time_init(void)800 void __init time_init(void)
801 {
802 timer_set_signal_handler();
803 late_time_init = um_timer_setup;
804 }
805
806 #ifdef CONFIG_UML_TIME_TRAVEL_SUPPORT
calibrate_delay_is_known(void)807 unsigned long calibrate_delay_is_known(void)
808 {
809 if (time_travel_mode == TT_MODE_INFCPU ||
810 time_travel_mode == TT_MODE_EXTERNAL)
811 return 1;
812 return 0;
813 }
814
setup_time_travel(char * str)815 int setup_time_travel(char *str)
816 {
817 if (strcmp(str, "=inf-cpu") == 0) {
818 time_travel_mode = TT_MODE_INFCPU;
819 timer_clockevent.name = "time-travel-timer-infcpu";
820 timer_clocksource.name = "time-travel-clock";
821 return 1;
822 }
823
824 if (strncmp(str, "=ext:", 5) == 0) {
825 time_travel_mode = TT_MODE_EXTERNAL;
826 timer_clockevent.name = "time-travel-timer-external";
827 timer_clocksource.name = "time-travel-clock-external";
828 return time_travel_connect_external(str + 5);
829 }
830
831 if (!*str) {
832 time_travel_mode = TT_MODE_BASIC;
833 timer_clockevent.name = "time-travel-timer";
834 timer_clocksource.name = "time-travel-clock";
835 return 1;
836 }
837
838 return -EINVAL;
839 }
840
841 __setup("time-travel", setup_time_travel);
842 __uml_help(setup_time_travel,
843 "time-travel\n"
844 "This option just enables basic time travel mode, in which the clock/timers\n"
845 "inside the UML instance skip forward when there's nothing to do, rather than\n"
846 "waiting for real time to elapse. However, instance CPU speed is limited by\n"
847 "the real CPU speed, so e.g. a 10ms timer will always fire after ~10ms wall\n"
848 "clock (but quicker when there's nothing to do).\n"
849 "\n"
850 "time-travel=inf-cpu\n"
851 "This enables time travel mode with infinite processing power, in which there\n"
852 "are no wall clock timers, and any CPU processing happens - as seen from the\n"
853 "guest - instantly. This can be useful for accurate simulation regardless of\n"
854 "debug overhead, physical CPU speed, etc. but is somewhat dangerous as it can\n"
855 "easily lead to getting stuck (e.g. if anything in the system busy loops).\n"
856 "\n"
857 "time-travel=ext:[ID:]/path/to/socket\n"
858 "This enables time travel mode similar to =inf-cpu, except the system will\n"
859 "use the given socket to coordinate with a central scheduler, in order to\n"
860 "have more than one system simultaneously be on simulated time. The virtio\n"
861 "driver code in UML knows about this so you can also simulate networks and\n"
862 "devices using it, assuming the device has the right capabilities.\n"
863 "The optional ID is a 64-bit integer that's sent to the central scheduler.\n");
864
setup_time_travel_start(char * str)865 int setup_time_travel_start(char *str)
866 {
867 int err;
868
869 err = kstrtoull(str, 0, &time_travel_start);
870 if (err)
871 return err;
872
873 time_travel_start_set = 1;
874 return 1;
875 }
876
877 __setup("time-travel-start", setup_time_travel_start);
878 __uml_help(setup_time_travel_start,
879 "time-travel-start=<seconds>\n"
880 "Configure the UML instance's wall clock to start at this value rather than\n"
881 "the host's wall clock at the time of UML boot.\n");
882 #endif
883