1 // SPDX-License-Identifier: GPL-2.0
2 /*
3  * Copyright (C) 2015 Anton Ivanov (aivanov@{brocade.com,kot-begemot.co.uk})
4  * Copyright (C) 2015 Thomas Meyer (thomas@m3y3r.de)
5  * Copyright (C) 2012-2014 Cisco Systems
6  * Copyright (C) 2000 - 2007 Jeff Dike (jdike@{addtoit,linux.intel}.com)
7  * Copyright (C) 2019 Intel Corporation
8  */
9 
10 #include <linux/clockchips.h>
11 #include <linux/init.h>
12 #include <linux/interrupt.h>
13 #include <linux/jiffies.h>
14 #include <linux/mm.h>
15 #include <linux/sched.h>
16 #include <linux/spinlock.h>
17 #include <linux/threads.h>
18 #include <asm/irq.h>
19 #include <asm/param.h>
20 #include <kern_util.h>
21 #include <os.h>
22 #include <linux/delay.h>
23 #include <linux/time-internal.h>
24 #include <linux/um_timetravel.h>
25 #include <shared/init.h>
26 
27 #ifdef CONFIG_UML_TIME_TRAVEL_SUPPORT
28 enum time_travel_mode time_travel_mode;
29 EXPORT_SYMBOL_GPL(time_travel_mode);
30 
31 static bool time_travel_start_set;
32 static unsigned long long time_travel_start;
33 static unsigned long long time_travel_time;
34 static unsigned long long time_travel_shm_offset;
35 static LIST_HEAD(time_travel_events);
36 static LIST_HEAD(time_travel_irqs);
37 static unsigned long long time_travel_timer_interval;
38 static unsigned long long time_travel_next_event;
39 static struct time_travel_event time_travel_timer_event;
40 static int time_travel_ext_fd = -1;
41 static unsigned int time_travel_ext_waiting;
42 static bool time_travel_ext_prev_request_valid;
43 static unsigned long long time_travel_ext_prev_request;
44 static unsigned long long *time_travel_ext_free_until;
45 static unsigned long long _time_travel_ext_free_until;
46 static u16 time_travel_shm_id;
47 static struct um_timetravel_schedshm *time_travel_shm;
48 static union um_timetravel_schedshm_client *time_travel_shm_client;
49 
time_travel_set_time(unsigned long long ns)50 static void time_travel_set_time(unsigned long long ns)
51 {
52 	if (unlikely(ns < time_travel_time))
53 		panic("time-travel: time goes backwards %lld -> %lld\n",
54 		      time_travel_time, ns);
55 	else if (unlikely(ns >= S64_MAX))
56 		panic("The system was going to sleep forever, aborting");
57 
58 	time_travel_time = ns;
59 }
60 
61 enum time_travel_message_handling {
62 	TTMH_IDLE,
63 	TTMH_POLL,
64 	TTMH_READ,
65 	TTMH_READ_START_ACK,
66 };
67 
68 static u64 bc_message;
69 int time_travel_should_print_bc_msg;
70 
_time_travel_print_bc_msg(void)71 void _time_travel_print_bc_msg(void)
72 {
73 	time_travel_should_print_bc_msg = 0;
74 	printk(KERN_INFO "time-travel: received broadcast 0x%llx\n", bc_message);
75 }
76 
time_travel_setup_shm(int fd,u16 id)77 static void time_travel_setup_shm(int fd, u16 id)
78 {
79 	u32 len;
80 
81 	time_travel_shm = os_mmap_rw_shared(fd, sizeof(*time_travel_shm));
82 
83 	if (!time_travel_shm)
84 		goto out;
85 
86 	len = time_travel_shm->len;
87 
88 	if (time_travel_shm->version != UM_TIMETRAVEL_SCHEDSHM_VERSION ||
89 	    len < struct_size(time_travel_shm, clients, id + 1)) {
90 		os_unmap_memory(time_travel_shm, sizeof(*time_travel_shm));
91 		time_travel_shm = NULL;
92 		goto out;
93 	}
94 
95 	time_travel_shm = os_mremap_rw_shared(time_travel_shm,
96 					      sizeof(*time_travel_shm),
97 					      len);
98 	if (!time_travel_shm)
99 		goto out;
100 
101 	time_travel_shm_offset = time_travel_shm->current_time;
102 	time_travel_shm_client = &time_travel_shm->clients[id];
103 	time_travel_shm_client->capa |= UM_TIMETRAVEL_SCHEDSHM_CAP_TIME_SHARE;
104 	time_travel_shm_id = id;
105 	/* always look at that free_until from now on */
106 	time_travel_ext_free_until = &time_travel_shm->free_until;
107 out:
108 	os_close_file(fd);
109 }
110 
time_travel_handle_message(struct um_timetravel_msg * msg,enum time_travel_message_handling mode)111 static void time_travel_handle_message(struct um_timetravel_msg *msg,
112 				       enum time_travel_message_handling mode)
113 {
114 	struct um_timetravel_msg resp = {
115 		.op = UM_TIMETRAVEL_ACK,
116 	};
117 	int ret;
118 
119 	/*
120 	 * We can't unlock here, but interrupt signals with a timetravel_handler
121 	 * (see um_request_irq_tt) get to the timetravel_handler anyway.
122 	 */
123 	if (mode != TTMH_READ) {
124 		BUG_ON(mode == TTMH_IDLE && !irqs_disabled());
125 
126 		while (os_poll(1, &time_travel_ext_fd) != 0) {
127 			/* nothing */
128 		}
129 	}
130 
131 	if (unlikely(mode == TTMH_READ_START_ACK)) {
132 		int fd[UM_TIMETRAVEL_SHARED_MAX_FDS];
133 
134 		ret = os_rcv_fd_msg(time_travel_ext_fd, fd,
135 				    ARRAY_SIZE(fd), msg, sizeof(*msg));
136 		if (ret == sizeof(*msg)) {
137 			time_travel_setup_shm(fd[UM_TIMETRAVEL_SHARED_MEMFD],
138 					      msg->time & UM_TIMETRAVEL_START_ACK_ID);
139 			/* we don't use the logging for now */
140 			os_close_file(fd[UM_TIMETRAVEL_SHARED_LOGFD]);
141 		}
142 	} else {
143 		ret = os_read_file(time_travel_ext_fd, msg, sizeof(*msg));
144 	}
145 
146 	if (ret == 0)
147 		panic("time-travel external link is broken\n");
148 	if (ret != sizeof(*msg))
149 		panic("invalid time-travel message - %d bytes\n", ret);
150 
151 	switch (msg->op) {
152 	default:
153 		WARN_ONCE(1, "time-travel: unexpected message %lld\n",
154 			  (unsigned long long)msg->op);
155 		break;
156 	case UM_TIMETRAVEL_ACK:
157 		return;
158 	case UM_TIMETRAVEL_RUN:
159 		time_travel_set_time(msg->time);
160 		if (time_travel_shm) {
161 			/* no request right now since we're running */
162 			time_travel_shm_client->flags &=
163 				~UM_TIMETRAVEL_SCHEDSHM_FLAGS_REQ_RUN;
164 			/* no ack for shared memory RUN */
165 			return;
166 		}
167 		break;
168 	case UM_TIMETRAVEL_FREE_UNTIL:
169 		/* not supposed to get this with shm, but ignore it */
170 		if (time_travel_shm)
171 			break;
172 		time_travel_ext_free_until = &_time_travel_ext_free_until;
173 		_time_travel_ext_free_until = msg->time;
174 		break;
175 	case UM_TIMETRAVEL_BROADCAST:
176 		bc_message = msg->time;
177 		time_travel_should_print_bc_msg = 1;
178 		break;
179 	}
180 
181 	resp.seq = msg->seq;
182 	os_write_file(time_travel_ext_fd, &resp, sizeof(resp));
183 }
184 
time_travel_ext_req(u32 op,u64 time)185 static u64 time_travel_ext_req(u32 op, u64 time)
186 {
187 	static int seq;
188 	int mseq = ++seq;
189 	struct um_timetravel_msg msg = {
190 		.op = op,
191 		.time = time,
192 		.seq = mseq,
193 	};
194 
195 	/*
196 	 * We need to block even the timetravel handlers of SIGIO here and
197 	 * only restore their use when we got the ACK - otherwise we may
198 	 * (will) get interrupted by that, try to queue the IRQ for future
199 	 * processing and thus send another request while we're still waiting
200 	 * for an ACK, but the peer doesn't know we got interrupted and will
201 	 * send the ACKs in the same order as the message, but we'd need to
202 	 * see them in the opposite order ...
203 	 *
204 	 * This wouldn't matter *too* much, but some ACKs carry the
205 	 * current time (for UM_TIMETRAVEL_GET) and getting another
206 	 * ACK without a time would confuse us a lot!
207 	 *
208 	 * The sequence number assignment that happens here lets us
209 	 * debug such message handling issues more easily.
210 	 */
211 	block_signals_hard();
212 	os_write_file(time_travel_ext_fd, &msg, sizeof(msg));
213 
214 	/* no ACK expected for WAIT in shared memory mode */
215 	if (msg.op == UM_TIMETRAVEL_WAIT && time_travel_shm)
216 		goto done;
217 
218 	while (msg.op != UM_TIMETRAVEL_ACK)
219 		time_travel_handle_message(&msg,
220 					   op == UM_TIMETRAVEL_START ?
221 						TTMH_READ_START_ACK :
222 						TTMH_READ);
223 
224 	if (msg.seq != mseq)
225 		panic("time-travel: ACK message has different seqno! op=%d, seq=%d != %d time=%lld\n",
226 		      msg.op, msg.seq, mseq, msg.time);
227 
228 	if (op == UM_TIMETRAVEL_GET)
229 		time_travel_set_time(msg.time);
230 done:
231 	unblock_signals_hard();
232 
233 	return msg.time;
234 }
235 
__time_travel_wait_readable(int fd)236 void __time_travel_wait_readable(int fd)
237 {
238 	int fds[2] = { fd, time_travel_ext_fd };
239 	int ret;
240 
241 	if (time_travel_mode != TT_MODE_EXTERNAL)
242 		return;
243 
244 	while ((ret = os_poll(2, fds))) {
245 		struct um_timetravel_msg msg;
246 
247 		if (ret == 1)
248 			time_travel_handle_message(&msg, TTMH_READ);
249 	}
250 }
251 EXPORT_SYMBOL_GPL(__time_travel_wait_readable);
252 
time_travel_ext_update_request(unsigned long long time)253 static void time_travel_ext_update_request(unsigned long long time)
254 {
255 	if (time_travel_mode != TT_MODE_EXTERNAL)
256 		return;
257 
258 	/* asked for exactly this time previously */
259 	if (time_travel_ext_prev_request_valid &&
260 	    time == time_travel_ext_prev_request)
261 		return;
262 
263 	/*
264 	 * if we're running and are allowed to run past the request
265 	 * then we don't need to update it either
266 	 *
267 	 * Note for shm we ignore FREE_UNTIL messages and leave the pointer
268 	 * to shared memory, and for non-shm the offset is 0.
269 	 */
270 	if (!time_travel_ext_waiting && time_travel_ext_free_until &&
271 	    time < (*time_travel_ext_free_until - time_travel_shm_offset))
272 		return;
273 
274 	time_travel_ext_prev_request = time;
275 	time_travel_ext_prev_request_valid = true;
276 
277 	if (time_travel_shm) {
278 		union um_timetravel_schedshm_client *running;
279 
280 		running = &time_travel_shm->clients[time_travel_shm->running_id];
281 
282 		if (running->capa & UM_TIMETRAVEL_SCHEDSHM_CAP_TIME_SHARE) {
283 			time_travel_shm_client->flags |=
284 				UM_TIMETRAVEL_SCHEDSHM_FLAGS_REQ_RUN;
285 			time += time_travel_shm_offset;
286 			time_travel_shm_client->req_time = time;
287 			if (time < time_travel_shm->free_until)
288 				time_travel_shm->free_until = time;
289 			return;
290 		}
291 	}
292 
293 	time_travel_ext_req(UM_TIMETRAVEL_REQUEST, time);
294 }
295 
__time_travel_propagate_time(void)296 void __time_travel_propagate_time(void)
297 {
298 	static unsigned long long last_propagated;
299 
300 	if (time_travel_shm) {
301 		if (time_travel_shm->running_id != time_travel_shm_id)
302 			panic("time-travel: setting time while not running\n");
303 		time_travel_shm->current_time = time_travel_time +
304 						time_travel_shm_offset;
305 		return;
306 	}
307 
308 	if (last_propagated == time_travel_time)
309 		return;
310 
311 	time_travel_ext_req(UM_TIMETRAVEL_UPDATE, time_travel_time);
312 	last_propagated = time_travel_time;
313 }
314 EXPORT_SYMBOL_GPL(__time_travel_propagate_time);
315 
316 /* returns true if we must do a wait to the simtime device */
time_travel_ext_request(unsigned long long time)317 static bool time_travel_ext_request(unsigned long long time)
318 {
319 	/*
320 	 * If we received an external sync point ("free until") then we
321 	 * don't have to request/wait for anything until then, unless
322 	 * we're already waiting.
323 	 *
324 	 * Note for shm we ignore FREE_UNTIL messages and leave the pointer
325 	 * to shared memory, and for non-shm the offset is 0.
326 	 */
327 	if (!time_travel_ext_waiting && time_travel_ext_free_until &&
328 	    time < (*time_travel_ext_free_until - time_travel_shm_offset))
329 		return false;
330 
331 	time_travel_ext_update_request(time);
332 	return true;
333 }
334 
time_travel_ext_wait(bool idle)335 static void time_travel_ext_wait(bool idle)
336 {
337 	struct um_timetravel_msg msg = {
338 		.op = UM_TIMETRAVEL_ACK,
339 	};
340 
341 	time_travel_ext_prev_request_valid = false;
342 	if (!time_travel_shm)
343 		time_travel_ext_free_until = NULL;
344 	time_travel_ext_waiting++;
345 
346 	time_travel_ext_req(UM_TIMETRAVEL_WAIT, -1);
347 
348 	/*
349 	 * Here we are deep in the idle loop, so we have to break out of the
350 	 * kernel abstraction in a sense and implement this in terms of the
351 	 * UML system waiting on the VQ interrupt while sleeping, when we get
352 	 * the signal it'll call time_travel_ext_vq_notify_done() completing the
353 	 * call.
354 	 */
355 	while (msg.op != UM_TIMETRAVEL_RUN)
356 		time_travel_handle_message(&msg, idle ? TTMH_IDLE : TTMH_POLL);
357 
358 	time_travel_ext_waiting--;
359 
360 	/* we might request more stuff while polling - reset when we run */
361 	time_travel_ext_prev_request_valid = false;
362 }
363 
time_travel_ext_get_time(void)364 static void time_travel_ext_get_time(void)
365 {
366 	if (time_travel_shm)
367 		time_travel_set_time(time_travel_shm->current_time -
368 				     time_travel_shm_offset);
369 	else
370 		time_travel_ext_req(UM_TIMETRAVEL_GET, -1);
371 }
372 
__time_travel_update_time(unsigned long long ns,bool idle)373 static void __time_travel_update_time(unsigned long long ns, bool idle)
374 {
375 	if (time_travel_mode == TT_MODE_EXTERNAL && time_travel_ext_request(ns))
376 		time_travel_ext_wait(idle);
377 	else
378 		time_travel_set_time(ns);
379 }
380 
time_travel_first_event(void)381 static struct time_travel_event *time_travel_first_event(void)
382 {
383 	return list_first_entry_or_null(&time_travel_events,
384 					struct time_travel_event,
385 					list);
386 }
387 
__time_travel_add_event(struct time_travel_event * e,unsigned long long time)388 static void __time_travel_add_event(struct time_travel_event *e,
389 				    unsigned long long time)
390 {
391 	struct time_travel_event *tmp;
392 	bool inserted = false;
393 	unsigned long flags;
394 
395 	if (e->pending)
396 		return;
397 
398 	e->pending = true;
399 	e->time = time;
400 
401 	local_irq_save(flags);
402 	list_for_each_entry(tmp, &time_travel_events, list) {
403 		/*
404 		 * Add the new entry before one with higher time,
405 		 * or if they're equal and both on stack, because
406 		 * in that case we need to unwind the stack in the
407 		 * right order, and the later event (timer sleep
408 		 * or such) must be dequeued first.
409 		 */
410 		if ((tmp->time > e->time) ||
411 		    (tmp->time == e->time && tmp->onstack && e->onstack)) {
412 			list_add_tail(&e->list, &tmp->list);
413 			inserted = true;
414 			break;
415 		}
416 	}
417 
418 	if (!inserted)
419 		list_add_tail(&e->list, &time_travel_events);
420 
421 	tmp = time_travel_first_event();
422 	time_travel_ext_update_request(tmp->time);
423 	time_travel_next_event = tmp->time;
424 	local_irq_restore(flags);
425 }
426 
time_travel_add_event(struct time_travel_event * e,unsigned long long time)427 static void time_travel_add_event(struct time_travel_event *e,
428 				  unsigned long long time)
429 {
430 	if (WARN_ON(!e->fn))
431 		return;
432 
433 	__time_travel_add_event(e, time);
434 }
435 
time_travel_add_event_rel(struct time_travel_event * e,unsigned long long delay_ns)436 void time_travel_add_event_rel(struct time_travel_event *e,
437 			       unsigned long long delay_ns)
438 {
439 	time_travel_add_event(e, time_travel_time + delay_ns);
440 }
441 
time_travel_periodic_timer(struct time_travel_event * e)442 static void time_travel_periodic_timer(struct time_travel_event *e)
443 {
444 	time_travel_add_event(&time_travel_timer_event,
445 			      time_travel_time + time_travel_timer_interval);
446 	deliver_alarm();
447 }
448 
deliver_time_travel_irqs(void)449 void deliver_time_travel_irqs(void)
450 {
451 	struct time_travel_event *e;
452 	unsigned long flags;
453 
454 	/*
455 	 * Don't do anything for most cases. Note that because here we have
456 	 * to disable IRQs (and re-enable later) we'll actually recurse at
457 	 * the end of the function, so this is strictly necessary.
458 	 */
459 	if (likely(list_empty(&time_travel_irqs)))
460 		return;
461 
462 	local_irq_save(flags);
463 	irq_enter();
464 	while ((e = list_first_entry_or_null(&time_travel_irqs,
465 					     struct time_travel_event,
466 					     list))) {
467 		list_del(&e->list);
468 		e->pending = false;
469 		e->fn(e);
470 	}
471 	irq_exit();
472 	local_irq_restore(flags);
473 }
474 
time_travel_deliver_event(struct time_travel_event * e)475 static void time_travel_deliver_event(struct time_travel_event *e)
476 {
477 	if (e == &time_travel_timer_event) {
478 		/*
479 		 * deliver_alarm() does the irq_enter/irq_exit
480 		 * by itself, so must handle it specially here
481 		 */
482 		e->fn(e);
483 	} else if (irqs_disabled()) {
484 		list_add_tail(&e->list, &time_travel_irqs);
485 		/*
486 		 * set pending again, it was set to false when the
487 		 * event was deleted from the original list, but
488 		 * now it's still pending until we deliver the IRQ.
489 		 */
490 		e->pending = true;
491 	} else {
492 		unsigned long flags;
493 
494 		local_irq_save(flags);
495 		irq_enter();
496 		e->fn(e);
497 		irq_exit();
498 		local_irq_restore(flags);
499 	}
500 }
501 
time_travel_del_event(struct time_travel_event * e)502 bool time_travel_del_event(struct time_travel_event *e)
503 {
504 	unsigned long flags;
505 
506 	if (!e->pending)
507 		return false;
508 	local_irq_save(flags);
509 	list_del(&e->list);
510 	e->pending = false;
511 	local_irq_restore(flags);
512 	return true;
513 }
514 
time_travel_update_time(unsigned long long next,bool idle)515 static void time_travel_update_time(unsigned long long next, bool idle)
516 {
517 	struct time_travel_event ne = {
518 		.onstack = true,
519 	};
520 	struct time_travel_event *e;
521 	bool finished = idle;
522 
523 	/* add it without a handler - we deal with that specifically below */
524 	__time_travel_add_event(&ne, next);
525 
526 	do {
527 		e = time_travel_first_event();
528 
529 		BUG_ON(!e);
530 		__time_travel_update_time(e->time, idle);
531 
532 		/* new events may have been inserted while we were waiting */
533 		if (e == time_travel_first_event()) {
534 			BUG_ON(!time_travel_del_event(e));
535 			BUG_ON(time_travel_time != e->time);
536 
537 			if (e == &ne) {
538 				finished = true;
539 			} else {
540 				if (e->onstack)
541 					panic("On-stack event dequeued outside of the stack! time=%lld, event time=%lld, event=%pS\n",
542 					      time_travel_time, e->time, e);
543 				time_travel_deliver_event(e);
544 			}
545 		}
546 
547 		e = time_travel_first_event();
548 		if (e)
549 			time_travel_ext_update_request(e->time);
550 	} while (ne.pending && !finished);
551 
552 	time_travel_del_event(&ne);
553 }
554 
time_travel_update_time_rel(unsigned long long offs)555 static void time_travel_update_time_rel(unsigned long long offs)
556 {
557 	unsigned long flags;
558 
559 	/*
560 	 * Disable interrupts before calculating the new time so
561 	 * that a real timer interrupt (signal) can't happen at
562 	 * a bad time e.g. after we read time_travel_time but
563 	 * before we've completed updating the time.
564 	 */
565 	local_irq_save(flags);
566 	time_travel_update_time(time_travel_time + offs, false);
567 	local_irq_restore(flags);
568 }
569 
time_travel_ndelay(unsigned long nsec)570 void time_travel_ndelay(unsigned long nsec)
571 {
572 	/*
573 	 * Not strictly needed to use _rel() version since this is
574 	 * only used in INFCPU/EXT modes, but it doesn't hurt and
575 	 * is more readable too.
576 	 */
577 	time_travel_update_time_rel(nsec);
578 }
579 EXPORT_SYMBOL(time_travel_ndelay);
580 
time_travel_add_irq_event(struct time_travel_event * e)581 void time_travel_add_irq_event(struct time_travel_event *e)
582 {
583 	BUG_ON(time_travel_mode != TT_MODE_EXTERNAL);
584 
585 	time_travel_ext_get_time();
586 	/*
587 	 * We could model interrupt latency here, for now just
588 	 * don't have any latency at all and request the exact
589 	 * same time (again) to run the interrupt...
590 	 */
591 	time_travel_add_event(e, time_travel_time);
592 }
593 EXPORT_SYMBOL_GPL(time_travel_add_irq_event);
594 
time_travel_oneshot_timer(struct time_travel_event * e)595 static void time_travel_oneshot_timer(struct time_travel_event *e)
596 {
597 	deliver_alarm();
598 }
599 
time_travel_sleep(void)600 void time_travel_sleep(void)
601 {
602 	/*
603 	 * Wait "forever" (using S64_MAX because there are some potential
604 	 * wrapping issues, especially with the current TT_MODE_EXTERNAL
605 	 * controller application.
606 	 */
607 	unsigned long long next = S64_MAX;
608 
609 	if (time_travel_mode == TT_MODE_BASIC)
610 		os_timer_disable();
611 
612 	time_travel_update_time(next, true);
613 
614 	if (time_travel_mode == TT_MODE_BASIC &&
615 	    time_travel_timer_event.pending) {
616 		if (time_travel_timer_event.fn == time_travel_periodic_timer) {
617 			/*
618 			 * This is somewhat wrong - we should get the first
619 			 * one sooner like the os_timer_one_shot() below...
620 			 */
621 			os_timer_set_interval(time_travel_timer_interval);
622 		} else {
623 			os_timer_one_shot(time_travel_timer_event.time - next);
624 		}
625 	}
626 }
627 
time_travel_handle_real_alarm(void)628 static void time_travel_handle_real_alarm(void)
629 {
630 	time_travel_set_time(time_travel_next_event);
631 
632 	time_travel_del_event(&time_travel_timer_event);
633 
634 	if (time_travel_timer_event.fn == time_travel_periodic_timer)
635 		time_travel_add_event(&time_travel_timer_event,
636 				      time_travel_time +
637 				      time_travel_timer_interval);
638 }
639 
time_travel_set_interval(unsigned long long interval)640 static void time_travel_set_interval(unsigned long long interval)
641 {
642 	time_travel_timer_interval = interval;
643 }
644 
time_travel_connect_external(const char * socket)645 static int time_travel_connect_external(const char *socket)
646 {
647 	const char *sep;
648 	unsigned long long id = (unsigned long long)-1;
649 	int rc;
650 
651 	if ((sep = strchr(socket, ':'))) {
652 		char buf[25] = {};
653 		if (sep - socket > sizeof(buf) - 1)
654 			goto invalid_number;
655 
656 		memcpy(buf, socket, sep - socket);
657 		if (kstrtoull(buf, 0, &id)) {
658 invalid_number:
659 			panic("time-travel: invalid external ID in string '%s'\n",
660 			      socket);
661 			return -EINVAL;
662 		}
663 
664 		socket = sep + 1;
665 	}
666 
667 	rc = os_connect_socket(socket);
668 	if (rc < 0) {
669 		panic("time-travel: failed to connect to external socket %s\n",
670 		      socket);
671 		return rc;
672 	}
673 
674 	time_travel_ext_fd = rc;
675 
676 	time_travel_ext_req(UM_TIMETRAVEL_START, id);
677 
678 	return 1;
679 }
680 
time_travel_set_start(void)681 static void time_travel_set_start(void)
682 {
683 	if (time_travel_start_set)
684 		return;
685 
686 	switch (time_travel_mode) {
687 	case TT_MODE_EXTERNAL:
688 		time_travel_start = time_travel_ext_req(UM_TIMETRAVEL_GET_TOD, -1);
689 		/* controller gave us the *current* time, so adjust by that */
690 		time_travel_ext_get_time();
691 		time_travel_start -= time_travel_time;
692 		break;
693 	case TT_MODE_INFCPU:
694 	case TT_MODE_BASIC:
695 		if (!time_travel_start_set)
696 			time_travel_start = os_persistent_clock_emulation();
697 		break;
698 	case TT_MODE_OFF:
699 		/* we just read the host clock with os_persistent_clock_emulation() */
700 		break;
701 	}
702 
703 	time_travel_start_set = true;
704 }
705 #else /* CONFIG_UML_TIME_TRAVEL_SUPPORT */
706 #define time_travel_start_set 0
707 #define time_travel_start 0
708 #define time_travel_time 0
709 #define time_travel_ext_waiting 0
710 
time_travel_update_time(unsigned long long ns,bool idle)711 static inline void time_travel_update_time(unsigned long long ns, bool idle)
712 {
713 }
714 
time_travel_update_time_rel(unsigned long long offs)715 static inline void time_travel_update_time_rel(unsigned long long offs)
716 {
717 }
718 
time_travel_handle_real_alarm(void)719 static inline void time_travel_handle_real_alarm(void)
720 {
721 }
722 
time_travel_set_interval(unsigned long long interval)723 static void time_travel_set_interval(unsigned long long interval)
724 {
725 }
726 
time_travel_set_start(void)727 static inline void time_travel_set_start(void)
728 {
729 }
730 
731 /* fail link if this actually gets used */
732 extern u64 time_travel_ext_req(u32 op, u64 time);
733 
734 /* these are empty macros so the struct/fn need not exist */
735 #define time_travel_add_event(e, time) do { } while (0)
736 /* externally not usable - redefine here so we can */
737 #undef time_travel_del_event
738 #define time_travel_del_event(e) do { } while (0)
739 #endif
740 
timer_handler(int sig,struct siginfo * unused_si,struct uml_pt_regs * regs)741 void timer_handler(int sig, struct siginfo *unused_si, struct uml_pt_regs *regs)
742 {
743 	unsigned long flags;
744 
745 	/*
746 	 * In basic time-travel mode we still get real interrupts
747 	 * (signals) but since we don't read time from the OS, we
748 	 * must update the simulated time here to the expiry when
749 	 * we get a signal.
750 	 * This is not the case in inf-cpu mode, since there we
751 	 * never get any real signals from the OS.
752 	 */
753 	if (time_travel_mode == TT_MODE_BASIC)
754 		time_travel_handle_real_alarm();
755 
756 	local_irq_save(flags);
757 	do_IRQ(TIMER_IRQ, regs);
758 	local_irq_restore(flags);
759 }
760 
itimer_shutdown(struct clock_event_device * evt)761 static int itimer_shutdown(struct clock_event_device *evt)
762 {
763 	if (time_travel_mode != TT_MODE_OFF)
764 		time_travel_del_event(&time_travel_timer_event);
765 
766 	if (time_travel_mode != TT_MODE_INFCPU &&
767 	    time_travel_mode != TT_MODE_EXTERNAL)
768 		os_timer_disable();
769 
770 	return 0;
771 }
772 
itimer_set_periodic(struct clock_event_device * evt)773 static int itimer_set_periodic(struct clock_event_device *evt)
774 {
775 	unsigned long long interval = NSEC_PER_SEC / HZ;
776 
777 	if (time_travel_mode != TT_MODE_OFF) {
778 		time_travel_del_event(&time_travel_timer_event);
779 		time_travel_set_event_fn(&time_travel_timer_event,
780 					 time_travel_periodic_timer);
781 		time_travel_set_interval(interval);
782 		time_travel_add_event(&time_travel_timer_event,
783 				      time_travel_time + interval);
784 	}
785 
786 	if (time_travel_mode != TT_MODE_INFCPU &&
787 	    time_travel_mode != TT_MODE_EXTERNAL)
788 		os_timer_set_interval(interval);
789 
790 	return 0;
791 }
792 
itimer_next_event(unsigned long delta,struct clock_event_device * evt)793 static int itimer_next_event(unsigned long delta,
794 			     struct clock_event_device *evt)
795 {
796 	delta += 1;
797 
798 	if (time_travel_mode != TT_MODE_OFF) {
799 		time_travel_del_event(&time_travel_timer_event);
800 		time_travel_set_event_fn(&time_travel_timer_event,
801 					 time_travel_oneshot_timer);
802 		time_travel_add_event(&time_travel_timer_event,
803 				      time_travel_time + delta);
804 	}
805 
806 	if (time_travel_mode != TT_MODE_INFCPU &&
807 	    time_travel_mode != TT_MODE_EXTERNAL)
808 		return os_timer_one_shot(delta);
809 
810 	return 0;
811 }
812 
itimer_one_shot(struct clock_event_device * evt)813 static int itimer_one_shot(struct clock_event_device *evt)
814 {
815 	return itimer_next_event(0, evt);
816 }
817 
818 static struct clock_event_device timer_clockevent = {
819 	.name			= "posix-timer",
820 	.rating			= 250,
821 	.cpumask		= cpu_possible_mask,
822 	.features		= CLOCK_EVT_FEAT_PERIODIC |
823 				  CLOCK_EVT_FEAT_ONESHOT,
824 	.set_state_shutdown	= itimer_shutdown,
825 	.set_state_periodic	= itimer_set_periodic,
826 	.set_state_oneshot	= itimer_one_shot,
827 	.set_next_event		= itimer_next_event,
828 	.shift			= 0,
829 	.max_delta_ns		= 0xffffffff,
830 	.max_delta_ticks	= 0xffffffff,
831 	.min_delta_ns		= TIMER_MIN_DELTA,
832 	.min_delta_ticks	= TIMER_MIN_DELTA, // microsecond resolution should be enough for anyone, same as 640K RAM
833 	.irq			= 0,
834 	.mult			= 1,
835 };
836 
um_timer(int irq,void * dev)837 static irqreturn_t um_timer(int irq, void *dev)
838 {
839 	if (get_current()->mm != NULL)
840 	{
841         /* userspace - relay signal, results in correct userspace timers */
842 		os_alarm_process(get_current()->mm->context.id.pid);
843 	}
844 
845 	(*timer_clockevent.event_handler)(&timer_clockevent);
846 
847 	return IRQ_HANDLED;
848 }
849 
timer_read(struct clocksource * cs)850 static u64 timer_read(struct clocksource *cs)
851 {
852 	if (time_travel_mode != TT_MODE_OFF) {
853 		/*
854 		 * We make reading the timer cost a bit so that we don't get
855 		 * stuck in loops that expect time to move more than the
856 		 * exact requested sleep amount, e.g. python's socket server,
857 		 * see https://bugs.python.org/issue37026.
858 		 *
859 		 * However, don't do that when we're in interrupt or such as
860 		 * then we might recurse into our own processing, and get to
861 		 * even more waiting, and that's not good - it messes up the
862 		 * "what do I do next" and onstack event we use to know when
863 		 * to return from time_travel_update_time().
864 		 */
865 		if (!irqs_disabled() && !in_interrupt() && !in_softirq() &&
866 		    !time_travel_ext_waiting)
867 			time_travel_update_time_rel(TIMER_MULTIPLIER);
868 		return time_travel_time / TIMER_MULTIPLIER;
869 	}
870 
871 	return os_nsecs() / TIMER_MULTIPLIER;
872 }
873 
874 static struct clocksource timer_clocksource = {
875 	.name		= "timer",
876 	.rating		= 300,
877 	.read		= timer_read,
878 	.mask		= CLOCKSOURCE_MASK(64),
879 	.flags		= CLOCK_SOURCE_IS_CONTINUOUS,
880 };
881 
um_timer_setup(void)882 static void __init um_timer_setup(void)
883 {
884 	int err;
885 
886 	err = request_irq(TIMER_IRQ, um_timer, IRQF_TIMER, "hr timer", NULL);
887 	if (err != 0)
888 		printk(KERN_ERR "register_timer : request_irq failed - "
889 		       "errno = %d\n", -err);
890 
891 	err = os_timer_create();
892 	if (err != 0) {
893 		printk(KERN_ERR "creation of timer failed - errno = %d\n", -err);
894 		return;
895 	}
896 
897 	err = clocksource_register_hz(&timer_clocksource, NSEC_PER_SEC/TIMER_MULTIPLIER);
898 	if (err) {
899 		printk(KERN_ERR "clocksource_register_hz returned %d\n", err);
900 		return;
901 	}
902 	clockevents_register_device(&timer_clockevent);
903 }
904 
read_persistent_clock64(struct timespec64 * ts)905 void read_persistent_clock64(struct timespec64 *ts)
906 {
907 	long long nsecs;
908 
909 	time_travel_set_start();
910 
911 	if (time_travel_mode != TT_MODE_OFF)
912 		nsecs = time_travel_start + time_travel_time;
913 	else
914 		nsecs = os_persistent_clock_emulation();
915 
916 	set_normalized_timespec64(ts, nsecs / NSEC_PER_SEC,
917 				  nsecs % NSEC_PER_SEC);
918 }
919 
time_init(void)920 void __init time_init(void)
921 {
922 	timer_set_signal_handler();
923 	late_time_init = um_timer_setup;
924 }
925 
926 #ifdef CONFIG_UML_TIME_TRAVEL_SUPPORT
calibrate_delay_is_known(void)927 unsigned long calibrate_delay_is_known(void)
928 {
929 	if (time_travel_mode == TT_MODE_INFCPU ||
930 	    time_travel_mode == TT_MODE_EXTERNAL)
931 		return 1;
932 	return 0;
933 }
934 
setup_time_travel(char * str)935 static int setup_time_travel(char *str)
936 {
937 	if (strcmp(str, "=inf-cpu") == 0) {
938 		time_travel_mode = TT_MODE_INFCPU;
939 		timer_clockevent.name = "time-travel-timer-infcpu";
940 		timer_clocksource.name = "time-travel-clock";
941 		return 1;
942 	}
943 
944 	if (strncmp(str, "=ext:", 5) == 0) {
945 		time_travel_mode = TT_MODE_EXTERNAL;
946 		timer_clockevent.name = "time-travel-timer-external";
947 		timer_clocksource.name = "time-travel-clock-external";
948 		return time_travel_connect_external(str + 5);
949 	}
950 
951 	if (!*str) {
952 		time_travel_mode = TT_MODE_BASIC;
953 		timer_clockevent.name = "time-travel-timer";
954 		timer_clocksource.name = "time-travel-clock";
955 		return 1;
956 	}
957 
958 	return -EINVAL;
959 }
960 
961 __setup("time-travel", setup_time_travel);
962 __uml_help(setup_time_travel,
963 "time-travel\n"
964 "This option just enables basic time travel mode, in which the clock/timers\n"
965 "inside the UML instance skip forward when there's nothing to do, rather than\n"
966 "waiting for real time to elapse. However, instance CPU speed is limited by\n"
967 "the real CPU speed, so e.g. a 10ms timer will always fire after ~10ms wall\n"
968 "clock (but quicker when there's nothing to do).\n"
969 "\n"
970 "time-travel=inf-cpu\n"
971 "This enables time travel mode with infinite processing power, in which there\n"
972 "are no wall clock timers, and any CPU processing happens - as seen from the\n"
973 "guest - instantly. This can be useful for accurate simulation regardless of\n"
974 "debug overhead, physical CPU speed, etc. but is somewhat dangerous as it can\n"
975 "easily lead to getting stuck (e.g. if anything in the system busy loops).\n"
976 "\n"
977 "time-travel=ext:[ID:]/path/to/socket\n"
978 "This enables time travel mode similar to =inf-cpu, except the system will\n"
979 "use the given socket to coordinate with a central scheduler, in order to\n"
980 "have more than one system simultaneously be on simulated time. The virtio\n"
981 "driver code in UML knows about this so you can also simulate networks and\n"
982 "devices using it, assuming the device has the right capabilities.\n"
983 "The optional ID is a 64-bit integer that's sent to the central scheduler.\n");
984 
setup_time_travel_start(char * str)985 static int setup_time_travel_start(char *str)
986 {
987 	int err;
988 
989 	err = kstrtoull(str, 0, &time_travel_start);
990 	if (err)
991 		return err;
992 
993 	time_travel_start_set = 1;
994 	return 1;
995 }
996 
997 __setup("time-travel-start=", setup_time_travel_start);
998 __uml_help(setup_time_travel_start,
999 "time-travel-start=<nanoseconds>\n"
1000 "Configure the UML instance's wall clock to start at this value rather than\n"
1001 "the host's wall clock at the time of UML boot.\n");
1002 static struct kobject *bc_time_kobject;
1003 
bc_show(struct kobject * kobj,struct kobj_attribute * attr,char * buf)1004 static ssize_t bc_show(struct kobject *kobj, struct kobj_attribute *attr, char *buf)
1005 {
1006 	return sprintf(buf, "0x%llx", bc_message);
1007 }
1008 
bc_store(struct kobject * kobj,struct kobj_attribute * attr,const char * buf,size_t count)1009 static ssize_t bc_store(struct kobject *kobj, struct kobj_attribute *attr, const char *buf, size_t count)
1010 {
1011 	int ret;
1012 	u64 user_bc_message;
1013 
1014 	ret = kstrtou64(buf, 0, &user_bc_message);
1015 	if (ret)
1016 		return ret;
1017 
1018 	bc_message = user_bc_message;
1019 
1020 	time_travel_ext_req(UM_TIMETRAVEL_BROADCAST, bc_message);
1021 	pr_info("um: time: sent broadcast message: 0x%llx\n", bc_message);
1022 	return count;
1023 }
1024 
1025 static struct kobj_attribute bc_attribute = __ATTR(bc-message, 0660, bc_show, bc_store);
1026 
um_bc_start(void)1027 static int __init um_bc_start(void)
1028 {
1029 	if (time_travel_mode != TT_MODE_EXTERNAL)
1030 		return 0;
1031 
1032 	bc_time_kobject = kobject_create_and_add("um-ext-time", kernel_kobj);
1033 	if (!bc_time_kobject)
1034 		return 0;
1035 
1036 	if (sysfs_create_file(bc_time_kobject, &bc_attribute.attr))
1037 		pr_debug("failed to create the bc file in /sys/kernel/um_time");
1038 
1039 	return 0;
1040 }
1041 late_initcall(um_bc_start);
1042 #endif
1043