uml: tickless support
author Jeff Dike <jdike@addtoit.com>
Tue, 16 Oct 2007 08:27:25 +0000 (01:27 -0700)
committer Linus Torvalds <torvalds@woody.linux-foundation.org>
Tue, 16 Oct 2007 16:43:08 +0000 (09:43 -0700)
Enable tickless support.

CONFIG_TICK_ONESHOT and CONFIG_NO_HZ are enabled.

itimer_clockevent gets CLOCK_EVT_FEAT_ONESHOT and an implementation of
.set_next_event.

CONFIG_UML_REAL_TIME_CLOCK goes away because it only makes sense when there is
a clock ticking away all the time.  timer_handler now just calls do_IRQ once
without trying to figure out how many ticks to emulate.

The idle loop now needs to turn ticking on and off.

Userspace ticks keep happening as usual.  However, the userspace loop keeps
track of when the next wakeup should happen and suppresses process ticks until
that happens.

Signed-off-by: Jeff Dike <jdike@linux.intel.com>
Cc: Thomas Gleixner <tglx@linutronix.de>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
arch/um/Kconfig
arch/um/defconfig
arch/um/include/os.h
arch/um/kernel/process.c
arch/um/kernel/time.c
arch/um/os-Linux/skas/process.c
arch/um/os-Linux/time.c

index 64fe8d5..740d8a9 100644 (file)
@@ -250,18 +250,6 @@ config KERNEL_STACK_ORDER
          be 1 << order pages.  The default is OK unless you're running Valgrind
          on UML, in which case, set this to 3.
 
-config UML_REAL_TIME_CLOCK
-       bool "Real-time Clock"
-       default y
-       help
-         This option makes UML time deltas match wall clock deltas.  This
-         should normally be enabled.  The exception would be if you are
-         debugging with UML and spend long times with UML stopped at a
-         breakpoint.  In this case, when UML is restarted, it will call the
-         timer enough times to make up for the time spent at the breakpoint.
-         This could result in a noticeable lag.  If this is a problem, then
-         disable this option.
-
 endmenu
 
 source "init/Kconfig"
index 9f105c8..1cbbe98 100644 (file)
@@ -73,8 +73,8 @@ CONFIG_FLATMEM=y
 CONFIG_FLAT_NODE_MEM_MAP=y
 # CONFIG_SPARSEMEM_STATIC is not set
 CONFIG_SPLIT_PTLOCK_CPUS=4
-# CONFIG_TICK_ONESHOT is not set
-# CONFIG_NO_HZ is not set
+CONFIG_TICK_ONESHOT=y
+CONFIG_NO_HZ=y
 CONFIG_HIGH_RES_TIMERS=y
 CONFIG_LD_SCRIPT_DYN=y
 CONFIG_NET=y
@@ -87,7 +87,6 @@ CONFIG_MAGIC_SYSRQ=y
 CONFIG_NEST_LEVEL=0
 # CONFIG_HIGHMEM is not set
 CONFIG_KERNEL_STACK_ORDER=0
-CONFIG_UML_REAL_TIME_CLOCK=y
 
 #
 # Code maturity level options
index a6d8072..e4f2fe1 100644 (file)
@@ -254,6 +254,7 @@ extern void os_dump_core(void);
 extern int switch_timers(int to_real);
 extern void idle_sleep(int secs);
 extern int set_interval(void);
+extern int timer_one_shot(int ticks);
 extern void disable_timer(void);
 extern void uml_idle_timer(void);
 extern unsigned long long os_nsecs(void);
index 56d75af..aef494b 100644 (file)
@@ -13,6 +13,7 @@
 #include "linux/ptrace.h"
 #include "linux/random.h"
 #include "linux/sched.h"
+#include "linux/tick.h"
 #include "linux/threads.h"
 #include "asm/pgtable.h"
 #include "asm/uaccess.h"
@@ -244,9 +245,11 @@ void default_idle(void)
                if (need_resched())
                        schedule();
 
+               tick_nohz_stop_sched_tick();
                switch_timers(1);
                idle_sleep(10);
                switch_timers(0);
+               tick_nohz_restart_sched_tick();
        }
 }
 
index 3cb7135..2acdc7e 100644 (file)
@@ -20,41 +20,12 @@ unsigned long long sched_clock(void)
        return (unsigned long long)jiffies_64 * (1000000000 / HZ);
 }
 
-#ifdef CONFIG_UML_REAL_TIME_CLOCK
-static unsigned long long prev_nsecs[NR_CPUS];
-static long long delta[NR_CPUS];               /* Deviation per interval */
-#endif
-
 void timer_handler(int sig, struct uml_pt_regs *regs)
 {
-       unsigned long long ticks = 0;
        unsigned long flags;
-#ifdef CONFIG_UML_REAL_TIME_CLOCK
-       int c = cpu();
-       if (prev_nsecs[c]) {
-               /* We've had 1 tick */
-               unsigned long long nsecs = os_nsecs();
-
-               delta[c] += nsecs - prev_nsecs[c];
-               prev_nsecs[c] = nsecs;
-
-               /* Protect against the host clock being set backwards */
-               if (delta[c] < 0)
-                       delta[c] = 0;
-
-               ticks += (delta[c] * HZ) / BILLION;
-               delta[c] -= (ticks * BILLION) / HZ;
-       }
-       else prev_nsecs[c] = os_nsecs();
-#else
-       ticks = 1;
-#endif
 
        local_irq_save(flags);
-       while (ticks > 0) {
-               do_IRQ(TIMER_IRQ, regs);
-               ticks--;
-       }
+       do_IRQ(TIMER_IRQ, regs);
        local_irq_restore(flags);
 }
 
@@ -68,10 +39,8 @@ static void itimer_set_mode(enum clock_event_mode mode,
 
        case CLOCK_EVT_MODE_SHUTDOWN:
        case CLOCK_EVT_MODE_UNUSED:
-               disable_timer();
-               break;
        case CLOCK_EVT_MODE_ONESHOT:
-               BUG();
+               disable_timer();
                break;
 
        case CLOCK_EVT_MODE_RESUME:
@@ -79,13 +48,19 @@ static void itimer_set_mode(enum clock_event_mode mode,
        }
 }
 
+static int itimer_next_event(unsigned long delta,
+                            struct clock_event_device *evt)
+{
+       return timer_one_shot(delta + 1);
+}
+
 static struct clock_event_device itimer_clockevent = {
        .name           = "itimer",
        .rating         = 250,
        .cpumask        = CPU_MASK_ALL,
-       .features       = CLOCK_EVT_FEAT_PERIODIC,
+       .features       = CLOCK_EVT_FEAT_PERIODIC | CLOCK_EVT_FEAT_ONESHOT,
        .set_mode       = itimer_set_mode,
-       .set_next_event = NULL,
+       .set_next_event = itimer_next_event,
        .shift          = 32,
        .irq            = 0,
 };
index 0036164..3e64814 100644 (file)
@@ -287,10 +287,18 @@ int start_userspace(unsigned long stub_stack)
 
 void userspace(struct uml_pt_regs *regs)
 {
+       struct itimerval timer;
+       unsigned long long nsecs, now;
        int err, status, op, pid = userspace_pid[0];
        /* To prevent races if using_sysemu changes under us.*/
        int local_using_sysemu;
 
+       if (getitimer(ITIMER_VIRTUAL, &timer))
+               printk("Failed to get itimer, errno = %d\n", errno);
+       nsecs = timer.it_value.tv_sec * BILLION +
+               timer.it_value.tv_usec * 1000;
+       nsecs += os_nsecs();
+
        while (1) {
                restore_registers(pid, regs);
 
@@ -333,8 +341,18 @@ void userspace(struct uml_pt_regs *regs)
                        case SIGTRAP:
                                relay_signal(SIGTRAP, regs);
                                break;
-                       case SIGIO:
                        case SIGVTALRM:
+                               now = os_nsecs();
+                               if(now < nsecs)
+                                       break;
+                               block_signals();
+                               (*sig_info[sig])(sig, regs);
+                               unblock_signals();
+                               nsecs = timer.it_value.tv_sec * BILLION +
+                                       timer.it_value.tv_usec * 1000;
+                               nsecs += os_nsecs();
+                               break;
+                       case SIGIO:
                        case SIGILL:
                        case SIGBUS:
                        case SIGFPE:
@@ -378,6 +396,7 @@ __initcall(init_thread_regs);
 
 int copy_context_skas0(unsigned long new_stack, int pid)
 {
+       struct timeval tv = { .tv_sec = 0, .tv_usec = 1000000 / UM_HZ };
        int err;
        unsigned long current_stack = current_stub_stack();
        struct stub_data *data = (struct stub_data *) current_stack;
@@ -392,9 +411,9 @@ int copy_context_skas0(unsigned long new_stack, int pid)
        *data = ((struct stub_data) { .offset   = MMAP_OFFSET(new_offset),
                                      .fd       = new_fd,
                                      .timer    = ((struct itimerval)
-                                                   { { 0, 1000000 / UM_HZ },
-                                                     { 0, 1000000 / UM_HZ }})
-                                });
+                                                  { .it_value = tv,
+                                                    .it_interval = tv }) });
+
        err = ptrace_setregs(pid, thread_regs);
        if (err < 0)
                panic("copy_context_skas0 : PTRACE_SETREGS failed, "
index 6ff3d98..9ffc61a 100644 (file)
@@ -26,6 +26,21 @@ int set_interval(void)
        return 0;
 }
 
+int timer_one_shot(int ticks)
+{
+       unsigned long usec = ticks * 1000000 / UM_HZ;
+       unsigned long sec = usec / 1000000;
+       struct itimerval interval;
+
+       usec %= 1000000;
+       interval = ((struct itimerval) { { 0, 0 }, { sec, usec } });
+
+       if (setitimer(ITIMER_VIRTUAL, &interval, NULL) == -1)
+               return -errno;
+
+       return 0;
+}
+
 void disable_timer(void)
 {
        struct itimerval disable = ((struct itimerval) { { 0, 0 }, { 0, 0 }});
@@ -74,7 +89,7 @@ unsigned long long os_nsecs(void)
        struct timeval tv;
 
        gettimeofday(&tv, NULL);
-       return (unsigned long long) tv.tv_sec * BILLION + tv.tv_usec * 1000;
+       return timeval_to_ns(&tv);
 }
 
 void idle_sleep(int secs)