[MEDIUM] further improve monotonic clock by checking forward jumps

author Willy Tarreau <w@1wt.eu>

Mon, 23 Jun 2008 12:00:57 +0000 (14:00 +0200)

committer Willy Tarreau <w@1wt.eu>

Mon, 23 Jun 2008 12:00:57 +0000 (14:00 +0200)
author Willy Tarreau <w@1wt.eu>
Mon, 23 Jun 2008 12:00:57 +0000 (14:00 +0200)
committer Willy Tarreau <w@1wt.eu>
Mon, 23 Jun 2008 12:00:57 +0000 (14:00 +0200)
diff --git a/include/common/time.h b/include/common/time.h

index d6155265d6108ca92572e547c42aac3960079834..82ec402ccd7f379d29d9572a9e87f0f348ecdc38 100644 (file)
--- a/include/common/time.h
+++ b/include/common/time.h
@@ -44,6 +44,11 @@
  
  #define TIME_ETERNITY   (TV_ETERNITY_MS)
  
+/* we want to be able to detect time jumps. Fix the maximum wait time to a low
+ * value so that we know the time has changed if we wait longer.
+ */
+#define MAX_DELAY_MS    1000
+
  
  /* returns the lowest delay amongst <old> and <new>, and respects TIME_ETERNITY */
  #define MINTIME(old, new)      (((new)<0)?(old):(((old)<0||(new)<(old))?(new):(old)))
@@ -84,13 +89,15 @@ REGPRM1 static inline struct timeval *tv_now(struct timeval *tv)
         return tv;
  }
  
-/* tv_now_mono: sets <date> to the current time (wall clock), <mono> to a value
- * following a monotonic function, and applies any required correction if the
- * time goes backwards. Note that while we could improve it a bit by checking
- * that the new date is not too far in the future, it is not much necessary to
- * do so. 
+/* tv_update_date: sets <date> to system time, and sets <now> to something as
+ * close as possible to real time, following a monotonic function. The main
+ * principle consists in detecting backwards and forwards time jumps and adjusting
+ * an offset to correct them. This function should be called only once after
+ * each poll. The poll's timeout should be passed in <max_wait>, and the return
+ * value in <interrupted> (a non-zero value means that we have not expired the
+ * timeout).
   */
-REGPRM2 struct timeval *tv_now_mono(struct timeval *mono, struct timeval *wall);
+REGPRM2 void tv_update_date(int max_wait, int interrupted);
  
  /*
   * sets a struct timeval to its highest value so that it can never happen
diff --git a/src/cfgparse.c b/src/cfgparse.c

index 13d2a8930573e27d4e38eb0deefe102d4e30b29c..90611cdaa83843c8bf666b53c76505e88e526079 100644 (file)
--- a/src/cfgparse.c
+++ b/src/cfgparse.c
@@ -2831,7 +2831,7 @@ int readcfgfile(const char *file)
          */
  
         /* will be needed further to delay some tasks */
-       tv_now_mono(&now, &date);
+       tv_update_date(0,1);
  
         if ((curproxy = proxy) == NULL) {
                 Alert("parsing %s : no <listen> line. Nothing to do !\n",
diff --git a/src/ev_epoll.c b/src/ev_epoll.c

index e7aea93f36bce752646dec0565d30b6557d7e7bf..adb0fd6e880d9131c26cc8c0c798feacafc0d12e 100644 (file)
--- a/src/ev_epoll.c
+++ b/src/ev_epoll.c
@@ -235,15 +235,18 @@ REGPRM2 static void _do_poll(struct poller *p, struct timeval *exp)
         if (run_queue)
                 wait_time = 0;
         else if (tv_iseternity(exp))
-               wait_time = -1;
+               wait_time = MAX_DELAY_MS;
         else if (tv_isge(&now, exp))
                 wait_time = 0;
-       else
+       else {
                 wait_time = __tv_ms_elapsed(&now, exp) + 1;
+               if (wait_time > MAX_DELAY_MS)
+                       wait_time = MAX_DELAY_MS;
+       }
  
         fd = MIN(maxfd, global.tune.maxpollevents);
         status = epoll_wait(epoll_fd, epoll_events, fd, wait_time);
-       tv_now_mono(&now, &date);
+       tv_update_date(wait_time, status);
  
         for (count = 0; count < status; count++) {
                 fd = epoll_events[count].data.fd;
diff --git a/src/ev_kqueue.c b/src/ev_kqueue.c

index f22aa5b1fbcc52b777f0efa2c49312eba5a83d6b..71e9ecf614fd5c2ac922fbc333898888e3d63748 100644 (file)
--- a/src/ev_kqueue.c
+++ b/src/ev_kqueue.c
@@ -102,25 +102,41 @@ REGPRM1 static void __fd_clo(int fd)
  REGPRM2 static void _do_poll(struct poller *p, struct timeval *exp)
  {
         int status;
-       int count, fd;
-       struct timespec timeout, *to_ptr;
+       int count, fd, delta_ms;
+       struct timespec timeout;
  
-       to_ptr = NULL;  // no timeout
         if (run_queue) {
                 timeout.tv_sec = timeout.tv_nsec = 0;
-               to_ptr = &timeout;
+               delta_ms = 0;
         }
         else if (tv_isset(exp)) {
+               const struct timeval max_delay = {
+                       .tv_sec  = MAX_DELAY_MS / 1000,
+                       .tv_usec = (MAX_DELAY_MS % 1000) * 1000
+               };
                 struct timeval delta;
  
-               if (tv_isge(&now, exp))
+               if (tv_isge(&now, exp)) {
                         delta.tv_sec = delta.tv_usec = 0;
-               else
+                       delta_ms = 0;
+               }
+               else {
                         tv_remain(&now, exp, &delta);
+                       if (__tv_isgt(&delta, &max_delay)) {
+                               delta    = max_delay;
+                               delta_ms = MAX_DELAY_MS;
+                       } else {
+                               delta_ms = delta.tv_sec * 1000 + delta.tv_usec / 1000;
+                       }
+               }
  
                 timeout.tv_sec  = delta.tv_sec;
                 timeout.tv_nsec = delta.tv_usec * 1000;
-               to_ptr = &timeout;
+       }
+       else {
+               delta_ms = MAX_DELAY_MS;
+               timeout.tv_sec  = MAX_DELAY_MS / 1000;
+               timeout.tv_nsec = (MAX_DELAY_MS % 1000) * 1000000;
         }
  
         fd = MIN(maxfd, global.tune.maxpollevents);
@@ -129,8 +145,8 @@ REGPRM2 static void _do_poll(struct poller *p, struct timeval *exp)
                         0,         // int nchanges
                         kev,       // struct kevent *eventlist
                         fd,        // int nevents
-                       to_ptr);   // const struct timespec *timeout
-       tv_now_mono(&now, &date);
+                       &timeout); // const struct timespec *timeout
+       tv_update_date(delta_ms, status);
  
         for (count = 0; count < status; count++) {
                 fd = kev[count].ident;
diff --git a/src/ev_poll.c b/src/ev_poll.c

index bfbe999ed03bb7bf4a7dc576521f108ae483b5d1..a0355aad6dd112172a7aad33d64fa2f591a73dc0 100644 (file)
--- a/src/ev_poll.c
+++ b/src/ev_poll.c
@@ -127,14 +127,17 @@ REGPRM2 static void _do_poll(struct poller *p, struct timeval *exp)
         if (run_queue)
                 wait_time = 0;
         else if (tv_iseternity(exp))
-               wait_time = -1;
+               wait_time = MAX_DELAY_MS;
         else if (tv_isge(&now, exp))
                 wait_time = 0;
-       else
+       else {
                 wait_time = __tv_ms_elapsed(&now, exp) + 1;
+               if (wait_time > MAX_DELAY_MS)
+                       wait_time = MAX_DELAY_MS;
+       }
  
         status = poll(poll_events, nbfd, wait_time);
-       tv_now_mono(&now, &date);
+       tv_update_date(wait_time, status);
  
         for (count = 0; status > 0 && count < nbfd; count++) {
                 fd = poll_events[count].fd;
diff --git a/src/ev_select.c b/src/ev_select.c

index 25bd3ec60543cf8943751af3078a492fba746660..30df9285bac4b0f2a881666365592c25a2a789c2 100644 (file)
--- a/src/ev_select.c
+++ b/src/ev_select.c
@@ -80,17 +80,27 @@ REGPRM1 static void __fd_rem(int fd)
   */
  REGPRM2 static void _do_poll(struct poller *p, struct timeval *exp)
  {
+       const struct timeval max_delay = {
+               .tv_sec  = MAX_DELAY_MS / 1000,
+               .tv_usec = (MAX_DELAY_MS % 1000) * 1000
+       };
         int status;
         int fd, i;
         struct timeval delta;
+       int delta_ms;
         int readnotnull, writenotnull;
         int fds;
         char count;
                 
         /* allow select to return immediately when needed */
         delta.tv_sec = delta.tv_usec = 0;
-       if (!run_queue && tv_isset(exp)) {
-               if (tv_islt(&now, exp)) {
+       delta_ms = 0;
+       if (!run_queue) {
+               if (!tv_isset(exp)) {
+                       delta = max_delay;
+                       delta_ms = MAX_DELAY_MS;
+               }
+               else if (tv_islt(&now, exp)) {
                         tv_remain(&now, exp, &delta);
                         /* To avoid eventual select loops due to timer precision */
                         delta.tv_usec += SCHEDULER_RESOLUTION * 1000;
@@ -98,6 +108,12 @@ REGPRM2 static void _do_poll(struct poller *p, struct timeval *exp)
                                 delta.tv_usec -= 1000000;
                                 delta.tv_sec ++;
                         }
+                       if (__tv_isge(&delta, &max_delay)) {
+                               delta = max_delay;
+                               delta_ms = MAX_DELAY_MS;
+                       } else {
+                               delta_ms = delta.tv_sec * 1000 + delta.tv_usec / 1000;
+                       }
                 }
         }
  
@@ -122,9 +138,9 @@ REGPRM2 static void _do_poll(struct poller *p, struct timeval *exp)
                         readnotnull ? tmp_evts[DIR_RD] : NULL,
                         writenotnull ? tmp_evts[DIR_WR] : NULL,
                         NULL,
-                       tv_isset(exp) ? &delta : NULL);
+                       &delta);
        
-       tv_now_mono(&now, &date);
+       tv_update_date(delta_ms, status);
  
         if (status <= 0)
                 return;
diff --git a/src/ev_sepoll.c b/src/ev_sepoll.c

index ed2103ced8b89b1b84ea93dbaafdbeb1370bc3b9..f42a97f296b89c3fded21082813db4c7dc562af5 100644 (file)
--- a/src/ev_sepoll.c
+++ b/src/ev_sepoll.c
@@ -418,7 +418,7 @@ REGPRM2 static void _do_poll(struct poller *p, struct timeval *exp)
                  * returning now without checking epoll_wait().
                  */
                 if (++last_skipped <= 1) {
-                       tv_now_mono(&now, &date);
+                       tv_update_date(0, 1);
                         return;
                 }
         }
@@ -435,11 +435,14 @@ REGPRM2 static void _do_poll(struct poller *p, struct timeval *exp)
         }
         else {
                 if (tv_iseternity(exp))
-                       wait_time = -1;
+                       wait_time = MAX_DELAY_MS;
                 else if (tv_isge(&now, exp))
                         wait_time = 0;
-               else
+               else {
                         wait_time = __tv_ms_elapsed(&now, exp) + 1;
+                       if (wait_time > MAX_DELAY_MS)
+                               wait_time = MAX_DELAY_MS;
+               }
         }
  
         /* now let's wait for real events. We normally use maxpollevents as a
@@ -451,8 +454,7 @@ REGPRM2 static void _do_poll(struct poller *p, struct timeval *exp)
         fd = MIN(maxfd, fd);
         spec_processed = 0;
         status = epoll_wait(epoll_fd, epoll_events, fd, wait_time);
-
-       tv_now_mono(&now, &date);
+       tv_update_date(wait_time, status);
  
         for (count = 0; count < status; count++) {
                 int e = epoll_events[count].events;
diff --git a/src/haproxy.c b/src/haproxy.c

index f10e47dc4c6928feed29fae0b72d257fd52a0659..45e48522de3dd210b31b636b8ef09df07f915d25 100644 (file)
--- a/src/haproxy.c
+++ b/src/haproxy.c
@@ -415,7 +415,7 @@ void init(int argc, char **argv)
         global.rlimit_memmax = HAPROXY_MEMMAX;
  #endif
  
-       tv_now_mono(&now, &date);
+       tv_update_date(-1,-1);
         start_date = now;
  
         init_task();
@@ -897,7 +897,7 @@ void run_poll_loop()
  {
         struct timeval next;
  
-       tv_now_mono(&now, &date);
+       tv_update_date(0,1);
         while (1) {
                 process_runnable_tasks(&next);
  
diff --git a/src/proxy.c b/src/proxy.c

index 16804f913f53ff79bc0aedd18829ece21ff7d0f7..a7b4efc1d8c3401c86c491ff821d609bc5fc3768 100644 (file)
--- a/src/proxy.c
+++ b/src/proxy.c
@@ -385,7 +385,7 @@ void soft_stop(void)
  
         stopping = 1;
         p = proxy;
-       tv_now_mono(&now, &date); /* else, the old time before select will be used */
+       tv_update_date(0,1); /* else, the old time before select will be used */
         while (p) {
                 if (p->state != PR_STSTOPPED) {
                         Warning("Stopping proxy %s in %d ms.\n", p->id, p->grace);
@@ -434,7 +434,7 @@ void pause_proxies(void)
  
         err = 0;
         p = proxy;
-       tv_now_mono(&now, &date); /* else, the old time before select will be used */
+       tv_update_date(0,1); /* else, the old time before select will be used */
         while (p) {
                 if (p->state != PR_STERROR &&
                     p->state != PR_STSTOPPED &&
@@ -469,7 +469,7 @@ void listen_proxies(void)
         struct listener *l;
  
         p = proxy;
-       tv_now_mono(&now, &date); /* else, the old time before select will be used */
+       tv_update_date(0,1); /* else, the old time before select will be used */
         while (p) {
                 if (p->state == PR_STPAUSED) {
                         Warning("Enabling proxy %s.\n", p->id);
diff --git a/src/time.c b/src/time.c

index ccb30b2535360f7ff8242537f273e9361b33a6fd..f637f6c78a9eb2756d236c1dccbe70196809ae7f 100644 (file)
--- a/src/time.c
+++ b/src/time.c
@@ -143,25 +143,56 @@ REGPRM2 int _tv_isgt(const struct timeval *tv1, const struct timeval *tv2)
         return __tv_isgt(tv1, tv2);
  }
  
-/* tv_now_mono: sets <date> to the current time (wall clock), <mono> to a value
- * following a monotonic function, and applies any required correction if the
- * time goes backwards. Note that while we could improve it a bit by checking
- * that the new date is not too far in the future, it is not much necessary to
- * do so. 
+/* tv_update_date: sets <date> to system time, and sets <now> to something as
+ * close as possible to real time, following a monotonic function. The main
+ * principle consists in detecting backwards and forwards time jumps and adjusting
+ * an offset to correct them. This function should be called once after each
+ * poll, and never farther apart than MAX_DELAY_MS*2. The poll's timeout should
+ * be passed in <max_wait>, and the return value in <interrupted> (a non-zero
+ * value means that we have not expired the timeout). Calling it with (-1,*)
+ * sets both <date> and <now> to current date, and calling it with (0,1) simply
+ * updates the values.
   */
-REGPRM2 struct timeval *tv_now_mono(struct timeval *mono, struct timeval *wall)
+REGPRM2 void tv_update_date(int max_wait, int interrupted)
  {
-       static struct timeval tv_offset;
-       struct timeval adjusted;
-
-       gettimeofday(wall, NULL);
-       __tv_add(&adjusted, wall, &tv_offset);
-       if (unlikely(__tv_islt(&adjusted, mono))) {
-               __tv_remain(wall, mono, &tv_offset);
-               return mono;
+       static struct timeval tv_offset; /* warning: signed offset! */
+       struct timeval adjusted, deadline;
+
+       gettimeofday(&date, NULL);
+       if (unlikely(max_wait < 0)) {
+               tv_zero(&tv_offset);
+               now = date;
+               return;
         }
-       *mono = adjusted;
-       return mono;
+       __tv_add(&adjusted, &date, &tv_offset);
+       if (unlikely(__tv_islt(&adjusted, &now))) {
+               goto fixup; /* jump in the past */
+       }
+
+       /* OK we did not jump backwards, let's see if we have jumped too far
+        * forwards. The poll value was in <max_wait>, we accept that plus
+        * MAX_DELAY_MS to cover additional time.
+        */
+       _tv_ms_add(&deadline, &now, max_wait + MAX_DELAY_MS);
+       if (unlikely(__tv_isge(&adjusted, &deadline))) {
+               goto fixup; /* jump in the future */
+       }
+       now = adjusted;
+       return;
+ fixup:
+       /* Large jump. If the poll was interrupted, we consider that the date
+        * has not changed (immediate wake-up), otherwise we add the poll
+        * time-out to the previous date. The new offset is recomputed.
+        */
+       if (!interrupted)
+               _tv_ms_add(&now, &now, max_wait);
+       tv_offset.tv_sec  = now.tv_sec  - date.tv_sec;
+       tv_offset.tv_usec = now.tv_usec - date.tv_usec;
+       if (tv_offset.tv_usec < 0) {
+               tv_offset.tv_usec += 1000000;
+               tv_offset.tv_sec--;
+       }
+       return;
  }
  
  char *human_time(int t, short hz_div) {
author	Willy Tarreau <w@1wt.eu>
	Mon, 23 Jun 2008 12:00:57 +0000 (14:00 +0200)
committer	Willy Tarreau <w@1wt.eu>
	Mon, 23 Jun 2008 12:00:57 +0000 (14:00 +0200)
include/common/time.h		patch \| blob \| blame \| history
src/cfgparse.c		patch \| blob \| blame \| history
src/ev_epoll.c		patch \| blob \| blame \| history
src/ev_kqueue.c		patch \| blob \| blame \| history
src/ev_poll.c		patch \| blob \| blame \| history
src/ev_select.c		patch \| blob \| blame \| history
src/ev_sepoll.c		patch \| blob \| blame \| history
src/haproxy.c		patch \| blob \| blame \| history
src/proxy.c		patch \| blob \| blame \| history
src/time.c		patch \| blob \| blame \| history