steadystate: cleanups
[fio.git] / steadystate.c
index e0dcc22e465c68f80bfeef71704415c0077cdfae..6cd7c13f19a83694a98908aadbc05d25fb380cbf 100644 (file)
@@ -1,8 +1,12 @@
+#include <stdlib.h>
+
 #include "fio.h"
 #include "steadystate.h"
 #include "helper_thread.h"
 
-void steadystate_setup()
+bool steadystate = false;
+
+void steadystate_setup(void)
 {
        int i, prev_groupid;
        struct thread_data *td, *prev_td;
@@ -18,22 +22,139 @@ void steadystate_setup()
        prev_groupid = -1;
        prev_td = NULL;
        for_each_td(td, i) {
-               if (!td->o.group_reporting)
+               if (td->ts.ss == NULL)
                        continue;
 
+               if (!td->o.group_reporting) {
+                       steadystate_alloc(td);
+                       continue;
+               }
+
                if (prev_groupid != td->groupid) {
-                       if (prev_td != NULL)
+                       if (prev_td != NULL) {
                                prev_td->ss.last_in_group = 1;
+                               steadystate_alloc(prev_td);
+                       }
                        prev_groupid = td->groupid;
                }
                prev_td = td;
        }
 
-       if (prev_td != NULL && prev_td->o.group_reporting)
+       if (prev_td != NULL && prev_td->o.group_reporting) {
                prev_td->ss.last_in_group = 1;
+               steadystate_alloc(prev_td);
+       }
+}
+
+/*
+ * Allocate td's bandwidth/IOPS sample arrays (td->ss.dur entries each).
+ * calloc() zero-fills them so an unfilled cache is obvious in the output
+ * and rejects an overflowing size; on failure the pointers are left NULL.
+ */
+void steadystate_alloc(struct thread_data *td)
+{
+       td->ss.bw_data = calloc(td->ss.dur, sizeof(unsigned long));
+       td->ss.iops_data = calloc(td->ss.dur, sizeof(unsigned long));
+}
+
+/*
+ * Slope criterion. Records the new sample and, once ss->dur samples are held,
+ * fits a least-squares line to the checked series (IOPS or bandwidth). Returns
+ * true when |slope|, as a percentage of the mean if ss->pct, is below ss->limit.
+ */
+static bool steadystate_slope(unsigned long iops, unsigned long bw,
+                             struct thread_data *td)
+{
+       int i, j;
+       struct steadystate_data *ss = &td->ss;
+       unsigned long new_val = ss->check_iops ? iops : bw;
+
+       ss->bw_data[ss->tail] = bw;
+       ss->iops_data[ss->tail] = iops;
+
+       if (ss->tail < ss->head || (ss->tail - ss->head == ss->dur - 1)) {
+               if (ss->sum_y == 0) {   /* first time through */
+                       for (i = 0; i < ss->dur; i++) {
+                               ss->sum_y += ss->check_iops ? ss->iops_data[i] : ss->bw_data[i];
+                               j = (ss->head + i) % ss->dur;   /* i-th oldest sample */
+                               ss->sum_xy += (ss->check_iops ? ss->iops_data[j] : ss->bw_data[j]) * i;
+                       }
+               } else {                /* easy to update the sums */
+                       ss->sum_y -= ss->oldest_y;
+                       ss->sum_y += new_val;
+                       ss->sum_xy = ss->sum_xy - ss->sum_y + ss->dur * new_val;
+               }
+
+               ss->oldest_y = ss->check_iops ? ss->iops_data[ss->head] : ss->bw_data[ss->head];
+
+               /*
+                * calculate slope as (sum_xy - sum_x * sum_y / n) / (sum_(x^2) - (sum_x)^2 / n)
+                * This code assumes that all x values are equally spaced when they are often
+                * off by a few milliseconds, which greatly simplifies the calculations. The
+                * mean is a floating-point division: integer sum_y / dur would truncate it.
+                */
+               ss->slope = (ss->sum_xy - (double) ss->sum_x * ss->sum_y / ss->dur) / (ss->sum_x_sq - (double) ss->sum_x * ss->sum_x / ss->dur);
+               ss->criterion = ss->pct ? 100.0 * ss->slope / ((double) ss->sum_y / ss->dur) : ss->slope;
+
+               dprint(FD_STEADYSTATE, "sum_y: %llu, sum_xy: %llu, slope: %f, criterion: %f, limit: %f\n", ss->sum_y, ss->sum_xy, ss->slope, ss->criterion, ss->limit);
+
+               if ((ss->criterion < 0.0 ? -ss->criterion : ss->criterion) < ss->limit)
+                       return true;
+       }
+
+       ss->tail = (ss->tail + 1) % ss->dur;
+       if (ss->tail <= ss->head)
+               ss->head = (ss->head + 1) % ss->dur;
+
+       return false;
+}
 
-void steadystate_check()
+/*
+ * Deviation criterion: record the sample and, once ss->dur samples are held,
+ * return true when the largest distance of any sample from the window mean
+ * (as a percentage of that mean if ss->pct) is below ss->limit.
+ */
+static bool steadystate_deviation(unsigned long iops, unsigned long bw,
+                                 struct thread_data *td)
+{
+       struct steadystate_data *ss = &td->ss;
+       double avg, delta;
+       int k;
+
+       ss->iops_data[ss->tail] = iops;
+       ss->bw_data[ss->tail] = bw;
+
+       if (ss->tail < ss->head || (ss->tail - ss->head == ss->dur - 1)) {
+               if (ss->sum_y != 0) {   /* drop the oldest sample, add the newest */
+                       ss->sum_y -= ss->oldest_y;
+                       ss->sum_y += ss->check_iops ? ss->iops_data[ss->tail] : ss->bw_data[ss->tail];
+               } else {                /* no running sum yet: total the window */
+                       for (k = 0; k < ss->dur; k++)
+                               ss->sum_y += ss->check_iops ? ss->iops_data[k] : ss->bw_data[k];
+               }
+
+               ss->oldest_y = ss->check_iops ? ss->iops_data[ss->head] : ss->bw_data[ss->head];
+               avg = (double) ss->sum_y / ss->dur;
+               ss->deviation = 0.0;
+               for (k = 0; k < ss->dur; k++) {
+                       delta = (double) (ss->check_iops ? ss->iops_data[k] : ss->bw_data[k]) - avg;
+                       ss->deviation = max(ss->deviation, (delta < 0.0 ? -delta : delta));
+               }
+
+               ss->criterion = ss->pct ? 100.0 * ss->deviation / avg : ss->deviation;
+               dprint(FD_STEADYSTATE, "sum_y: %llu, mean: %f, max diff: %f, objective: %f, limit: %f\n", ss->sum_y, avg, ss->deviation, ss->criterion, ss->limit);
+
+               if (ss->criterion < ss->limit)
+                       return true;
+       }
+
+       ss->tail = (ss->tail + 1) % ss->dur;
+       if (ss->tail <= ss->head)
+               ss->head = (ss->head + 1) % ss->dur;
+       return false;
+}
+
+void steadystate_check(void)
 {
        int i, j, ddir, prev_groupid, group_ramp_time_over = 0;
        unsigned long rate_time;
@@ -42,6 +163,7 @@ void steadystate_check()
        unsigned long group_bw = 0, group_iops = 0;
        unsigned long long td_iops;
        unsigned long long td_bytes;
+       bool ret;
 
        prev_groupid = -1;
        for_each_td(td, i) {
@@ -62,7 +184,7 @@ void steadystate_check()
 
                fio_gettime(&now, NULL);
                if (ss->ramp_time && !ss->ramp_time_over)
-                       /* 
+                       /*
                         * Begin recording data one second after ss->ramp_time
                         * has elapsed
                         */
@@ -79,7 +201,7 @@ void steadystate_check()
                rate_time = mtime_since(&ss->prev_time, &now);
                memcpy(&ss->prev_time, &now, sizeof(now));
 
-               /* 
+               /*
                 * Begin monitoring when job starts but don't actually use
                 * data in checking stopping criterion until ss->ramp_time is
                 * over. This ensures that we will have a sane value in
@@ -88,7 +210,7 @@ void steadystate_check()
                 */
                if (ss->ramp_time_over) {
                        group_bw += 1000 * (td_bytes - ss->prev_bytes) / rate_time;
-                       group_iops += 1000 * (td_iops - ss->prev_iops) / rate_time;
+                       group_iops += 1000 * (td_iops - ss->prev_iops) / rate_time;
                        ++group_ramp_time_over;
                }
                ss->prev_iops = td_iops;
@@ -101,19 +223,23 @@ void steadystate_check()
                if (!group_ramp_time_over)
                        continue;
 
-               dprint(FD_STEADYSTATE, "steadystate_check() thread: %d, groupid: %u, rate_msec: %ld, iops: %lu, bw: %lu, head: %d, tail: %d\n", 
+               dprint(FD_STEADYSTATE, "steadystate_check() thread: %d, groupid: %u, rate_msec: %ld, iops: %lu, bw: %lu, head: %d, tail: %d\n",
                        i, td->groupid, rate_time, group_iops, group_bw, ss->head, ss->tail);
 
-               if (ss->evaluate(group_iops, group_bw, td))
-               {
-                       if (td->o.group_reporting)
+               if (steadystate_check_slope(&td->o))
+                       ret = steadystate_slope(group_iops, group_bw, td);
+               else
+                       ret = steadystate_deviation(group_iops, group_bw, td);
+
+               if (ret) {
+                       if (td->o.group_reporting) {
                                for_each_td(td2, j) {
                                        if (td2->groupid == td->groupid) {
                                                td2->ss.attained = 1;
                                                fio_mark_td_terminate(td2);
                                        }
                                }
-                       else {
+                       else {
                                ss->attained = 1;
                                fio_mark_td_terminate(td);
                        }
@@ -121,100 +247,4 @@ void steadystate_check()
        }
 }
 
-bool steadystate_slope(unsigned long iops, unsigned long bw, struct thread_data *td)
-{
-       int i, x;
-       double result;
-       double slope;
-       struct steadystate_data *ss = &td->ss;
-
-       ss->cache[ss->tail] = ss->check_iops ? iops : bw;
-
-       if (ss->tail < ss->head || (ss->tail - ss->head == ss->dur - 1))
-       {
-               if (ss->sum_y == 0)     /* first time through */
-               {
-                       for(i = 0; i < ss->dur; i++)
-                       {
-                               ss->sum_y += ss->cache[i];
-                               x = ss->head + i;
-                               if (x >= ss->dur)
-                                       x -= ss->dur;
-                               ss->sum_xy += ss->cache[x] * i;
-                       }
-               } else {                /* easy to update the sums */
-                       ss->sum_y -= ss->oldest_y;
-                       ss->sum_y += ss->cache[ss->tail];
-                       ss->sum_xy = ss->sum_xy - ss->sum_y + ss->dur * ss->cache[ss->tail];
-               }
 
-               ss->oldest_y = ss->cache[ss->head];
-
-               /*
-                * calculate slope as (sum_xy - sum_x * sum_y / n) / (sum_(x^2) - (sum_x)^2 / n)
-                * This code assumes that all x values are equally spaced when they are often
-                * off by a few milliseconds. This assumption greatly simplifies the
-                * calculations.
-                */
-               slope = (ss->sum_xy - (double) ss->sum_x * ss->sum_y / ss->dur) / (ss->sum_x_sq - (double) ss->sum_x * ss->sum_x / ss->dur);
-               ss->criterion = ss->pct ? slope / (ss->sum_y / ss->dur) * 100.0: slope;
-
-               dprint(FD_STEADYSTATE, "sum_y: %llu, sum_xy: %llu, slope: %f, criterion: %f, limit: %f\n",
-                       ss->sum_y, ss->sum_xy, slope, ss->criterion, ss->limit);
-
-               result = ss->criterion * (ss->criterion < 0.0 ? -1 : 1);
-               if (result < ss->limit)
-                       return true;
-       }
-
-       ss->tail = (ss->tail + 1) % ss->dur;
-       if (ss->tail <= ss->head)
-               ss->head = (ss->head + 1) % ss->dur;
-       return false;
-}
-
-bool steadystate_deviation(unsigned long iops, unsigned long bw, struct thread_data *td)
-{
-       int i;
-       double diff;
-       double mean;
-       double deviation;
-
-       struct steadystate_data *ss = &td->ss;
-
-       ss->cache[ss->tail] = ss->check_iops ? iops : bw;
-
-       if (ss->tail < ss->head || (ss->tail - ss->head == ss->dur - 1))
-       {
-               if (ss->sum_y == 0)     /* first time through */
-               {
-                       for(i = 0; i < ss->dur; i++)
-                               ss->sum_y += ss->cache[i];
-               } else {                /* easy to update the sum */
-                       ss->sum_y -= ss->oldest_y;
-                       ss->sum_y += ss->cache[ss->tail];
-               }
-
-               ss->oldest_y = ss->cache[ss->head];
-               mean = (double) ss->sum_y / ss->dur;
-               deviation = 0.0;
-
-               for (i = 0; i < ss->dur; i++)
-               {       
-                       diff = (double) ss->cache[i] - mean;
-                       deviation = max(deviation, diff * (diff < 0.0 ? -1 : 1));
-               }
-
-               ss->criterion = ss->pct ? deviation / mean * 100.0 : deviation;
-
-               dprint(FD_STEADYSTATE, "sum_y: %llu, mean: %f, max diff: %f, objective: %f, limit: %f\n", ss->sum_y, mean, deviation, ss->criterion, ss->limit);
-
-               if (ss->criterion < ss->limit)
-                       return true;
-       }
-
-       ss->tail = (ss->tail + 1) % ss->dur;
-       if (ss->tail <= ss->head)
-               ss->head = (ss->head + 1) % ss->dur;
-       return false;
-}