Commit | Line | Data |
---|---|---|
ba8fb6f6 VF |
1 | #include <stdlib.h> |
2 | ||
16e56d25 VF |
3 | #include "fio.h" |
4 | #include "steadystate.h" | |
5 | #include "helper_thread.h" | |
6 | ||
/*
 * Global switch for steady state detection. td_steadystate_init() sets it
 * to true when a job has a nonzero ss_dur; steadystate_setup() returns
 * without doing anything while it is false.
 */
84784e07 | 7 | bool steadystate_enabled = false; |
4cd5b75b | 8 | |
f0c50c66 JA |
9 | static void steadystate_alloc(struct thread_data *td) |
10 | { | |
11 | int i; | |
12 | ||
13 | td->ss.bw_data = malloc(td->ss.dur * sizeof(unsigned long)); | |
14 | td->ss.iops_data = malloc(td->ss.dur * sizeof(unsigned long)); | |
15 | /* initialize so that it is obvious if the cache is not full in the output */ | |
16 | for (i = 0; i < td->ss.dur; i++) | |
17 | td->ss.iops_data[i] = td->ss.bw_data[i] = 0; | |
18 | } | |
19 | ||
4cd5b75b | 20 | void steadystate_setup(void) |
16e56d25 VF |
21 | { |
22 | int i, prev_groupid; | |
23 | struct thread_data *td, *prev_td; | |
24 | ||
84784e07 | 25 | if (!steadystate_enabled) |
16e56d25 VF |
26 | return; |
27 | ||
28 | /* | |
29 | * if group reporting is enabled, identify the last td | |
30 | * for each group and use it for storing steady state | |
31 | * data | |
32 | */ | |
33 | prev_groupid = -1; | |
34 | prev_td = NULL; | |
35 | for_each_td(td, i) { | |
ba8fb6f6 VF |
36 | if (td->ts.ss == NULL) |
37 | continue; | |
38 | ||
39 | if (!td->o.group_reporting) { | |
40 | steadystate_alloc(td); | |
d685adfb | 41 | td->ss.state |= __FIO_SS_DATA; |
16e56d25 | 42 | continue; |
ba8fb6f6 | 43 | } |
16e56d25 VF |
44 | |
45 | if (prev_groupid != td->groupid) { | |
ba8fb6f6 | 46 | if (prev_td != NULL) { |
ec55e631 | 47 | prev_td->ss.state |= __FIO_SS_DATA; |
ba8fb6f6 VF |
48 | steadystate_alloc(prev_td); |
49 | } | |
16e56d25 VF |
50 | prev_groupid = td->groupid; |
51 | } | |
52 | prev_td = td; | |
53 | } | |
54 | ||
ba8fb6f6 | 55 | if (prev_td != NULL && prev_td->o.group_reporting) { |
ec55e631 | 56 | prev_td->ss.state |= __FIO_SS_DATA; |
ba8fb6f6 VF |
57 | steadystate_alloc(prev_td); |
58 | } | |
59 | } | |
60 | ||
4cd5b75b JA |
61 | static bool steadystate_slope(unsigned long iops, unsigned long bw, |
62 | struct thread_data *td) | |
16e56d25 | 63 | { |
ba8fb6f6 | 64 | int i, j; |
16e56d25 | 65 | double result; |
16e56d25 | 66 | struct steadystate_data *ss = &td->ss; |
7be78a8a | 67 | unsigned long new_val; |
16e56d25 | 68 | |
ba8fb6f6 VF |
69 | ss->bw_data[ss->tail] = bw; |
70 | ss->iops_data[ss->tail] = iops; | |
16e56d25 | 71 | |
5b4b6586 | 72 | if (ss->state & __FIO_SS_IOPS) |
7be78a8a JA |
73 | new_val = iops; |
74 | else | |
75 | new_val = bw; | |
76 | ||
4cd5b75b JA |
77 | if (ss->tail < ss->head || (ss->tail - ss->head == ss->dur - 1)) { |
78 | if (ss->sum_y == 0) { /* first time through */ | |
79 | for(i = 0; i < ss->dur; i++) { | |
5b4b6586 | 80 | if (ss->state & __FIO_SS_IOPS) |
7be78a8a JA |
81 | ss->sum_y += ss->iops_data[i]; |
82 | else | |
83 | ss->sum_y += ss->bw_data[i]; | |
ba8fb6f6 VF |
84 | j = ss->head + i; |
85 | if (j >= ss->dur) | |
86 | j -= ss->dur; | |
5b4b6586 | 87 | if (ss->state & __FIO_SS_IOPS) |
94f218f6 | 88 | ss->sum_xy += i * ss->iops_data[j]; |
7be78a8a | 89 | else |
94f218f6 | 90 | ss->sum_xy += i * ss->bw_data[j]; |
16e56d25 VF |
91 | } |
92 | } else { /* easy to update the sums */ | |
93 | ss->sum_y -= ss->oldest_y; | |
ba8fb6f6 VF |
94 | ss->sum_y += new_val; |
95 | ss->sum_xy = ss->sum_xy - ss->sum_y + ss->dur * new_val; | |
16e56d25 VF |
96 | } |
97 | ||
5b4b6586 | 98 | if (ss->state & __FIO_SS_IOPS) |
7be78a8a JA |
99 | ss->oldest_y = ss->iops_data[ss->head]; |
100 | else | |
101 | ss->oldest_y = ss->bw_data[ss->head]; | |
16e56d25 VF |
102 | |
103 | /* | |
7be78a8a JA |
104 | * calculate slope as (sum_xy - sum_x * sum_y / n) / (sum_(x^2) |
105 | * - (sum_x)^2 / n) This code assumes that all x values are | |
106 | * equally spaced when they are often off by a few milliseconds. | |
107 | * This assumption greatly simplifies the calculations. | |
16e56d25 | 108 | */ |
7be78a8a JA |
109 | ss->slope = (ss->sum_xy - (double) ss->sum_x * ss->sum_y / ss->dur) / |
110 | (ss->sum_x_sq - (double) ss->sum_x * ss->sum_x / ss->dur); | |
e6a6a984 | 111 | if (ss->state & __FIO_SS_PCT) |
7be78a8a JA |
112 | ss->criterion = 100.0 * ss->slope / (ss->sum_y / ss->dur); |
113 | else | |
114 | ss->criterion = ss->slope; | |
16e56d25 | 115 | |
7be78a8a JA |
116 | dprint(FD_STEADYSTATE, "sum_y: %llu, sum_xy: %llu, slope: %f, " |
117 | "criterion: %f, limit: %f\n", | |
118 | ss->sum_y, ss->sum_xy, ss->slope, | |
119 | ss->criterion, ss->limit); | |
16e56d25 | 120 | |
6da94b07 | 121 | result = ss->criterion * (ss->criterion < 0.0 ? -1.0 : 1.0); |
16e56d25 VF |
122 | if (result < ss->limit) |
123 | return true; | |
124 | } | |
125 | ||
126 | ss->tail = (ss->tail + 1) % ss->dur; | |
127 | if (ss->tail <= ss->head) | |
128 | ss->head = (ss->head + 1) % ss->dur; | |
4cd5b75b | 129 | |
16e56d25 VF |
130 | return false; |
131 | } | |
132 | ||
4cd5b75b JA |
133 | static bool steadystate_deviation(unsigned long iops, unsigned long bw, |
134 | struct thread_data *td) | |
16e56d25 VF |
135 | { |
136 | int i; | |
137 | double diff; | |
138 | double mean; | |
16e56d25 VF |
139 | |
140 | struct steadystate_data *ss = &td->ss; | |
141 | ||
ba8fb6f6 VF |
142 | ss->bw_data[ss->tail] = bw; |
143 | ss->iops_data[ss->tail] = iops; | |
16e56d25 | 144 | |
4cd5b75b JA |
145 | if (ss->tail < ss->head || (ss->tail - ss->head == ss->dur - 1)) { |
146 | if (ss->sum_y == 0) { /* first time through */ | |
16e56d25 | 147 | for(i = 0; i < ss->dur; i++) |
5b4b6586 | 148 | if (ss->state & __FIO_SS_IOPS) |
7be78a8a JA |
149 | ss->sum_y += ss->iops_data[i]; |
150 | else | |
151 | ss->sum_y += ss->bw_data[i]; | |
16e56d25 VF |
152 | } else { /* easy to update the sum */ |
153 | ss->sum_y -= ss->oldest_y; | |
5b4b6586 | 154 | if (ss->state & __FIO_SS_IOPS) |
7be78a8a JA |
155 | ss->sum_y += ss->iops_data[ss->tail]; |
156 | else | |
157 | ss->sum_y += ss->bw_data[ss->tail]; | |
16e56d25 VF |
158 | } |
159 | ||
5b4b6586 | 160 | if (ss->state & __FIO_SS_IOPS) |
7be78a8a JA |
161 | ss->oldest_y = ss->iops_data[ss->head]; |
162 | else | |
163 | ss->oldest_y = ss->bw_data[ss->head]; | |
164 | ||
16e56d25 | 165 | mean = (double) ss->sum_y / ss->dur; |
ba8fb6f6 | 166 | ss->deviation = 0.0; |
16e56d25 | 167 | |
4cd5b75b | 168 | for (i = 0; i < ss->dur; i++) { |
5b4b6586 | 169 | if (ss->state & __FIO_SS_IOPS) |
7be78a8a JA |
170 | diff = ss->iops_data[i] - mean; |
171 | else | |
172 | diff = ss->bw_data[i] - mean; | |
6da94b07 | 173 | ss->deviation = max(ss->deviation, diff * (diff < 0.0 ? -1.0 : 1.0)); |
16e56d25 VF |
174 | } |
175 | ||
e6a6a984 | 176 | if (ss->state & __FIO_SS_PCT) |
7be78a8a JA |
177 | ss->criterion = 100.0 * ss->deviation / mean; |
178 | else | |
179 | ss->criterion = ss->deviation; | |
16e56d25 | 180 | |
7be78a8a JA |
181 | dprint(FD_STEADYSTATE, "sum_y: %llu, mean: %f, max diff: %f, " |
182 | "objective: %f, limit: %f\n", | |
183 | ss->sum_y, mean, ss->deviation, | |
184 | ss->criterion, ss->limit); | |
16e56d25 VF |
185 | |
186 | if (ss->criterion < ss->limit) | |
187 | return true; | |
188 | } | |
189 | ||
190 | ss->tail = (ss->tail + 1) % ss->dur; | |
191 | if (ss->tail <= ss->head) | |
192 | ss->head = (ss->head + 1) % ss->dur; | |
4cd5b75b | 193 | |
16e56d25 VF |
194 | return false; |
195 | } | |
4cd5b75b JA |
196 | |
197 | void steadystate_check(void) | |
198 | { | |
199 | int i, j, ddir, prev_groupid, group_ramp_time_over = 0; | |
200 | unsigned long rate_time; | |
201 | struct thread_data *td, *td2; | |
202 | struct timeval now; | |
203 | unsigned long group_bw = 0, group_iops = 0; | |
204 | unsigned long long td_iops; | |
205 | unsigned long long td_bytes; | |
206 | bool ret; | |
207 | ||
208 | prev_groupid = -1; | |
209 | for_each_td(td, i) { | |
210 | struct steadystate_data *ss = &td->ss; | |
211 | ||
7be78a8a | 212 | if (!ss->dur || td->runstate <= TD_SETTING_UP || |
5b4b6586 | 213 | td->runstate >= TD_EXITED || (ss->state & __FIO_SS_ATTAINED)) |
4cd5b75b JA |
214 | continue; |
215 | ||
216 | td_iops = 0; | |
217 | td_bytes = 0; | |
218 | if (!td->o.group_reporting || | |
219 | (td->o.group_reporting && td->groupid != prev_groupid)) { | |
220 | group_bw = 0; | |
221 | group_iops = 0; | |
222 | group_ramp_time_over = 0; | |
223 | } | |
224 | prev_groupid = td->groupid; | |
225 | ||
226 | fio_gettime(&now, NULL); | |
5b4b6586 | 227 | if (ss->ramp_time && !(ss->state & __FIO_SS_RAMP_OVER)) { |
4cd5b75b JA |
228 | /* |
229 | * Begin recording data one second after ss->ramp_time | |
230 | * has elapsed | |
231 | */ | |
232 | if (utime_since(&td->epoch, &now) >= (ss->ramp_time + 1000000L)) | |
5b4b6586 JA |
233 | ss->state |= __FIO_SS_RAMP_OVER; |
234 | } | |
4cd5b75b JA |
235 | |
236 | td_io_u_lock(td); | |
237 | for (ddir = DDIR_READ; ddir < DDIR_RWDIR_CNT; ddir++) { | |
238 | td_iops += td->io_blocks[ddir]; | |
239 | td_bytes += td->io_bytes[ddir]; | |
240 | } | |
241 | td_io_u_unlock(td); | |
242 | ||
243 | rate_time = mtime_since(&ss->prev_time, &now); | |
244 | memcpy(&ss->prev_time, &now, sizeof(now)); | |
245 | ||
246 | /* | |
247 | * Begin monitoring when job starts but don't actually use | |
248 | * data in checking stopping criterion until ss->ramp_time is | |
249 | * over. This ensures that we will have a sane value in | |
250 | * prev_iops/bw the first time through after ss->ramp_time | |
251 | * is done. | |
252 | */ | |
5b4b6586 | 253 | if (ss->state & __FIO_SS_RAMP_OVER) { |
4cd5b75b JA |
254 | group_bw += 1000 * (td_bytes - ss->prev_bytes) / rate_time; |
255 | group_iops += 1000 * (td_iops - ss->prev_iops) / rate_time; | |
256 | ++group_ramp_time_over; | |
257 | } | |
258 | ss->prev_iops = td_iops; | |
259 | ss->prev_bytes = td_bytes; | |
260 | ||
ec55e631 | 261 | if (td->o.group_reporting && !(ss->state & __FIO_SS_DATA)) |
4cd5b75b JA |
262 | continue; |
263 | ||
7be78a8a JA |
264 | /* |
265 | * Don't begin checking criterion until ss->ramp_time is over | |
266 | * for at least one thread in group | |
267 | */ | |
4cd5b75b JA |
268 | if (!group_ramp_time_over) |
269 | continue; | |
270 | ||
7be78a8a JA |
271 | dprint(FD_STEADYSTATE, "steadystate_check() thread: %d, " |
272 | "groupid: %u, rate_msec: %ld, " | |
273 | "iops: %lu, bw: %lu, head: %d, tail: %d\n", | |
274 | i, td->groupid, rate_time, group_iops, | |
275 | group_bw, ss->head, ss->tail); | |
4cd5b75b | 276 | |
f0c50c66 | 277 | if (td->o.ss & __FIO_SS_SLOPE) |
4cd5b75b JA |
278 | ret = steadystate_slope(group_iops, group_bw, td); |
279 | else | |
280 | ret = steadystate_deviation(group_iops, group_bw, td); | |
281 | ||
282 | if (ret) { | |
283 | if (td->o.group_reporting) { | |
284 | for_each_td(td2, j) { | |
285 | if (td2->groupid == td->groupid) { | |
5b4b6586 | 286 | td2->ss.state |= __FIO_SS_ATTAINED; |
4cd5b75b JA |
287 | fio_mark_td_terminate(td2); |
288 | } | |
289 | } | |
290 | } else { | |
5b4b6586 | 291 | ss->state |= __FIO_SS_ATTAINED; |
4cd5b75b JA |
292 | fio_mark_td_terminate(td); |
293 | } | |
294 | } | |
295 | } | |
296 | } | |
297 | ||
56a90eba | 298 | int td_steadystate_init(struct thread_data *td) |
f0c50c66 JA |
299 | { |
300 | struct steadystate_data *ss = &td->ss; | |
301 | struct thread_options *o = &td->o; | |
56a90eba VF |
302 | struct thread_data *td2; |
303 | int j; | |
f0c50c66 JA |
304 | |
305 | memset(ss, 0, sizeof(*ss)); | |
306 | ||
56a90eba VF |
307 | if (o->ss_dur) { |
308 | steadystate_enabled = true; | |
309 | o->ss_dur /= 1000000L; | |
310 | ||
311 | /* put all steady state info in one place */ | |
312 | ss->dur = o->ss_dur; | |
313 | ss->limit = o->ss_limit.u.f; | |
314 | ss->ramp_time = o->ss_ramp_time; | |
f0c50c66 | 315 | |
56a90eba VF |
316 | ss->state = o->ss; |
317 | if (!td->ss.ramp_time) | |
318 | ss->state |= __FIO_SS_RAMP_OVER; | |
4cd5b75b | 319 | |
56a90eba VF |
320 | ss->sum_x = o->ss_dur * (o->ss_dur - 1) / 2; |
321 | ss->sum_x_sq = (o->ss_dur - 1) * (o->ss_dur) * (2*o->ss_dur - 1) / 6; | |
f0c50c66 | 322 | |
56a90eba VF |
323 | td->ts.ss = ss; |
324 | } | |
5b4b6586 | 325 | |
56a90eba VF |
326 | /* make sure that ss options are consistent within reporting group */ |
327 | for_each_td(td2, j) { | |
328 | if (td2->groupid == td->groupid) { | |
329 | struct steadystate_data *ss2 = &td2->ss; | |
330 | ||
331 | if (ss2->dur != ss->dur || | |
332 | ss2->limit != ss->limit || | |
333 | ss2->ramp_time != ss->ramp_time || | |
56a90eba VF |
334 | ss2->state != ss->state || |
335 | ss2->sum_x != ss->sum_x || | |
336 | ss2->sum_x_sq != ss->sum_x_sq) { | |
337 | td_verror(td, EINVAL, "job rejected: steadystate options must be consistent within reporting groups"); | |
338 | return 1; | |
339 | } | |
340 | } | |
341 | } | |
f0c50c66 | 342 | |
56a90eba | 343 | return 0; |
f0c50c66 | 344 | } |
d685adfb VF |
345 | |
346 | unsigned long long steadystate_bw_mean(struct steadystate_data *ss) | |
347 | { | |
348 | int i; | |
349 | unsigned long long sum; | |
350 | ||
351 | for (i = 0, sum = 0; i < ss->dur; i++) | |
352 | sum += ss->bw_data[i]; | |
353 | ||
354 | return sum / ss->dur; | |
355 | } | |
356 | ||
357 | unsigned long long steadystate_iops_mean(struct steadystate_data *ss) | |
358 | { | |
359 | int i; | |
360 | unsigned long long sum; | |
361 | ||
362 | for (i = 0, sum = 0; i < ss->dur; i++) | |
363 | sum += ss->iops_data[i]; | |
364 | ||
365 | return sum / ss->dur; | |
366 | } |