fio2gnuplot: Print line if int() conversion fails
[fio.git] / tools / plot / fio2gnuplot.py
... / ...
CommitLineData
1#!/usr/bin/python
2#
3# Copyright (C) 2013 eNovance SAS <licensing@enovance.com>
4# Author: Erwan Velu <erwan@enovance.com>
5#
6# The license below covers all files distributed with fio unless otherwise
7# noted in the file itself.
8#
9# This program is free software; you can redistribute it and/or modify
10# it under the terms of the GNU General Public License version 2 as
11# published by the Free Software Foundation.
12#
13# This program is distributed in the hope that it will be useful,
14# but WITHOUT ANY WARRANTY; without even the implied warranty of
15# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16# GNU General Public License for more details.
17#
18# You should have received a copy of the GNU General Public License
19# along with this program; if not, write to the Free Software
20# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
21
22import os
23import fnmatch
24import sys
25import getopt
26import re
27import math
28import shutil
29
def find_file(path, pattern):
    """Return the names of the entries of *path* that match *pattern*.

    The pattern is a shell-style wildcard evaluated with fnmatch against
    the bare entry names returned by os.listdir(); the result keeps the
    listing order.
    """
    return [entry for entry in os.listdir(path)
            if fnmatch.fnmatch(entry, pattern)]
40
def generate_gnuplot_script(fio_data_file,title,gnuplot_output_filename,gnuplot_output_dir,mode,disk_perf,gpm_dir):
    """Write the gnuplot driver scripts for the selected fio traces.

    Creates '<gnuplot_output_dir>mygraph' holding one graph2D.gpm call per
    trace and, when at least two traces are selected, a graph3D.gpm call
    plus three 'compare-<name>-2D{raw,smooth,trend}.gnuplot' scripts that
    overlay every trace on a single graph.

    fio_data_file           -- list of fio log file names
    title                   -- title used in the generated graphs
    gnuplot_output_filename -- basename of the aggregated output
    gnuplot_output_dir      -- directory prefix (used as-is, so it must
                               end with a path separator)
    mode                    -- label of the Y axis
    disk_perf               -- per-trace list of values; disk_perf[i]
                               belongs to fio_data_file[i]
    gpm_dir                 -- directory holding the .gpm files
    """
    print("Generating rendering scripts")

    # Plotting 3D or comparing graphs is only meaningful with at least 2 traces
    compare_traces = len(fio_data_file) > 1
    common_filename = gnuplot_output_dir + 'compare.gnuplot'
    # (open script, gnuplot plotting style) for each kind of compare graph
    compare_scripts = []

    graph_script = open(gnuplot_output_dir + 'mygraph', 'w')
    try:
        if compare_traces:
            graph_script.write("call '%s/graph3D.gpm' '%s' '%s' '' '%s' '%s'\n" % (gpm_dir,title,gnuplot_output_filename,gnuplot_output_filename,mode))

            # Header shared by every kind of compare graph
            with open(common_filename, 'w') as compare:
                compare.write('''
set title '%s'
set terminal png size 1280,1024
set ytics axis out auto
set key top left reverse
set xlabel "Time (Seconds)"
set ylabel '%s'
set xrange [0:]
set yrange [0:]
''' % (title,mode))

            # Each kind starts from the common header and gets its own output
            for kind, style in (("raw", "with linespoints"),
                                ("smooth", "smooth csplines"),
                                ("trend", "smooth bezier")):
                compare_basename = "compare-%s-2D%s" % (gnuplot_output_filename, kind)
                script_path = gnuplot_output_dir + compare_basename + ".gnuplot"
                shutil.copy(common_filename, script_path)
                script = open(script_path, 'a')
                compare_scripts.append((script, style))
                script.write("set output '%s.png'\n" % compare_basename)

        for pos, data_file in enumerate(fio_data_file):
            tmp_filename = "gnuplot_temp_file.%d" % pos

            # The first trace opens the plot command, the next ones extend
            # it through a gnuplot line continuation. compare_scripts is
            # empty when there is a single trace, so nothing is written.
            if pos == 0:
                prefix = "plot "
            else:
                prefix = ",\\\n"
            for script, style in compare_scripts:
                script.write("%s'%s' using 2:3 %s title '%s'" % (prefix, tmp_filename, style, data_file))

            png_file = data_file.replace('.log','')
            raw_filename = "%s-2Draw" % (png_file)
            smooth_filename = "%s-2Dsmooth" % (png_file)
            trend_filename = "%s-2Dtrend" % (png_file)
            avg = average(disk_perf[pos])
            graph_script.write("call '%s/graph2D.gpm' '%s' '%s' '%s' '%s' '%s' '%s' '%s' '%f'\n" % (gpm_dir,title,tmp_filename,data_file,raw_filename,mode,smooth_filename,trend_filename,avg))

        if compare_traces:
            # The common header has been copied everywhere it was needed
            os.remove(common_filename)
    finally:
        # Release every handle even if one of the steps above failed
        for script, _ in compare_scripts:
            script.close()
        graph_script.close()
111
def generate_gnuplot_math_script(title,gnuplot_output_filename,mode,average,gnuplot_output_dir,gpm_dir):
    """Append one math.gpm call to '<gnuplot_output_dir>mymath'.

    title                   -- title of the graph
    gnuplot_output_filename -- data file name, written twice in the call
    mode                    -- label of the Y axis
    average                 -- value appended unquoted as last argument
    gnuplot_output_dir      -- directory prefix of the 'mymath' script
    gpm_dir                 -- directory holding math.gpm

    The script is opened in append mode, so successive calls accumulate.
    """
    # The context manager closes the script even if the write fails
    with open(gnuplot_output_dir + 'mymath', 'a') as script:
        script.write("call '%s/math.gpm' '%s' '%s' '' '%s' '%s' %s\n" % (gpm_dir,title,gnuplot_output_filename,gnuplot_output_filename,mode,average))
117
def compute_aggregated_file(fio_data_file, gnuplot_output_filename, gnuplot_output_dir):
    """Concatenate the per-trace temporary files into one data file.

    For every entry of fio_data_file, the matching
    '<gnuplot_output_dir>gnuplot_temp_file.<index>' is copied into
    '<gnuplot_output_dir><gnuplot_output_filename>', preceded by a comment
    naming the originating fio file and followed by an empty line.
    """
    print("Processing data file 2/2")

    with open(gnuplot_output_dir + gnuplot_output_filename, "w") as aggregated:
        for index, source_name in enumerate(fio_data_file):
            tmp_filename = "%sgnuplot_temp_file.%d" % (gnuplot_output_dir, index)
            # Only one temporary file is open at a time, so the number of
            # traces is not bounded by the file descriptor limit
            with open(tmp_filename, 'r') as temp_file:
                # Let's add some information
                aggregated.write("# Disk%d was coming from %s\n" % (index, source_name))
                aggregated.write(temp_file.read())
                aggregated.write("\n")
139
def average(s):
    """Return the arithmetic mean of the numbers in *s* as a float.

    An empty sequence raises ZeroDivisionError.
    """
    total = sum(s)
    count = len(s)
    # Multiplying by 1.0 forces a floating point division on integers
    return total * 1.0 / count
141
def compute_temp_file(fio_data_file,disk_perf,gnuplot_output_dir):
    """Convert the fio logs into per-trace gnuplot temporary files.

    Every file of fio_data_file is read line by line, all files advancing
    in lockstep. Each line is expected to hold four comma or space
    separated fields: time (msec), value, an unused field and the block
    size. For trace number i the samples are written to
    '<gnuplot_output_dir>gnuplot_temp_file.<i>' as
    '<i> <time in seconds> <value>' and the values are appended to
    disk_perf[i] (one empty list per trace is appended to disk_perf first).

    Returns the first non-zero block size found, or 0 if none was found.
    Exits with status 1 if a block size cannot be converted to an integer.
    """
    print("Processing data file 1/2")
    files=[]
    temp_outfile=[]
    blk_size=0
    try:
        for pos, log_name in enumerate(fio_data_file):
            files.append(open(log_name))
            tmp_filename = "%sgnuplot_temp_file.%d" % (gnuplot_output_dir,pos)
            gnuplot_file=open(tmp_filename,'w')
            temp_outfile.append(gnuplot_file)
            gnuplot_file.write("#Temporary file based on file %s\n" % log_name)
            disk_perf.append([])

        nb_files=len(files)
        # Without any input the "all files are exhausted" condition can
        # never trigger, so the reading loop must not be entered at all
        while nb_files > 0:
            current_line=[]
            nb_empty_files=0
            all_exhausted=False
            for log in files:
                fields=log.readline().replace(',',' ').split()
                if not fields:
                    # This trace has no more data: use a placeholder
                    # sample whose time is -1
                    nb_empty_files+=1
                    fields=["-1", "0", "0", "0"]

                if nb_empty_files == nb_files:
                    all_exhausted=True
                    break

                current_line.append(fields)

            if all_exhausted:
                break

            # NOTE(review): index only moves forward for the samples that
            # are kept, so traces whose timestamps cross the 500 msec limit
            # on different lines would be attributed to the wrong disk -
            # confirm against the original indentation.
            index=0
            perfs=[]
            for line in current_line:
                timestamp, perf, _, block_size = line
                if blk_size == 0:
                    try:
                        blk_size=int(block_size)
                    except ValueError:
                        print("Error while reading the following line :")
                        print(line)
                        sys.exit(1)

                # We ignore the first 500msec as it doesn't seem to be part of the real benchmark
                # Time < 500 usually reports BW=0 breaking the min computing
                if int(timestamp) > 500 or int(timestamp) == -1:
                    disk_perf[index].append(int(perf))
                    perfs.append((timestamp, perf))
                    index = index + 1

            # If we reach this point, it means that all the traces are coherent
            for slot, (perf_time, perf) in enumerate(perfs):
                # Placeholder samples of exhausted traces are not plotted
                if perf_time != "-1":
                    temp_outfile[slot].write("%s %.2f %s\n" % (slot, float(perf_time)/1000, perf))
    finally:
        # Close everything, including when leaving through sys.exit()
        for handle in files:
            handle.close()
        for handle in temp_outfile:
            handle.close()
    return blk_size
208
def compute_math(fio_data_file, title,gnuplot_output_filename,gnuplot_output_dir,mode,disk_perf,gpm_dir):
    """Compute per-disk and global statistics and write them to disk.

    Writes '<dir><name>.average', '.min', '.max' and '.stddev' (one
    '<disk index> <value>' line per trace, after a 'DiskName <mode>'
    header) and '<dir><name>.global' (min, max, avg, stddev, values_count
    and disks_count over every trace). Then recreates the 'mymath' gnuplot
    script with one math.gpm call per statistic.

    disk_perf[i] is the list of values of fio_data_file[i]; an empty list
    makes average()/min()/max() raise.
    """
    print("Computing Maths")
    global_min=[]
    global_max=[]
    basename = gnuplot_output_dir + gnuplot_output_filename

    opened = []
    try:
        for suffix in ('.average', '.min', '.max', '.stddev', '.global'):
            opened.append(open(basename + suffix, 'w'))
        average_file, min_file, max_file, stddev_file, global_file = opened

        for stat_file in (min_file, max_file, average_file, stddev_file):
            stat_file.write('DiskName %s\n' % mode)

        for disk in range(len(fio_data_file)):
            for stat_file in (min_file, max_file, average_file, stddev_file):
                stat_file.write("# Disk%d was coming from %s\n" % (disk,fio_data_file[disk]))
            avg = average(disk_perf[disk])
            # A real list is needed: average() calls len() on its argument
            variance = [(x - avg)**2 for x in disk_perf[disk]]
            standard_deviation = math.sqrt(average(variance))
            average_file.write('%d %d\n' % (disk, avg))
            stddev_file.write('%d %d\n' % (disk, standard_deviation))
            local_min=min(disk_perf[disk])
            local_max=max(disk_perf[disk])
            min_file.write('%d %d\n' % (disk, local_min))
            max_file.write('%d %d\n' % (disk, local_max))
            global_min.append(int(local_min))
            global_max.append(int(local_max))

        # Flatten the per-disk values to compute the global statistics
        global_disk_perf = [value for per_disk in disk_perf for value in per_disk]
        avg = average(global_disk_perf)
        variance = [(x - avg)**2 for x in global_disk_perf]
        standard_deviation = math.sqrt(average(variance))

        global_file.write('min=%.2f\n' % min(global_disk_perf))
        global_file.write('max=%.2f\n' % max(global_disk_perf))
        global_file.write('avg=%.2f\n' % avg)
        global_file.write('stddev=%.2f\n' % standard_deviation)
        global_file.write('values_count=%d\n' % len(global_disk_perf))
        global_file.write('disks_count=%d\n' % len(fio_data_file))
    finally:
        # Release every handle even if a computation above failed
        for handle in opened:
            handle.close()

    # generate_gnuplot_math_script() appends, so start from a fresh script;
    # a missing 'mymath' is the normal case on a first run
    try:
        os.remove(gnuplot_output_dir+'mymath')
    except OSError:
        pass

    generate_gnuplot_math_script("Average values of "+title,gnuplot_output_filename+'.average',mode,int(avg),gnuplot_output_dir,gpm_dir)
    generate_gnuplot_math_script("Min values of "+title,gnuplot_output_filename+'.min',mode,average(global_min),gnuplot_output_dir,gpm_dir)
    generate_gnuplot_math_script("Max values of "+title,gnuplot_output_filename+'.max',mode,average(global_max),gnuplot_output_dir,gpm_dir)
    generate_gnuplot_math_script("Standard Deviation of "+title,gnuplot_output_filename+'.stddev',mode,int(standard_deviation),gnuplot_output_dir,gpm_dir)
269
def parse_global_files(fio_data_file, global_search):
    """Search the 'name=value' .global files for the requested item.

    Only global_search == "avg" is implemented: for every file the avg
    value is multiplied by its disks_count, and the biggest product is
    printed along with the file it comes from. Any other search prints a
    "not yet implemented" message.

    Reading of a file stops at the first line that is not a single
    'name=value' pair. A value that cannot be converted to a number raises
    ValueError.
    """
    max_result=0
    max_file=''
    for global_name in fio_data_file:
        # Reset for every file so that a file lacking disks_count neither
        # fails nor reuses the count of the previous file
        disks_count=0
        search_value=-1

        with open(global_name) as global_file:
            for line in global_file:
                # We do split the name from the value
                fields=line.split("=")
                if len(fields) != 2 or not fields[0]:
                    break
                name,value=fields

                # disks_count is not a global_search item
                # As we need it for some computation, let's save it
                if name=="disks_count":
                    disks_count=int(value)

                # Let's catch the searched item
                if global_search in name:
                    search_value=float(value)

        # Let's process the avg value by estimating the global bandwidth per file
        # We keep the biggest in memory for reporting
        if global_search == "avg":
            if (disks_count > 0) and (search_value != -1):
                result=disks_count*search_value
                if result > max_result:
                    max_result=result
                    max_file=global_name

    # Let's print the avg output
    if global_search == "avg":
        print("Biggest aggregated value of %s was %2.f in file %s\n" % (global_search, max_result, max_file))
    else:
        print("Global search %s is not yet implemented\n" % global_search)
314
def render_gnuplot(fio_data_file, gnuplot_output_dir):
    """Run gnuplot on the scripts generated in gnuplot_output_dir.

    The compare scripts (*.gnuplot) are only rendered when more than one
    trace is selected; 'mymath' and 'mygraph' are always rendered. Each
    step is a shell command run through os.system() from inside the
    output directory. Exits with status 1 if any step raises.
    """
    print("Running gnuplot Rendering")
    try:
        # (progress message, shell command template) in execution order
        steps = []
        if len(fio_data_file) > 1:
            # Let's render all the compared files if some
            steps.append((" |-> Rendering comparing traces",
                          "cd %s; for i in *.gnuplot; do gnuplot $i; done"))
        steps.append((" |-> Rendering math traces", "cd %s; gnuplot mymath"))
        steps.append((" |-> Rendering 2D & 3D traces", "cd %s; gnuplot mygraph"))

        for message, command in steps:
            print(message)
            os.system(command % gnuplot_output_dir)

        if gnuplot_output_dir != "./":
            name_of_directory = gnuplot_output_dir
        else:
            name_of_directory = "the current"
        print("\nRendering traces are available in %s directory" % name_of_directory)
    except:
        print("Could not run gnuplot on mymath or mygraph !\n")
        sys.exit(1)
334
def print_help():
    """Print the command line usage of fio2gnuplot on standard output."""
    usage_lines = (
        'fio2gnuplot.py -ghbiod -t <title> -o <outputfile> -p <pattern> -G <type>',
        '',
        '-h --help : Print this help',
        '-p <pattern> or --pattern <pattern> : A pattern in regexp to select fio input files',
        '-b or --bandwidth : A predefined pattern for selecting *_bw.log files',
        '-i or --iops : A predefined pattern for selecting *_iops.log files',
        '-g or --gnuplot : Render gnuplot traces before exiting',
        '-o or --outputfile <file> : The basename for gnuplot traces',
        ' - Basename is set with the pattern if defined',
        '-d or --outputdir <dir> : The directory where gnuplot shall render files',
        '-t or --title <title> : The title of the gnuplot traces',
        ' - Title is set with the block size detected in fio traces',
        '-G or --Global <type> : Search for <type> in .global files match by a pattern',
        ' - Available types are : min, max, avg, stddev',
        ' - The .global extension is added automatically to the pattern',
    )
    for usage_line in usage_lines:
        print(usage_line)
351
def main(argv):
    """Parse the command line and drive the fio to gnuplot conversion.

    argv is the full argument vector, program name included. Input files
    are searched in the current directory with the selected pattern. With
    -G the matching .global files are searched for the requested item;
    otherwise the temporary, aggregated and math files as well as the
    gnuplot scripts are generated, and gnuplot is run when -g is given.

    Exit statuses: 3 when no gpm files are installed, 2 on an invalid
    option, 1 after printing the help or when no input file matches.
    Returns None on success.
    """
    mode='unknown'
    pattern=''
    pattern_set_by_user=False
    title='No title'
    gnuplot_output_filename='result'
    gnuplot_output_dir='./'
    gpm_dir="/usr/share/fio/"
    disk_perf=[]
    run_gnuplot=False
    parse_global=False
    global_search=''

    if not os.path.isfile(gpm_dir+'math.gpm'):
        gpm_dir="/usr/local/share/fio/"
        if not os.path.isfile(gpm_dir+'math.gpm'):
            print("Looks like fio didn't got installed properly as no gpm files found in '/usr/share/fio' or '/usr/local/share/fio'\n")
            sys.exit(3)

    # The long names must be declared to getopt, otherwise the long forms
    # tested below (and documented by print_help) are always rejected
    long_options=["gnuplot","help","bandwidth","iops","outputfile=","outputdir=","title=","pattern=","Global="]
    try:
        opts, _ = getopt.getopt(argv[1:],"ghbio:d:t:p:G:",long_options)
    except getopt.GetoptError:
        print_help()
        sys.exit(2)

    for opt, arg in opts:
        if opt in ("-b", "--bandwidth"):
            pattern='*_bw.log'
        elif opt in ("-i", "--iops"):
            pattern='*_iops.log'
        elif opt in ("-p", "--pattern"):
            pattern_set_by_user=True
            pattern=arg.replace('\\','')
        elif opt in ("-o", "--outputfile"):
            gnuplot_output_filename=arg
        elif opt in ("-d", "--outputdir"):
            gnuplot_output_dir=arg
            # The directory is used as a plain string prefix everywhere
            if not gnuplot_output_dir.endswith('/'):
                gnuplot_output_dir=gnuplot_output_dir+'/'
            if not os.path.exists(gnuplot_output_dir):
                os.makedirs(gnuplot_output_dir)
        elif opt in ("-t", "--title"):
            title=arg
        elif opt in ("-g", "--gnuplot"):
            run_gnuplot=True
        elif opt in ("-G", "--Global"):
            parse_global=True
            global_search=arg
        elif opt in ("-h", "--help"):
            print_help()
            sys.exit(1)

    # Adding .global extension to the pattern, unless it is already there
    if parse_global and not pattern.endswith('.global'):
        pattern = pattern+'.global'

    fio_data_file=find_file('.',pattern)
    if not fio_data_file:
        print("No log file found with pattern %s!" % pattern)
        sys.exit(1)
    else:
        print("%d files Selected with pattern '%s'" % (len(fio_data_file), pattern))

    fio_data_file=sorted(fio_data_file, key=str.lower)
    for data_file in fio_data_file:
        print(' |-> %s' % data_file)
        if "_bw.log" in data_file:
            mode="Bandwidth (KB/sec)"
        if "_iops.log" in data_file:
            mode="IO per Seconds (IO/sec)"
    if (title == 'No title') and (mode != 'unknown'):
        if "Bandwidth" in mode:
            title='Bandwidth benchmark with %d fio results' % len(fio_data_file)
        if "IO" in mode:
            title='IO benchmark with %d fio results' % len(fio_data_file)

    print("")
    # We need to adjust the output filename regarding the pattern required by the user
    if pattern_set_by_user:
        gnuplot_output_filename=pattern
        # As the pattern holds wildcards, strip the simplest parts of the
        # expression to get a clean file name
        gnuplot_output_filename=gnuplot_output_filename.replace('-*-','-')
        gnuplot_output_filename=gnuplot_output_filename.replace('*','-')
        gnuplot_output_filename=gnuplot_output_filename.replace('--','-')
        gnuplot_output_filename=gnuplot_output_filename.replace('.log','')
        # Ensure that we don't have any leading or trailing dash in the filename
        if gnuplot_output_filename.endswith('-'):
            gnuplot_output_filename=gnuplot_output_filename[:-1]
        if gnuplot_output_filename.startswith('-'):
            gnuplot_output_filename=gnuplot_output_filename[1:]

    if parse_global:
        parse_global_files(fio_data_file, global_search)
    else:
        blk_size=compute_temp_file(fio_data_file,disk_perf,gnuplot_output_dir)
        # Integer division keeps the title identical whatever the interpreter
        title="%s @ Blocksize = %dK" % (title,blk_size//1024)
        compute_aggregated_file(fio_data_file, gnuplot_output_filename, gnuplot_output_dir)
        compute_math(fio_data_file,title,gnuplot_output_filename,gnuplot_output_dir,mode,disk_perf,gpm_dir)
        generate_gnuplot_script(fio_data_file,title,gnuplot_output_filename,gnuplot_output_dir,mode,disk_perf,gpm_dir)

        if run_gnuplot:
            render_gnuplot(fio_data_file, gnuplot_output_dir)

        # Cleaning temporary files
        # NOTE(review): os.remove() does not expand wildcards, so this only
        # removes a file literally named 'gnuplot_temp_file.*' and the real
        # temporary files are kept. This is deliberately left unchanged:
        # the generated 'mygraph' script refers to these files, so deleting
        # them would break a later manual gnuplot run - confirm the intent.
        try:
            os.remove('gnuplot_temp_file.*')
        except OSError:
            pass
461
# Script entry point: the value returned by main() becomes the exit status
if __name__ == "__main__":
    exit_status = main(sys.argv)
    sys.exit(exit_status)