Add support for randomness of any IO direction

[fio.git] / HOWTO
diff --git a/HOWTO b/HOWTO

index f7948c3f1d8e676227374a713a35ccec5bbd9784..8768b99670a1a09e97b748bbfa6e4a6a0cab1a19 100644 (file)
--- a/HOWTO
+++ b/HOWTO
@@ -9,6 +9,7 @@ Table of contents
  6. Normal output
  7. Terse output
  8. Trace file format
+9. CPU idleness profiling
  
  1.0 Overview and history
  ------------------------
@@ -284,6 +285,32 @@ filename=str       Fio normally makes up a filename based on the job name,
                 stdin or stdout. Which of the two depends on the read/write
                 direction set.
  
+filename_format=str
+               If sharing multiple files between jobs, it is usually necessary
+               to  have fio generate the exact names that you want. By default,
+               fio will name a file based on the default file format
+               specification of jobname.jobnumber.filenumber. With this
+               option, that can be customized. Fio will recognize and replace
+               the following keywords in this string:
+
+               $jobname
+                       The name of the worker thread or process.
+
+               $jobnum
+                       The incremental number of the worker thread or
+                       process.
+
+               $filenum
+                       The incremental number of the file for that worker
+                       thread or process.
+
+               To have dependent jobs share a set of files, this option can
+               be set to have fio generate filenames that are shared between
+               the two. For instance, if testfiles.$filenum is specified,
+               file number 4 for any job will be named testfiles.4. The
+               default of $jobname.$jobnum.$filenum will be used if
+               no other format specifier is given.
+
  opendir=str    Tell fio to recursively add any file it can find in this
                 directory and down the file system tree.
  
@@ -301,11 +328,6 @@ lockfile=str       Fio defaults to not locking any files before it does
                                         same time, but writes get exclusive
                                         access.
  
-               The option may be post-fixed with a lock batch number. If
-               set, then each thread/process may do that amount of IOs to
-               the file before giving up the lock. Since lock acquisition is
-               expensive, batching the lock/unlocks will speed up IO.
-
  readwrite=str
  rw=str         Type of io pattern. Accepted values are:
  
@@ -409,7 +431,7 @@ filesize=int        Individual file sizes. May be a range, in which case fio
  fill_device=bool
  fill_fs=bool   Sets size to something really large and waits for ENOSPC (no
                 space left on device) as the terminating condition. Only makes
-                sense with sequential write. For a read workload, the mount
+               sense with sequential write. For a read workload, the mount
                 point will be filled first then IO started on the result. This
                 option doesn't make sense if operating on a raw device node,
                 since the size of that is already known by the file system.
@@ -421,9 +443,11 @@ bs=int             The block size used for the io units. Defaults to 4k. Values
                 can be given for both read and writes. If a single int is
                 given, it will apply to both. If a second int is specified
                 after a comma, it will apply to writes only. In other words,
-               the format is either bs=read_and_write or bs=read,write.
-               bs=4k,8k will thus use 4k blocks for reads, and 8k blocks
-               for writes. If you only wish to set the write size, you
+               the format is either bs=read_and_write or bs=read,write,trim.
+               bs=4k,8k will thus use 4k blocks for reads, 8k blocks for
+               writes, and 8k for trims. You can terminate the list with
+               a trailing comma. bs=4k,8k, would use the default value for
+               trims.. If you only wish to set the write size, you
                 can do so by passing an empty read size - bs=,8k will set
                 8k for writes and leave the read default value.
  
@@ -546,6 +570,8 @@ ioengine=str        Defines how the job issues io to the file. The following
  
                         vsync   Basic readv(2) or writev(2) IO.
  
+                       psyncv  Basic preadv(2) or pwritev(2) IO.
+
                         libaio  Linux native asynchronous io. Note that Linux
                                 may only support queued behaviour with
                                 non-buffered IO (set direct=1 or buffered=0).
@@ -744,6 +770,15 @@ random_distribution=str:float      By default, fio will use a completely uniform
                 random_distribution=zipf:1.2 as the option. If a non-uniform
                 model is used, fio will disable use of the random map.
  
+percentage_random=int  For a random workload, set how big a percentage should
+               be random. This defaults to 100%, in which case the workload
+               is fully random. It can be set from anywhere from 0 to 100.
+               Setting it to 0 would make the workload fully sequential. Any
+               setting in between will result in a random mix of sequential
+               and random IO, at the given percentages. It is possible to
+               set different values for reads, writes, and trim. To do so,
+               simply use a comma separated list. See blocksize.
+       
  norandommap    Normally fio will cover every block of the file when doing
                 random IO. If this option is given, fio will just get a
                 new random offset without looking at past io history. This
@@ -775,7 +810,7 @@ random_generator=str        Fio supports the following engines for generating
                 block sizes, not with workloads that use multiple block
                 sizes. If used with such a workload, fio may read or write
                 some blocks multiple times.
-               
+
  nice=int       Run the job with the given nice value. See man nice(2).
  
  prio=int       Set the io priority value of this job. Linux limits us to
@@ -795,11 +830,15 @@ thinktime_spin=int
                 to sleeping for the rest of the period specified by
                 thinktime.
  
-thinktime_blocks
+thinktime_blocks=int
                 Only valid if thinktime is set - control how many blocks
                 to issue, before waiting 'thinktime' usecs. If not set,
                 defaults to 1 which will make fio wait 'thinktime' usecs
-               after every block.
+               after every block. This effectively makes any queue depth
+               setting redundant, since no more than 1 IO will be queued
+               before we have to complete it and do our thinktime. In
+               other words, this setting effectively caps the queue depth
+               if the latter is larger.
  
  rate=int       Cap the bandwidth used by this job. The number is in bytes/sec,
                 the normal suffix rules apply. You can use rate=500k to limit
@@ -1197,7 +1236,7 @@ write_lat_log=str Same as write_bw_log, except that this option stores io
  
                 write_lat_log=foo
  
-               The actual log names will be foo_slat.log, foo_slat.log,
+               The actual log names will be foo_slat.log, foo_clat.log,
                 and foo_lat.log. This helps fio_generate_plot fine the logs
                 automatically.
  
@@ -1219,12 +1258,15 @@ log_avg_msec=int By default, fio will log an entry in the iops, latency,
  lockmem=int    Pin down the specified amount of memory with mlock(2). Can
                 potentially be used instead of removing memory or booting
                 with less memory to simulate a smaller amount of memory.
+               The amount specified is per worker.
  
  exec_prerun=str        Before running this job, issue the command specified
-               through system(3).
+               through system(3). Output is redirected in a file called
+               jobname.prerun.txt.
  
  exec_postrun=str After the job completes, issue the command specified
-                though system(3).
+                though system(3). Output is redirected in a file called
+                jobname.postrun.txt.
  
  ioscheduler=str        Attempt to switch the device hosting the file to the specified
                 io scheduler before running.
@@ -1396,11 +1438,23 @@ that defines them is selected.
  [netsplice] hostname=str
  [net] hostname=str The host name or IP address to use for TCP or UDP based IO.
                 If the job is a TCP listener or UDP reader, the hostname is not
-               used and must be omitted.
+               used and must be omitted unless it is a valid UDP multicast
+               address.
  
  [netsplice] port=int
  [net] port=int The TCP or UDP port to bind to or connect to.
  
+[netsplice] interface=str
+[net] interface=str  The IP address of the network interface used to send or
+               receive UDP multicast
+
+[netsplice] ttl=int
+[net] ttl=int  Time-to-live value for outgoing UDP multicast packets.
+               Default: 1
+
+[netsplice] nodelay=bool
+[net] nodelay=bool     Set TCP_NODELAY on TCP connections.
+
  [netsplice] protocol=str
  [netsplice] proto=str
  [net] protocol=str
@@ -1418,7 +1472,7 @@ that defines them is selected.
  [net] listen   For TCP network connections, tell fio to listen for incoming
                 connections rather than initiating an outgoing connection. The
                 hostname must be omitted if this option is used.
-[net] pingpong Normal a network writer will just continue writing data, and
+[net] pingpong Normaly a network writer will just continue writing data, and
                 a network reader will just consume packages. If pingpong=1
                 is set, a writer will send its normal payload to the reader,
                 then wait for the reader to send the same payload back. This
@@ -1426,6 +1480,9 @@ that defines them is selected.
                 and completion latencies then measure local time spent
                 sending or receiving, and the completion latency measures
                 how long it took for the other end to receive and send back.
+               For UDP multicast traffic pingpong=1 should only be set for a
+               single reader when multiple readers are listening to the same
+               address.
  
  [e4defrag] donorname=str
                 File will be used as a block donor(swap extents between files)
@@ -1574,6 +1631,9 @@ util=             The disk utilization. A value of 100% means we kept the disk
  
  It is also possible to get fio to dump the current output while it is
  running, without terminating the job. To do that, send fio the USR1 signal.
+You can also get regularly timed dumps by using the --status-interval
+parameter, or by creating a file in /tmp named fio-dump-status. If fio
+sees this file, it will unlink it and dump the current output status.
  
  
  7.0 Terse output
@@ -1695,7 +1755,7 @@ trim       trim the given file from the given 'offset' for 'length' bytes
  
  
  9.0 CPU idleness profiling
-
+--------------------------
  In some cases, we want to understand CPU overhead in a test. For example,
  we test patches for the specific goodness of whether they reduce CPU usage.
  fio implements a balloon approach to create a thread per CPU that runs at