So, I just tested with numjobs=4 and it actually went down, by a lot. (Do note that this is with the drives connected directly to the SATA ports on the motherboard, not the HBA.)
root@Network-Storage[~]# fio --name=seqwrite \
--rw=write \
--direct=0 \
--iodepth=32 \
--bs=1M \
--numjobs=4 \
--size=32G \
--runtime=30
seqwrite: (g=0): rw=write, bs=(R) 1024KiB-1024KiB, (W) 1024KiB-1024KiB, (T) 1024KiB-1024KiB, ioengine=psync, iodepth=32
...
fio-3.19
Starting 4 processes
seqwrite: Laying out IO file (1 file / 32768MiB)
seqwrite: Laying out IO file (1 file / 32768MiB)
seqwrite: Laying out IO file (1 file / 32768MiB)
seqwrite: Laying out IO file (1 file / 32768MiB)
Jobs: 4 (f=4): [W(4)][100.0%][w=407MiB/s][w=407 IOPS][eta 00m:00s]
seqwrite: (groupid=0, jobs=1): err= 0: pid=3587: Thu Nov 12 17:29:28 2020
write: IOPS=121, BW=121MiB/s (127MB/s)(3645MiB/30004msec)
clat (usec): min=111, max=411693, avg=8204.84, stdev=7181.83
lat (usec): min=123, max=411711, avg=8229.69, stdev=7181.83
clat percentiles (usec):
| 1.00th=[ 255], 5.00th=[ 996], 10.00th=[ 5669], 20.00th=[ 7767],
| 30.00th=[ 7832], 40.00th=[ 7898], 50.00th=[ 8979], 60.00th=[ 9372],
| 70.00th=[ 9503], 80.00th=[ 9503], 90.00th=[ 9503], 95.00th=[ 9634],
| 99.00th=[ 10028], 99.50th=[ 11338], 99.90th=[ 36439], 99.95th=[ 44303],
| 99.99th=[413139]
bw ( KiB/s): min=100151, max=312214, per=23.12%, avg=123778.90, stdev=36602.32, samples=59
iops : min= 97, max= 304, avg=120.34, stdev=35.74, samples=59
lat (usec) : 250=0.93%, 500=2.94%, 750=0.85%, 1000=0.33%
lat (msec) : 2=1.43%, 4=1.65%, 10=90.92%, 20=0.71%, 50=0.22%
lat (msec) : 500=0.03%
cpu : usr=0.31%, sys=2.39%, ctx=28533, majf=0, minf=0
IO depths : 1=100.0%, 2=0.0%, 4=0.0%, 8=0.0%, 16=0.0%, 32=0.0%, >=64=0.0%
submit : 0=0.0%, 4=100.0%, 8=0.0%, 16=0.0%, 32=0.0%, 64=0.0%, >=64=0.0%
complete : 0=0.0%, 4=100.0%, 8=0.0%, 16=0.0%, 32=0.0%, 64=0.0%, >=64=0.0%
issued rwts: total=0,3645,0,0 short=0,0,0,0 dropped=0,0,0,0
latency : target=0, window=0, percentile=100.00%, depth=32
seqwrite: (groupid=0, jobs=1): err= 0: pid=3588: Thu Nov 12 17:29:28 2020
write: IOPS=127, BW=127MiB/s (133MB/s)(3814MiB/30005msec)
clat (usec): min=114, max=387558, avg=7841.57, stdev=6887.42
lat (usec): min=125, max=387584, avg=7865.23, stdev=6888.03
clat percentiles (usec):
| 1.00th=[ 147], 5.00th=[ 363], 10.00th=[ 1106], 20.00th=[ 7635],
| 30.00th=[ 7832], 40.00th=[ 7898], 50.00th=[ 8356], 60.00th=[ 9372],
| 70.00th=[ 9503], 80.00th=[ 9503], 90.00th=[ 9503], 95.00th=[ 9634],
| 99.00th=[ 10028], 99.50th=[ 10814], 99.90th=[ 35914], 99.95th=[ 52167],
| 99.99th=[387974]
bw ( KiB/s): min=97912, max=624429, per=23.95%, avg=128241.80, stdev=70343.53, samples=59
iops : min= 95, max= 609, avg=124.69, stdev=68.68, samples=59
lat (usec) : 250=2.57%, 500=5.66%, 750=1.18%, 1000=0.45%
lat (msec) : 2=0.97%, 4=1.49%, 10=86.52%, 20=0.92%, 50=0.18%
lat (msec) : 100=0.03%, 500=0.03%
cpu : usr=0.32%, sys=2.58%, ctx=28317, majf=0, minf=0
IO depths : 1=100.0%, 2=0.0%, 4=0.0%, 8=0.0%, 16=0.0%, 32=0.0%, >=64=0.0%
submit : 0=0.0%, 4=100.0%, 8=0.0%, 16=0.0%, 32=0.0%, 64=0.0%, >=64=0.0%
complete : 0=0.0%, 4=100.0%, 8=0.0%, 16=0.0%, 32=0.0%, 64=0.0%, >=64=0.0%
issued rwts: total=0,3814,0,0 short=0,0,0,0 dropped=0,0,0,0
latency : target=0, window=0, percentile=100.00%, depth=32
seqwrite: (groupid=0, jobs=1): err= 0: pid=3589: Thu Nov 12 17:29:28 2020
write: IOPS=143, BW=144MiB/s (151MB/s)(4316MiB/30003msec)
clat (usec): min=90, max=264989, avg=6927.47, stdev=5438.61
lat (usec): min=99, max=265007, avg=6949.81, stdev=5440.84
clat percentiles (usec):
| 1.00th=[ 125], 5.00th=[ 225], 10.00th=[ 330], 20.00th=[ 775],
| 30.00th=[ 7701], 40.00th=[ 7832], 50.00th=[ 7898], 60.00th=[ 9241],
| 70.00th=[ 9503], 80.00th=[ 9503], 90.00th=[ 9503], 95.00th=[ 9634],
| 99.00th=[ 9896], 99.50th=[ 10421], 99.90th=[ 35914], 99.95th=[ 44827],
| 99.99th=[265290]
bw ( KiB/s): min=97912, max=1442982, per=26.52%, avg=141978.02, stdev=173961.74, samples=59
iops : min= 95, max= 1409, avg=138.12, stdev=169.94, samples=59
lat (usec) : 100=0.51%, 250=7.55%, 500=10.70%, 750=1.20%, 1000=0.28%
lat (msec) : 2=0.93%, 4=1.44%, 10=76.58%, 20=0.63%, 50=0.14%
lat (msec) : 100=0.02%, 500=0.02%
cpu : usr=0.33%, sys=3.04%, ctx=28394, majf=0, minf=0
IO depths : 1=100.0%, 2=0.0%, 4=0.0%, 8=0.0%, 16=0.0%, 32=0.0%, >=64=0.0%
submit : 0=0.0%, 4=100.0%, 8=0.0%, 16=0.0%, 32=0.0%, 64=0.0%, >=64=0.0%
complete : 0=0.0%, 4=100.0%, 8=0.0%, 16=0.0%, 32=0.0%, 64=0.0%, >=64=0.0%
issued rwts: total=0,4316,0,0 short=0,0,0,0 dropped=0,0,0,0
latency : target=0, window=0, percentile=100.00%, depth=32
seqwrite: (groupid=0, jobs=1): err= 0: pid=3590: Thu Nov 12 17:29:28 2020
write: IOPS=130, BW=130MiB/s (137MB/s)(3915MiB/30002msec)
clat (usec): min=95, max=392176, avg=7637.90, stdev=6969.66
lat (usec): min=106, max=392215, avg=7661.39, stdev=6970.70
clat percentiles (usec):
| 1.00th=[ 135], 5.00th=[ 322], 10.00th=[ 482], 20.00th=[ 7308],
| 30.00th=[ 7832], 40.00th=[ 7898], 50.00th=[ 8029], 60.00th=[ 9372],
| 70.00th=[ 9503], 80.00th=[ 9503], 90.00th=[ 9503], 95.00th=[ 9634],
| 99.00th=[ 10028], 99.50th=[ 10683], 99.90th=[ 36439], 99.95th=[ 51643],
| 99.99th=[392168]
bw ( KiB/s): min=97912, max=792669, per=24.46%, avg=130989.71, stdev=90972.39, samples=59
iops : min= 95, max= 774, avg=127.39, stdev=88.90, samples=59
lat (usec) : 100=0.05%, 250=3.04%, 500=7.20%, 750=1.48%, 1000=0.41%
lat (msec) : 2=1.12%, 4=1.48%, 10=84.29%, 20=0.69%, 50=0.18%
lat (msec) : 100=0.03%, 500=0.03%
cpu : usr=0.34%, sys=2.67%, ctx=28363, majf=0, minf=0
IO depths : 1=100.0%, 2=0.0%, 4=0.0%, 8=0.0%, 16=0.0%, 32=0.0%, >=64=0.0%
submit : 0=0.0%, 4=100.0%, 8=0.0%, 16=0.0%, 32=0.0%, 64=0.0%, >=64=0.0%
complete : 0=0.0%, 4=100.0%, 8=0.0%, 16=0.0%, 32=0.0%, 64=0.0%, >=64=0.0%
issued rwts: total=0,3915,0,0 short=0,0,0,0 dropped=0,0,0,0
latency : target=0, window=0, percentile=100.00%, depth=32
Run status group 0 (all jobs):
WRITE: bw=523MiB/s (548MB/s), 121MiB/s-144MiB/s (127MB/s-151MB/s), io=15.3GiB (16.5GB), run=30002-30005msec