FIO 磁盘IO性能测试-及测试报告解读

辣条①号 2022年 11月 5日性能测试 703 次浏览 0

【腾讯云】30M海外服务器99/年续费同价强烈推荐 https://cloud.tencent.com/act/cps/redirect?redirect=2446&cps_key=752564b15c36b5558a79fd5cbaf8e0bf&from=console

文章目录

操作系统具有的功能：预读 & 回写

FIO功能 + 引擎介绍

# 磁盘性能指标
    Latency(延迟):    # 一次I/O操作所消耗的时间
    Bandwidth(带宽):  # 单位时间内传输的数据量
    IOPS(TPS):        # 每秒完成的I/O操作次数

# FIO 支持的 测试功能如下
    1）支持十几种存储引擎，可以自定义
    2）自带做图工具，调用gnuplot做图
    3）支持几乎所有的存储描述参数
    4）大量对CPU，内存，进程/线程，文件，IO特性的配置
    5）压缩，trace回放，。。。这些都包含，灵活的配置

# FIO 支持的引擎介绍（rbd引擎 要求fio 版本大于 3.1）
    #支持19种不同的I/O引擎（可以使用 fio--enghelp 进行查看）
    sync（同步阻塞I/O，这是默认的），psync，vsync，pvsync，rbd，libaio（Linux的native异步I/O），posixaio，solarisaio，windowsaio，sg，syslet-rw等

# FIO 官方文档：https://fio.readthedocs.io/en/latest/fio_doc.html

# FIO 测试案例：https://github.com/get-set/fio-bench-disks-ceph

FIO安装与使用帮助说明

#首先安装fio磁盘性能专业测试工具
    yum install fio -y

#如何使用fio的在线帮助
    --help：     获得帮助信息。
    --cmdhelp：      获得命令的帮助文档。
    --enghelp：      获得引擎的帮助文档。
    --debug：        通过debug方式查看测试的详细信息。（process, file, io, mem, blktrace, verify, random, parse, diskutil, job, mutex, profile, time, net, rate）
    --output：       测试结果输出到文件。
    --output-format ：设置输出格式。（terse, json, normal）
    --crctest：      测试crc性能。（md5, crc64, crc32, crc32c, crc16, crc7, sha1, sha256, sha512, xxhash:）
    --cpuclock-test：CPU始终测试。

FIO工具选项及参数说明

# 本地磁盘，指定测试路径
    filename=/dev/sdb1  #对整个磁盘或分区测试，（会损坏数据的）
    directory=/root/ss  #对本地磁盘的某个目录进行测试（ filename | directory 二者选一）

# 其他参数
    direct=1        #测试过程绕过机器自带的buffer。使测试结果更真实。（布尔型）
    rw=read         #测试顺序读的I/O，可选参数（write 顺序写 |read 顺序读 |rw,readwrite 顺序混合读写 |randwrite 随机写 |randread 随机读 |randrw 随机混合读写）

    ioengine=libaio #定义使用哪种IO，此为libaio异步模式，（默认是sync）
    userspace_reap  #配合libaio，提高异步io的收割速度（只能配合libaio引擎使用）

    iodepth=16      #IO队列的深度，表示在这个文件上同一时刻运行16个I/O，默认为1。如果ioengine采用异步方式，该参数表示一批提交保持的io单元数。
    iodepth_batch=8 #当队列里面的IO数量达到8值的时候，就调用io_submit批次提交请求，然后开始调用io_getevents开始收割已经完成的IO
    iodepth_batch_complete=8    #每次收割多少呢？由于收割的时候，超时时间设置为0，所以有多少已完成就算多少，最多可以收割iodepth_batch_complete值个
    iodepth_low=8   #随着收割，IO队列里面的IO数就少了，那么需要补充新的IO，当IO数目降到iodepth_low值的时候，就重新填充，保证OS可以看到至少iodepth_low数目的io在电梯口排队着
    thread          #fio使用线程而不是进程
    bs=4k           #单次io的块文件大小为4k
    bsrange=512-2048    #同上，提定数据块的大小范围（单位：字节）
    size=5g         #本次的测试文件大小为5g，以每次4k的io进行测试（可以基于时间，也可以基于容量测试）
    runtime=120     #测试时间为120秒，如果不定义时间，则一直将5g文件分4k每次写完为止。。
    numjobs=4       #本次的测试线程为4
    group_reporting #关于显示结果的，汇总每个（线程/进程）的信息

    max-jobs=10     #最大允许的作业数线程数        
    rwmixwrite=30   #在混合读写的模式下，写占30%
    bssplit=4k/30:8k/40:16k/30  #随机读4k文件占30%、8k占40%、16k占30%
    rwmixread=70    #读占70% 
    name=ceshi      #指定job的名字，在命令行中表示新启动一个job
    invalidate=1        #开始io之前就失效buffer-cache（布尔型）
    randrepeat=0        #设置产生的随机数是不可重复的
    ioscheduler=psync   #将设备文件切换为这里指定的IO调度器（看场合使用）

    lockmem=1g      #只使用1g内存进行测试。
    zero_buffers    #用0初始化系统buffer。
    nrfiles=8       #每个进程生成文件的数量。

FIO 生成图片

# 先安装 fio 和 gnuplot
    yum install fio gnuplot

# 在执行的命令后面加入
    # writelog 是以job为单位进行记录，有几个jobs ,就会有相应的log生成
    -write_bw_log=rw        # 记录带宽
    -write_lat_log=rw       # 记录延迟（三种延迟：Completion Latency、I/O Latency、Submission Latency）
    -write_iops_log=rw      # 记录iops
    -iopsavgtime=1000       # 每隔1秒种记录一次iops
    -log_avg_msec=1000      # 每隔1秒种记录一次延迟
    -bwavgtime=1000         # 每隔1秒种记录一次带宽
    -write_bw_log=rw -write_lat_log=rw -write_iops_log=rw

# 将 生成的 日志文件重命名，不然抓取不到
    for i in clat lat slat bw iops; do mv rw_$i.1.log rw_$i.log; done

# 使用命令生成svg格式的图片
    fio_generate_plots rw

命令行模式-示例

FIO + libaio 引擎示例（注意：测试量级建议大于主机内存）

# 128K小文件顺序写(主要看带宽)
    fio -ioengine=libaio -direct=1 -iodepth=4 -thread=1 -randrepeat=0 -group_reporting -directory=/root/ss -bs=128k -size=4G -rw=write -name=128k-write
    fio -ioengine=libaio -direct=1 -iodepth=4 -thread=1 -randrepeat=0 -group_reporting -filename=/dev/rbd0 -bs=128k -size=4G -rw=write -name=128k-write

# 128K小文件顺序读(主要看带宽)
    fio -ioengine=libaio -direct=1 -iodepth=4 -thread=1 -randrepeat=0 -group_reporting -directory=/root/ss -bs=128k -size=4G -rw=read -name=128k-read

# 4K小文件随机写(主要看IOPS和延迟)
    fio -ioengine=libaio -direct=1 -iodepth=4 -thread=1 -randrepeat=0 -group_reporting -directory=/root/ss -bs=4k -size=4G -rw=randwrite -name=4k-randwrite

# 4K小文件随机读(主要看IOPS和延迟)
    fio -ioengine=libaio -direct=1 -iodepth=4 -thread=1 -randrepeat=0 -group_reporting -directory=/root/ss -bs=4k -size=4G -rw=randread -name=4k-randread

# 4K小文件顺序读写
    fio -ioengine=libaio -direct=1 -iodepth=4 -thread=1 -randrepeat=0 -group_reporting -directory=/root/ss -bs=4k -size=4G -rw=rw -name=4k-rw

# 4K小文件随机读写
    fio -ioengine=libaio -direct=1 -iodepth=4 -thread=1 -randrepeat=0 -group_reporting -directory=/root/ss -bs=4k -size=4G -rw=randrw -name=4k-randrw

FIO + rbd 引擎示例（测试rbd 块设备）

# 1、前提是，先正确安装好 ceph-common、fio 这两个软件，他们会附带安装相关依赖

# 2、并且要 配置好 ceph -s 能正常查看ceph集群信息（配置好这两个文件，没有就创建）
    /etc/ceph/ceph.conf
    /etc/ceph/ceph.client.admin.keyring

# 测试rbd 的 4k顺序写
    fio -ioengine=rbd -pool=volumes -rbdname=kvm001-system -rw=write -direct=1 -iodepth=4 -thread=1 -bs=4k -size=4G -name=4k-write

配置文件模式-示例

FIO + libaio 模式，以配置文件的形式进行IO测试

#执行时只需要直接运行 fio /root/conf-file 就行了

cat > /root/conf-file  << EOF
[global]
directory=/root/ss
ioengine=libaio
direct=1
thread=1
norandommap=1
invalidate=1
randrepeat=0
size=4g

[4k-write]
stonewall
group_reporting
bs=4k
rw=write
iodepth=4

[4k-read]
stonewall
group_reporting
bs=4k
rw=read
iodepth=4
EOF

FIO + rbd 模式，以配置文件的形式进行IO测试

# 注意、要先完成 ceph-common、ceph -s的环境准备

cat > /root/conf-file  << EOF
[global]
ioengine=rbd
clientname=admin
pool=volumes
rbdname=kvm001-system
invalidate=0    # mandatory
rw=randwrite
bs=4k
[rbd_iodepth32]
iodepth=32
EOF

显示报告解释

[root@localhost ss]# fio -directory=/root/ss -direct=1 -iodepth=1 -thread -ioengine=libaio -randrepeat=0 -bs=4k -size=4G -group_reporting -rw=read -name=4k-write
4k-write: (g=0): rw=read, bs=4K-4K/4K-4K/4K-4K, ioengine=libaio, iodepth=1
fio-2.2.8
Starting 1 thread
Jobs: 1 (f=1): [R(1)] [100.0% done] [62856KB/0KB/0KB /s] [15.8K/0/0 iops] [eta 00m:00s]
4k-write: (groupid=0, jobs=1): err= 0: pid=6889: Wed Aug  2 14:27:56 2017
#io方式，io：总的IO量, bw：带宽KB/s, iops：每秒钟的IO数, runt：总运行时间, lat (msec)：延迟(毫秒), msec毫秒, usec 微秒
  read : io=4096.0MB, bw=62504KB/s, iops=15625, runt= 67105msec

#提交延迟（submission latency）：表示需要多久将IO提交给linux的kernel做处理
    slat (usec): min=3, max=152, avg= 3.92, stdev= 1.19

#完成延迟（completion latency）：表示提交给kernel后到IO做完之间的时间，不包括submission latency，这是评估延迟性能最好指标

    clat (usec): min=19, max=39381, avg=59.45, stdev=71.22
     lat (usec): min=35, max=39384, avg=63.46, stdev=71.23

#完成延迟百分数
    clat percentiles (usec):
     |  1.00th=[   46],  5.00th=[   48], 10.00th=[   49], 20.00th=[   50],
     | 30.00th=[   50], 40.00th=[   51], 50.00th=[   57], 60.00th=[   58],
     | 70.00th=[   59], 80.00th=[   62], 90.00th=[   66], 95.00th=[   68],
     | 99.00th=[  133], 99.50th=[  434], 99.90th=[  462], 99.95th=[  466],
     | 99.99th=[  588]

#带宽，其中per不太清除
    bw (KB  /s): min=46200, max=63704, per=100.00%, avg=62509.19, stdev=2276.96

#下面三行，这是一组组数据，表示延迟，只是单位不同
    lat (usec) : 20=0.01%, 50=17.88%, 100=80.80%, 250=0.64%, 500=0.67%
        表示80.80%的request延迟小于100微秒，延迟小于50微秒的请求request占17.88%（下面也一样）
    lat (usec) : 750=0.01%, 1000=0.01%
    lat (msec) : 2=0.01%, 4=0.01%, 10=0.01%, 20=0.01%, 50=0.01%

#用户/系统CPU占用率，进程上下文切换(context switch)次数，主要和次要(major and minor)页面错误数量(page faults)。（若使用直接IO，page faults数量应该极少）
  cpu          : usr=2.03%, sys=6.82%, ctx=1048671, majf=0, minf=9

#Fio有一个iodepth设置，用来控制同一时刻发送给OS多少个IO。这完全是纯应用层面的行为，和盘的IO queue不是一回事。这里iodepth设成1，所以IO depth在全部时间都是1
  IO depths    : 1=100.0%, 2=0.0%, 4=0.0%, 8=0.0%, 16=0.0%, 32=0.0%, >=64=0.0%

#submit和complete代表同一时间段内fio发送上去和已完成的IO数量。对于产生这个输出的垃圾回收测试用例来说，iodepth是默认值1，所以100%的IO在同一时刻发送1次，放在1-4栏位里。通常来说，只有iodepth大于1才需要关注这一部分数据
     submit    : 0=0.0%, 4=100.0%, 8=0.0%, 16=0.0%, 32=0.0%, 64=0.0%, >=64=0.0%
     complete  : 0=0.0%, 4=100.0%, 8=0.0%, 16=0.0%, 32=0.0%, 64=0.0%, >=64=0.0%
     issued    : total=r=1048576/w=0/d=0, short=r=0/w=0/d=0, drop=r=0/w=0/d=0
     latency   : target=0, window=0, percentile=100.00%, depth=1

Run status group 0 (all jobs):
   READ: io=4096.0MB, aggrb=62503KB/s, minb=62503KB/s, maxb=62503KB/s, mint=67105msec, maxt=67105msec

Disk stats (read/write):
    dm-0: ios=1046013/25, merge=0/0, ticks=58687/1975, in_queue=60662, util=87.64%, aggrios=1048576/22, aggrmerge=0/5, aggrticks=58294/1532, aggrin_queue=59651, aggrutil=86.56%
  sda: ios=1048576/22, merge=0/5, ticks=58294/1532, in_queue=59651, util=86.56%

声明：本文为原创，作者为辣条①号，转载时请保留本声明及附带文章链接：https://boke.wsfnk.com/archives/126.html

赏

谢谢你请我吃辣条

如果文章对你有帮助，欢迎点击上方按钮打赏作者

FIO 磁盘IO性能测试-及测试报告解读

操作系统具有的功能：预读 & 回写

FIO功能 + 引擎介绍

FIO安装与使用帮助说明

FIO工具选项及参数说明

FIO 生成图片

命令行模式-示例

FIO + libaio 引擎示例（注意：测试量级建议大于主机内存）

FIO + rbd 引擎示例（测试rbd 块设备）

配置文件模式-示例

FIO + libaio 模式，以配置文件的形式进行IO测试

FIO + rbd 模式，以配置文件的形式进行IO测试

显示报告解释

最后编辑于：2023/7/6作者：辣条①号

暂无评论

发表回复取消回复

操作系统具有的功能：预读 & 回写

FIO功能 + 引擎介绍

FIO安装与使用帮助说明

FIO工具选项及参数说明

FIO 生成图片

命令行模式-示例

FIO + libaio 引擎 示例（注意：测试量级建议大于主机内存）

FIO + rbd 引擎 示例（测试rbd 块设备）

配置文件模式-示例

FIO + libaio 模式，以配置文件的形式进行IO测试

FIO + rbd 模式，以配置文件的形式进行IO测试

显示报告解释

最后编辑于：2023/7/6作者： 辣条①号

暂无评论

发表回复 取消回复

FIO + libaio 引擎示例（注意：测试量级建议大于主机内存）

FIO + rbd 引擎示例（测试rbd 块设备）

最后编辑于：2023/7/6作者：辣条①号

发表回复取消回复