[illumos-Developer] Important - time sensitive: Drive failures and infinite waits

Alasdair Lumsden alasdairrr at gmail.com
Thu May 26 08:14:40 PDT 2011


Hi Richard,

This box is running the latest oi_148 (actually, it's running a slightly newer, unreleased oi_148 build which has additional Illumos backports). The gate it was built from is:

http://hg.openindiana.org/mq_onnv-gate/file/3e2c4091ddeb

What makes you think the timeout values haven't stuck? mdb is showing the values did propagate to the per-disk sd state:

root ~ (san01.ixlon1): /usr/bin/uname -a
SunOS san01.ixlon1.everycity.co.uk 5.11 oi_148 i86pc i386 i86pc
root ~ (san01.ixlon1): fmdump -eV
TIME                           CLASS
fmdump: warning: /var/fm/fmd/errlog is empty
root ~ (san01.ixlon1): echo "sd_io_time::print" | mdb -k
0x7
root ~ (san01.ixlon1): echo "::walk sd_state | ::grep '.!=0' | ::sd_state" | mdb -k | egrep "^un|un_retry_count|un_cmd_timeout"
un: ffffff090f43c640

    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff09184a5940
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff09184a5300
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff09184a4cc0
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff09184a4680
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff09184a4040
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff0918a81980
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff0918a81340
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff090f43c000
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff0918bd3980
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff0918bd3340
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff0918bd2d00
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff0918bd26c0
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff0918bd2080
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff09169c8000
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff090dfa26c0
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff0918bd9940
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff0918bb6640
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff0918bd9300
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff0918bd8cc0
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff090edde9c0
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff090eddd700
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff0918bd8680
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff0918bd8040
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff0918bcad40
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff0918bcb380
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff090eddd0c0
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff090f43d2c0
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff0918bf0c80
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff090f43cc80
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff0918a806c0
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff0918a80d00
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff0918bc79c0
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff0918bc7380
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff0918bc6d40
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff0918bc6700
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff0918bc60c0
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff0918bb7900
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff0918bb72c0
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff0918bb6c80
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff0918bcb9c0
    un_retry_count = 0x5
    un_cmd_timeout = 0x7
un: ffffff0918bca700
    un_retry_count = 0x5
    un_cmd_timeout = 0x7
un: ffffff0918a80080
    un_retry_count = 0x5
    un_cmd_timeout = 0x7
un: ffffff090edddd40
    un_retry_count = 0x5
    un_cmd_timeout = 0x7
un: ffffff0918bf12c0
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff090dfa2d00
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff090dfa2080
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff0918bb6000
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff0918bca0c0
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff0918bf0640
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff0918bf1900
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
un: ffffff0918bf0000
    un_retry_count = 0x3
    un_cmd_timeout = 0x7
root ~ (san01.ixlon1): 
root ~ (san01.ixlon1): 

But I might have misunderstood.

Cheers,

Alasdair


More information about the Developer mailing list