We have seen this behavior, but it appears to be entirely related to the hardware:
the "Intel IPMI" stuff causes NFS traffic on port 623 to be swallowed up directly by
the network hardware, so it never gets passed up to the host.

http://blogs.sun.com/shepler/entry/port_623_or_the_mount

Unfortunately, this NFS hang occurs across 3 separate machines, none of
which should have this IPMI issue.  It did spur me on to dig a little
deeper, though, so thanks for the encouragement that all may not be
well.

Can anyone debug this?  Remember that this is Nexenta Alpha 7, so it
should be b61.  nfsd is totally hung (rpc timeouts) and zfs would be
having problems taking snapshots, if I hadn't disabled the hourly
snapshots.

Thanks!
Thomas

[EMAIL PROTECTED] ~]$ rpcinfo -t filer0 nfs
rpcinfo: RPC: Timed out
program 100003 version 0 is not available

echo "::pgrep nfsd | ::walk thread | ::findstack -v" | mdb -k

stack pointer for thread 821cda00: 822d6e28
 822d6e5c swtch+0x17d()
 822d6e8c cv_wait_sig_swap_core+0x13f(8b8a9232, 8b8a9200, 0)
 822d6ea4 cv_wait_sig_swap+0x13(8b8a9232, 8b8a9200)
 822d6ee0 cv_waituntil_sig+0x100(8b8a9232, 8b8a9200, 0)
 822d6f44 poll_common+0x3e1(8069480, a, 0, 0)
 822d6f84 pollsys+0x7c()
 822d6fac sys_sysenter+0x102()
stack pointer for thread 821d2e00: 8c279d98
 8c279dcc swtch+0x17d()
 8c279df4 cv_wait_sig+0x123(8988796e, 89887970)
 8c279e2c svc_wait+0xaa(1)
 8c279f84 nfssys+0x423()
 8c279fac sys_sysenter+0x102()
stack pointer for thread a9f88800: 8c92e218
 8c92e244 swtch+0x17d()
 8c92e254 cv_wait+0x4e(8a4169ea, 8a4169e0)
 8c92e278 mv_wait_for_dma+0x32()
 8c92e2a4 mv_start+0x278(88252c78, 89833498)
 8c92e2d4 sata_hba_start+0x79(8987d23c, 8c92e304)
 8c92e308 sata_txlt_synchronize_cache+0xb7(8987d23c)
 8c92e334 sata_scsi_start+0x1b7(8987d1e4, 8987d1e0)
 8c92e368 scsi_transport+0x52(8987d1e0)
 8c92e3a4 sd_start_cmds+0x28a(8a2710c0, 0)
 8c92e3c0 sd_core_iostart+0x158(18, 8a2710c0, 8da3be70)
 8c92e3f8 sd_uscsi_strategy+0xe8(8da3be70)
 8c92e414 sd_send_scsi_SYNCHRONIZE_CACHE+0xd4(8a2710c0, 8c50074c)
 8c92e4b0 sdioctl+0x48e(1ac0080, 422, 8c50074c, 80100000, 883cee68, 0)
 8c92e4dc cdev_ioctl+0x2e(1ac0080, 422, 8c50074c, 80100000, 883cee68, 0)
 8c92e504 ldi_ioctl+0xa4(8a671700, 422, 8c50074c, 80100000, 883cee68, 0)
 8c92e544 vdev_disk_io_start+0x187(8c500580)
 8c92e554 vdev_io_start+0x18(8c500580)
 8c92e580 zio_vdev_io_start+0x142(8c500580)
 8c92e59c zio_next_stage+0xaa(8c500580)
 8c92e5b0 zio_ready+0x136(8c500580)
 8c92e5cc zio_next_stage+0xaa(8c500580)
 8c92e5ec zio_wait_for_children+0x46(8c500580, 1, 8c50076c)
 8c92e600 zio_wait_children_ready+0x18(8c500580)
 8c92e614 zio_next_stage_async+0xac(8c500580)
 8c92e624 zio_nowait+0xe(8c500580)
 8c92e660 zio_ioctl+0x94(9c6f8300, 89557c80, 89556400, 422, 0, 0)
 8c92e694 zil_flush_vdev+0x54(89557c80, 0, 0, 8c92e6e0, 9c6f8500)
 8c92e6e4 zil_flush_vdevs+0x6b(8bbe46c0)
 8c92e734 zil_commit_writer+0x35f(8bbe46c0, 3497c, 0, 4af5, 0)
 8c92e774 zil_commit+0x96(8bbe46c0, ffffffff, ffffffff, 4af5, 0)
 8c92e7e8 zfs_putpage+0x1e4(8c8ab480, 0, 0, 0, 0, 8c6c75c0)
 8c92e824 vhead_putpage+0x95(8c8ab480, 0, 0, 0, 0, 8c6c75c0)
 8c92e86c fop_putpage+0x27(8c8ab480, 0, 0, 0, 0, 8c6c75c0)
 8c92e91c rfs4_op_commit+0x153(82141dd4, b28c3100, 8c92ed8c, 8c92e948)
 8c92ea48 rfs4_compound+0x1ce(8c92ead0, 8c92ea7c, 0, 8c92ed8c, 0)
 8c92eaac rfs4_dispatch+0x65(8bf9b248, 8c92ed8c, b28c5a40, 8c92ead0)
 8c92ed10 common_dispatch+0x6b0(8c92ed8c, b28c5a40, 2, 4, 8bf9c01c, 8bf9b1f0)
 8c92ed34 rfs_dispatch+0x1f(8c92ed8c, b28c5a40)
 8c92edc4 svc_getreq+0x158(b28c5a40, 842952a0)
 8c92ee0c svc_run+0x146(898878e8)
 8c92ee2c svc_do_run+0x6e(1)
 8c92ef84 nfssys+0x3fb()
 8c92efac sys_sysenter+0x102()
<snipping out a bunch of other threads>
_______________________________________________
zfs-discuss mailing list
zfs-discuss@opensolaris.org
http://mail.opensolaris.org/mailman/listinfo/zfs-discuss

Reply via email to