Re: kernel panics involving NFS+RPCSEC_GSS

2011-08-18 Thread Clinton Adams
On Thu, Aug 18, 2011 at 3:25 PM, Clinton Adams clinton.ad...@gmail.com wrote:
 Hello,

 Kernel panics if clients hit the nfs server sufficiently hard -
 happens repeatedly with 13 clients logging in at the same approximate
 time, using nfsv4 mounted homes.

 server is running freebsd 8.2-RELEASE-p2. clients are linux 2.6.38-10

 Running a memtest on the server now to rule out bad mem. The server
 has been used for samba, and it's only with the attempted switch to
 nfs that this problem has appeared.


Err, wrong paste from another forum. Here's the trace from my server:

Fatal trap 12: page fault while in kernel mode
Fatal trap 12: page fault while in kernel mode
cpuid = 0;
cpuid = 2; apic id = 00apic id = 06
fault virtual address   = 0x0
fault virtual address   = 0x8
fault code  = supervisor write data, page not present
fault code  = supervisor read data, page not present
instruction pointer = 0x20:0x807db856
instruction pointer = 0x20:0x807dc0d7
stack pointer   = 0x28:0xff8096c0d840
stack pointer   = 0x28:0xff8096c17860
frame pointer   = 0x28:0xff8096c0d860
frame pointer   = 0x28:0xff8096c17a80
code segment= base 0x0, limit 0xf, type 0x1b
code segment= base 0x0, limit 0xf, type 0x1b
= DPL 0, pres 1, long 1, def32 0, gran 1
= DPL 0, pres 1, long 1, def32 0, gran 1
processor eflags=
processor eflags= interrupt enabled, interrupt enabled,
resume, resume, IOPL = 0IOPL = 0
current process =
current process = 765 (nfsd: service)765 (nfsd: service)
trap number = 12
trap number = 12
panic: page fault

cpuid = 1
Uptime: 3h22m48s
Physical memory: 2032 MB
Dumping 406 MB: 391 375 359 343 327 311 295 279 263 247 231 215
199 183 167 151 135 119 103 87 71 55 39 23 7

Reading symbols from /boot/kernel/linux.ko...done.
Loaded symbols for /boot/kernel/linux.ko
Reading symbols from /boot/kernel/nfscommon.ko...done.
Loaded symbols for /boot/kernel/nfscommon.ko
Reading symbols from /boot/kernel/nfsd.ko...done.
Loaded symbols for /boot/kernel/nfsd.ko
Reading symbols from /boot/kernel/snp.ko...done.
Loaded symbols for /boot/kernel/snp.ko
#0  doadump () at pcpu.h:224
224 __asm("movq %%gs:0,%0" : "=r" (td));
(kgdb) list *0x807db856
0x807db856 is in svc_rpc_gss_forget_client
(/usr/src/sys/rpc/rpcsec_gss/svc_rpcsec_gss.c:622).
617 struct svc_rpc_gss_client_list *list;
618
619 list = &svc_rpc_gss_client_hash[client->cl_id.ci_id % CLIENT_HASH_SIZE];
620 sx_xlock(&svc_rpc_gss_lock);
621 TAILQ_REMOVE(list, client, cl_link);
622 TAILQ_REMOVE(&svc_rpc_gss_clients, client, cl_alllink);
623 svc_rpc_gss_client_count--;
624 sx_xunlock(&svc_rpc_gss_lock);
625 svc_rpc_gss_release_client(client);
626 }
(kgdb) backtrace
#0  doadump () at pcpu.h:224
#1  0x805cbabe in boot (howto=260) at
/usr/src/sys/kern/kern_shutdown.c:419
#2  0x805cbed3 in panic (fmt=0x0) at
/usr/src/sys/kern/kern_shutdown.c:592
#3  0x808d239d in trap_fatal (frame=0xff0004c89460,
eva=Variable eva is not available.
) at /usr/src/sys/amd64/amd64/trap.c:783
#4  0x808d275f in trap_pfault (frame=0xff8096c0d790,
usermode=0) at /usr/src/sys/amd64/amd64/trap.c:699
#5  0x808d2b5f in trap (frame=0xff8096c0d790) at
/usr/src/sys/amd64/amd64/trap.c:449
#6  0x808bada4 in calltrap () at
/usr/src/sys/amd64/amd64/exception.S:224
#7  0x807db856 in svc_rpc_gss_forget_client
(client=0xff001c015200) at atomic.h:158
#8  0x807dc0e3 in svc_rpc_gss (rqst=0xff0004a24000,
msg=0xff8096c0db20) at
/usr/src/sys/rpc/rpcsec_gss/svc_rpcsec_gss.c:642
#9  0x807d48f3 in svc_run_internal
(pool=0xff0004ca6200, ismaster=0) at /usr/src/sys/rpc/svc.c:837
#10 0x807d50ab in svc_thread_start (arg=Variable arg is
not available.
) at /usr/src/sys/rpc/svc.c:1200
#11 0x805a26f8 in fork_exit (callout=0x807d50a0
<svc_thread_start>, arg=0xff0004ca6200, frame=0xff8096c0dc40)
at /usr/src/sys/kern/kern_fork.c:845
#12 0x808bb26e in fork_trampoline () at
/usr/src/sys/amd64/amd64/exception.S:565
#13 0x0080 in ?? ()
#14 0x7fffe6e0 in ?? ()
#15 0x002e in ?? ()
#16 0x in ?? ()
#17 0xfef4 in ?? ()
#18 0x in ?? ()
#19 0x009b in ?? ()
#20 0x7fffe6e0 in ?? ()
#21 0x0008 in ?? ()
#22 0x0003 in ?? ()
#23 0x in ?? ()

kernel panics involving NFS+RPCSEC_GSS

2011-08-18 Thread Clinton Adams
Hello,

Kernel panics if clients hit the nfs server sufficiently hard -
happens repeatedly with 13 clients logging in at the same approximate
time, using nfsv4 mounted homes.

server is running freebsd 8.2-RELEASE-p2. clients are linux 2.6.38-10

Running a memtest on the server now to rule out bad mem. The server
has been used for samba, and it's only with the attempted switch to
nfs that this problem has appeared.

Fatal trap 12: page fault while in kernel mode
cpuid = 0; apic id = 00
fault virtual address   = 0xff80007bd260
fault code  = supervisor read data, page not present
instruction pointer = 0x20:0x80e20939
stack pointer   = 0x28:0xff80732baaa0
frame pointer   = 0x28:0xff80732bab80
code segment            = base 0x0, limit 0xfffff, type 0x1b
= DPL 0, pres 1, long 1, def32 0, gran 1
processor eflags= interrupt enabled, resume, IOPL = 0
current process = 0 (wpi0 taskq)
trap number = 12
panic: page fault
cpuid = 0
Uptime: 12m21s
Physical memory: 4002 MB
#0  doadump () at pcpu.h:223
223 __asm __volatile("movq %%gs:0,%0" : "=r" (td));
(kgdb) list *0x80e20939
0x80e20939 is in wpi_newstate
(/usr/src/sys/modules/wpi/../../dev/wpi/if_wpi.c:2453).
2448                    device_printf(sc->sc_dev, "could not configure\n");
2449                    return error;
2450            }
2451
2452            /* configuration has changed, set Tx power accordingly */
2453            if ((error = wpi_set_txpower(sc, ni->ni_chan, 1)) != 0) {
2454                    device_printf(sc->sc_dev, "could not set Tx power\n");
2455                    return error;
2456            }
2457
(kgdb) backtrace
#0  doadump () at pcpu.h:223
#1  0x8056f9c0 in boot (howto=260) at
/usr/src/sys/kern/kern_shutdown.c:416
#2  0x8056fe2d in panic (fmt=0x80917ba4 "%s") at
/usr/src/sys/kern/kern_shutdown.c:579
#3  0x80842c20 in trap_fatal (frame=0xff0002a80740,
eva=Variable eva is not available.
)
at /usr/src/sys/amd64/amd64/trap.c:857
#4  0x80842fcc in trap_pfault (frame=0xff80732ba9f0, usermode=0)
at /usr/src/sys/amd64/amd64/trap.c:773
#5  0x80843618 in trap (frame=0xff80732ba9f0) at
/usr/src/sys/amd64/amd64/trap.c:499
#6  0x8082a6d3 in calltrap () at
/usr/src/sys/amd64/amd64/exception.S:224
#7  0x80e20939 in wpi_newstate (vap=0xff0005aca000,
nstate=IEEE80211_S_AUTH, arg=192)
at /usr/src/sys/modules/wpi/../../dev/wpi/if_wpi.c:2482
#8  0x806517dc in ieee80211_newstate_cb (xvap=Variable
xvap is not available.
)
at /usr/src/sys/net80211/ieee80211_proto.c:1654
#9  0x805a9ded in taskqueue_run (queue=0xff000314cd00)
at /usr/src/sys/kern/subr_taskqueue.c:239
#10 0x805aa052 in taskqueue_thread_loop (arg=Variable
arg is not available.
) at /usr/src/sys/kern/subr_taskqueue.c:360
#11 0x80548e4d in fork_exit (callout=0x805aa00c
<taskqueue_thread_loop>,
arg=0xff80003ab0b8, frame=0xff80732bac80) at
/usr/src/sys/kern/kern_fork.c:843
#12 0x8082abae in fork_trampoline () at
/usr/src/sys/amd64/amd64/exception.S:561
#13 0x in ?? ()
#14 0x in ?? ()
#15 0x in ?? ()
#16 0x in ?? ()
#17 0x in ?? ()
#18 0x in ?? ()
#19 0x in ?? ()
#20 0x in ?? ()
#21 0x in ?? ()
#22 0x in ?? ()
#23 0x in ?? ()
#24 0x in ?? ()
#25 0x in ?? ()
#26 0x in ?? ()
#27 0x in ?? ()
#28 0x in ?? ()
#29 0x in ?? ()
#30 0x in ?? ()
#31 0x in ?? ()
#32 0x in ?? ()
#33 0x in ?? ()
#34 0x in ?? ()
#35 0x in ?? ()
#36 0x in ?? ()
#37 0x01c71000 in ?? ()
#38 0x in ?? ()
#39 0x in ?? ()
#40 0xff000239ee40 in ?? ()
#41 0xff0003901000 in ?? ()
#42 0xff80732ba140 in ?? ()
#43 0xff80732ba0f8 in ?? ()
#44 0xff0002a80740 in ?? ()
#45 0x80592283 in sched_switch (td=0xff80003ab0b8,
newtd=0x805aa00c, flags=Variable flags is not available.
)
at /usr/src/sys/kern/sched_ule.c:1844
Previous frame inner to this frame (corrupt stack?)
___
freebsd-questions@freebsd.org mailing list
http://lists.freebsd.org/mailman/listinfo/freebsd-questions
To unsubscribe, send any mail to