On Sat, Sep 20, 2025 at 10:59:51PM +0200, Claudio Jeker wrote:
> The M10-1 hits this panic in roughly 24h of running make -j 32 build in a
> loop. First time it exploded inside the reaper for me. So maybe this is
> closer to the truth.
Another run, took a bit more than 24h this time.
This is from my top session, which was running when it panicked:
load averages: 20.59, 10.40, 6.74 m10.zyd.ch 08:39:30
135 processes: 6 starting, 4 running, 98 idle, 1 dead, 26 on up 1 days 11:39:33
32 CPUs: 19.0% user, 0.0% nice, 12.8% sys, 67.4% spin, 0.0% intr, 0.8% idle
Memory: Real: 504M/7786M act/tot Free: 116G Cache: 6008M Swap: 0K/88G
cpu13 crashed because cpuswitch corrupted the registers during mi_switch.
The CPUs after 17 did not stop (probably because the cpu mondo broke down).
Three make processes are running:
pid 83460 cpu 13 is toast but somewhere between fork and exec.
pid 27987 cpu 4 is in uvmspace_exec()
pid 2638 cpu 9 is spinning on the kernel lock for some syscall
No process in ps /o seems to hold the KERNEL_LOCK, which is a bit strange since
the parent make process is waiting for the lock.
--
:wq Claudio
ddb{13}> show panic
cpu2: uobjlk rwlock 0x4077ae3b6b0: enter write deadlock
*cpu13: mutex 0x0 not held in mi_switch
cpu18: Unable to broadcast mondo 1011cc4: 9
cpu20: kernel data fault: pc=1769a44 addr=1c78b7e000
cpu25: trap type 0x34 (mem address not aligned): pc=1063d70 npc=1063e0c pstate
=44820006<PRIV,IE>
cpu31: Unable to broadcast mondo 1011cc4: 9
ddb{13}> tr
sun4v_send_ipi(11, 1011ddc, 2710, 9, ffffffffffffffff, 0) at sun4v_send_ipi+0xa
c
db_enter_ddb(41b9fef8000, a, 1cbffc0, 1c80ac0, 1c189e0, 40000) at db_enter_ddb+
0x244
db_ktrap(101, 407659b1390, 1, 0, 407659b1610, 0) at db_ktrap+0x104
trap(407659b1390, 101, 1300ca4, 820006, 0, 1f) at trap+0x2d8
Lslowtrap_reenter(27, 41b9ff388ac, 17cf618, 407659b16d8, 1a06e90, 0) at Lslowtr
ap_reenter+0xf8
panic(17cf618, 0, 19f4810, 0, 100, 41b9ff388ac) at panic+0xcc
mi_switch(0, 0, 0, 0, 0, 0) at mi_switch+0x388
ddb{13}> ps /o
TID PID UID PRFLAGS PFLAGS CPU COMMAND
*203859 83460 21 0x100001 0 13 make
44218 27987 21 0x101005 0 4 make
490412 87307 21 0x3 0 5 cc
355576 75008 21 0x3 0 17 cc
355245 55821 21 0x3 0 20 cc
384888 87907 21 0x100003 0 18 cc
462853 25796 21 0x100003 0 6 ld
368951 38484 21 0x100003 0 11 cc1
419968 12491 21 0x100003 0 16 cc1
327300 77705 21 0x100003 0 3 cc1
422105 21158 21 0x100003 0 12 as
154033 17629 21 0x100003 0 7 cc1
26369 29404 21 0x100003 0 14 cc1
130757 4217 21 0x100003 0 10 cc1
257136 33437 21 0x100003 0 15 cc1
9396 70728 21 0x100003 0 1 cc1
313747 2638 21 0x10100003 0 9 make
510201 65806 115 0x100012 0 26 slaacd
171627 71222 115 0x100012 0 28 slaacd
39953 28730 0 0x14000 0x200 0 reaper
470293 89415 0 0x14000 0x200 23 softnet0
ddb{13}> ps
PID TID PPID UID S FLAGS WAIT COMMAND
*83460 203859 2638 21 7 0x100001 make
27987 44218 2638 21 7 0x101005 make
87307 490412 2638 21 7 0x3 cc
29978 253097 2638 21 3 0x3 uobjlk cc
15695 197186 2638 21 3 0x3 uobjlk cc
75008 355576 2638 21 7 0x3 cc
55821 355245 2638 21 7 0x3 cc
87907 384888 2638 21 7 0x100003 cc
333 427413 90561 21 3 0x100083 piperd as
9370 367604 90561 21 3 0x100003 inode cc1
24712 51419 76483 21 3 0x100083 piperd as
74182 171943 76483 21 3 0x100003 inode cc1
25796 462853 2638 21 7 0x100003 ld
55683 169684 59514 21 3 0x100083 piperd as
64090 413637 59514 21 3 0x100003 inode cc1
90561 492487 2638 21 3 0x100083 wait cc
8353 382079 23335 21 3 0x100083 piperd as
76483 302250 2638 21 3 0x100083 wait cc
59514 166217 2638 21 3 0x100083 wait cc
38484 368951 23335 21 7 0x100003 cc1
23335 96000 2638 21 3 0x100083 wait cc
81439 105417 34605 21 3 0x100083 piperd as
6895 247934 54518 21 3 0x100083 piperd as
62855 97939 34605 21 3 0x100003 inode cc1
12491 419968 54518 21 7 0x100003 cc1
54518 166956 2638 21 3 0x100083 wait cc
34605 28207 2638 21 3 0x100083 wait cc
62623 342208 18323 21 3 0x100083 piperd as
77705 327300 18323 21 7 0x100003 cc1
18323 438745 2638 21 3 0x100083 wait cc
91545 37025 30776 21 3 0x100083 piperd as
84584 30157 30776 21 3 0x100003 inode cc1
30776 488756 2638 21 3 0x100083 wait cc
21158 422105 83687 21 7 0x100003 as
83687 510796 2638 21 3 0x100083 wait cc
37707 192885 77861 21 3 0x100083 piperd as
17629 154033 77861 21 7 0x100003 cc1
77861 96407 2638 21 3 0x100083 wait cc
45088 8998 2765 21 3 0x100083 piperd as
29404 26369 2765 21 7 0x100003 cc1
64386 326829 5796 21 3 0x100083 piperd as
4217 130757 5796 21 7 0x100003 cc1
2765 464726 2638 21 3 0x100083 wait cc
5796 19327 2638 21 3 0x100083 wait cc
98228 386403 63771 21 3 0x100083 piperd as
33437 257136 63771 21 7 0x100003 cc1
63771 91825 2638 21 3 0x100083 wait cc
80973 297569 12821 21 3 0x100083 piperd as
70728 9396 12821 21 7 0x100003 cc1
12821 365734 2638 21 3 0x100083 wait cc
35145 126344 2638 21 3 0x100083 wait cc
2638 313747 82086 21 7 0x10100003 make
82086 387179 7908 21 3 0x10008b sigsusp sh
7908 464733 51747 21 3 0x10008b sigsusp make
51747 461444 16433 0 3 0x10008b sigsusp sh
16433 350032 12765 0 3 0x10008b sigsusp make
12765 92966 66947 0 3 0x10008b sigsusp make
66947 354988 41804 0 3 0x100083 wait time
41804 291802 59417 0 3 0x100083 wait time
71036 327746 70600 0 3 0x100083 piperd tee
59417 497258 70600 0 3 0x100089 sigsusp sh
70600 511505 55184 0 3 0x10008b sigsusp sh
36395 193047 98843 1000 3 0x100083 kqread tail
98843 480682 85946 1000 3 0x10008b sigsusp ksh
60405 234733 99431 1000 3 0x100083 kqread top
99431 129956 85946 1000 3 0x10008b sigsusp ksh
85844 240848 6294 1000 3 0x83 kqread systat
6294 467906 85946 1000 3 0x10008b sigsusp ksh
55184 295301 85946 1000 3 0x10008b sigsusp ksh
85946 193395 1 1000 3 0x100080 kqread tmux
33451 84859 86833 1000 3 0x100083 kqread tmux
86833 124813 36245 1000 3 0x10008b sigsusp ksh
36245 293646 16037 1000 3 0x98 kqread sshd-session
16037 223564 8899 0 3 0x82 kqread sshd-session
42375 2491 1 0 3 0x100083 ttyin ksh
39678 457854 1 0 3 0x100098 kqread cron
26985 107453 1 99 3 0x1100090 kqread sndiod
91672 198225 1 110 3 0x100090 kqread sndiod
65750 404389 79014 95 3 0x1100092 kqread smtpd
34479 369135 79014 103 3 0x1100092 kqread smtpd
26626 31062 79014 95 3 0x1100092 kqread smtpd
6996 108112 79014 95 3 0x100092 kqread smtpd
91984 216217 79014 95 3 0x1100092 kqread smtpd
60436 393440 79014 95 3 0x1100092 kqread smtpd
79014 442861 1 0 3 0x100080 kqread smtpd
8899 161590 1 0 3 0x88 kqread sshd
15440 287074 1 0 3 0x100080 kqread ntpd
39263 361534 9686 83 3 0x100092 kqread ntpd
9686 409798 1 83 3 0x1100092 kqread ntpd
39393 284534 5827 74 3 0x1100092 bpf pflogd
5827 209189 1 0 3 0x80 sbwait pflogd
14302 155928 38669 73 3 0x1100090 kqread syslogd
38669 407555 1 0 3 0x100082 sbwait syslogd
44494 220072 1 0 3 0x100080 kqread resolvd
21339 505439 60763 77 3 0x100092 kqread dhcpleased
74356 361194 60763 77 3 0x100092 kqread dhcpleased
60763 325943 1 0 3 0x80 kqread dhcpleased
65806 510201 75067 115 7 0x100012 slaacd
71222 171627 75067 115 7 0x100012 slaacd
75067 124777 1 0 3 0x100080 sysctllk slaacd
80151 453697 0 0 3 0x14200 bored smr
24408 170266 0 0 3 0x14200 pgzero zerothread
36407 427572 0 0 3 0x14200 aiodoned aiodoned
62565 55260 0 0 3 0x14200 syncer update
64116 201669 0 0 3 0x14200 cleaner cleaner
28730 39953 0 0 7 0x14200 reaper
33431 157164 0 0 3 0x14200 pgdaemon pagedaemon
46161 472629 0 0 3 0x14200 usbtsk usbtask
2992 126411 0 0 3 0x14200 usbatsk usbatsk
84640 423001 0 0 3 0x14200 bored sensors
54658 520770 0 0 3 0x40014200 idle31
19399 499906 0 0 7 0x40014200 idle30
20858 482044 0 0 7 0x40014200 idle29
79829 50353 0 0 3 0x40014200 idle28
1546 195916 0 0 7 0x40014200 idle27
61902 85967 0 0 3 0x40014200 idle26
89974 484980 0 0 3 0x40014200 idle25
2447 481193 0 0 7 0x40014200 idle24
28705 54131 0 0 3 0x40014200 idle23
14687 482436 0 0 7 0x40014200 idle22
80080 523569 0 0 7 0x40014200 idle21
73543 477047 0 0 3 0x40014200 idle20
90851 461175 0 0 7 0x40014200 idle19
67402 467610 0 0 3 0x40014200 idle18
92980 470105 0 0 3 0x40014200 idle17
25688 373 0 0 3 0x40014200 idle16
2140 359395 0 0 3 0x40014200 idle15
30307 298916 0 0 3 0x40014200 idle14
78276 222991 0 0 3 0x40014200 idle13
53698 232569 0 0 3 0x40014200 idle12
25040 169137 0 0 3 0x40014200 idle11
52331 91953 0 0 3 0x40014200 idle10
80801 298113 0 0 3 0x40014200 idle9
71270 356160 0 0 3 0x40014200 idle8
37142 63435 0 0 3 0x40014200 idle7
41282 158113 0 0 3 0x40014200 idle6
46031 294695 0 0 3 0x40014200 idle5
68521 268223 0 0 3 0x40014200 idle4
61895 101641 0 0 3 0x40014200 idle3
80865 338317 0 0 3 0x40014200 idle2
33775 6315 0 0 3 0x40014200 idle1
3052 79059 0 0 3 0x14200 bored softnet7
27723 260168 0 0 3 0x14200 bored softnet6
40405 54896 0 0 3 0x14200 bored softnet5
46409 135364 0 0 3 0x14200 bored softnet4
54015 335233 0 0 3 0x14200 bored softnet3
75531 132971 0 0 3 0x14200 bored softnet2
55071 464772 0 0 3 0x14200 bored softnet1
89415 470293 0 0 7 0x14200 softnet0
59654 170171 0 0 3 0x14200 bored systqmp
2035 521522 0 0 3 0x14200 bored systq
44922 452892 0 0 3 0x14200 tmoslp softclockmp
13424 132664 0 0 3 0x40014200 tmoslp softclock
92466 443387 0 0 3 0x40014200 idle0
15310 87170 0 0 3 0x14200 kmalloc kmthread
1 308242 0 0 3 0x82 wait init
0 0 -1 0 3 0x10200 scheduler swapper
ddb{13}> show uvm
Current UVM status:
pagesize=8192 (0x2000), pagemask=0x1fff, pageshift=13
16258622 VM pages: 33991 active, 41539 inactive, 1 wired, 15294921 free (1912
382 zero)
freemin=541954, free-target=722605, inactive-target=0, wired-max=5419540
faults=-543425818, traps=1357591386, intrs=972970408, ctxswitch=642541198 fpu
switch=3254093
softint=32992076, syscalls=-1651139276, kmapent=20
fault counts:
noram=0, noanon=0, noamap=0, pgwait=0, pgrele=0
relocks=6641422(72444), upgrades=0(0) anget(retries)=812094109(0), amapcopy
=304977889
neighbor anon/obj pg=151753437/735668315, gets(lock/unlock)=493797378/67142
16
cases: anon=730615483, anoncow=81478626, obj=454908346, prcopy=38816238, pr
zero=-1849244513
daemon and swap counts:
woke=0, revs=0, scans=0, obscans=0, anscans=0
busy=0, freed=0, reactivate=0, deactivate=0
pageouts=0, pending=0, nswget=0
nswapdev=1
swpages=11590896, swpginuse=0, swpgonly=0 paging=0
kernel pointers:
objs(kern)=0x1c72d40
ddb{13}> show pool
POOL panic: kernel data fault: pc=1369664 addr=300ffff83286000
Stopped at db_enter+0x8: nop
data_access_fault(407659b0340, 31, 1369664, 300ffff83286000, 300ffff83286000, 1
) at data_access_fault+0x2f0
sun4v_datatrap(300ffff8328700f, 300ffff83287010, 1, 0, 407659b06f0, 0) at sun4v
_datatrap+0x200
kprintf(5, 14, 0, 0, 0, 0) at kprintf+0xf94
db_printf(18322f8, 300ffff8328700f, 86290001, 81cfe008, 407659b0920, 0) at db_p
rintf+0x40
pool_print1(1300ca8, 407659b0800, 1263720, 407659b0800, 0, 1c866d8) at pool_pri
nt1+0x54
db_command(1c24a88, 0, 0, 0, 1300ca8, 407659b0958) at db_command+0x134
db_command_loop(91, 407659b1650, e, 5, 1263720, 1937900) at db_command_loop+0x1
0c
db_trap(1c26000, 0, 0, 0, 0, 1f) at db_trap+0x214
db_ktrap(101, 407659b0cc0, 1, 407659b16d8, 407659b0f38, 0) at db_ktrap+0x1b4
trap(407659b0cc0, 101, 1300ca4, 820006, 0, 0) at trap+0x2d8
Lslowtrap_reenter(1, 14, 0, 0, 0, 1) at Lslowtrap_reenter+0xf8
panic(18374e0, 1011ddc, 11, 9, 104, 41b9ff388ac) at panic+0xcc
sun4v_send_ipi(11, 1011ddc, 2710, 9, ffffffffffffffff, 0) at sun4v_send_ipi+0xa
c
db_enter_ddb(41b9fef8000, a, 1cbffc0, 1c80ac0, 1c189e0, 40000) at db_enter_ddb+
0x244
ddb{13}> x /i 0x1369664
strlen+0x4: ldsb [%o0 + %g0], %o2
ddb{13}> show panic
cpu2: uobjlk rwlock 0x4077ae3b6b0: enter write deadlock
*cpu13: mutex 0x0 not held in mi_switch
cpu18: Unable to broadcast mondo 1011cc4: 9
cpu20: kernel data fault: pc=1769a44 addr=1c78b7e000
cpu25: trap type 0x34 (mem address not aligned): pc=1063d70 npc=1063e0c pstate
=44820006<PRIV,IE>
cpu31: Unable to broadcast mondo 1011cc4: 9
ddb{13}> x /i 0x1769a44
mi_switch+0x164: ld [%g1 + 0xd80], %g2
ddb{13}> x /i 1063d70
sched_steal_proc+0xd0: ld [%l0 + 0x60], %g1
ddb{13}> show proc
PROC (make) tid=203859 pid=83460 tcnt=1 stat=onproc
flags process=100001<CONTROLT,PLEDGE> proc=0
runpri=86, usrpri=86, slppri=32, nice=20
wchan=0x0, wmesg=, ps_single=0x0 scnt=0 ecnt=0
forw=0xffffffffffffffff, list=0x4077ca59360,0x1c7e858
process=0x407714e8920 user=0x407659ae000, vmspace=0x40774792310
estcpu=36, cpticks=0, pctcpu=0.0, user=0, sys=0, intr=0
ddb{13}> mach ddbcpu 0
Stopped at __mp_lock+0x64: nop
sparc_intr_retry(1c19850, 0, 1813488, 40770b4c000, 1be, 1cd2f90) at sparc_intr_
retry+0x58
msleep_nsec(1c19860, 1c19850, 4, 1813488, 0, 6) at msleep_nsec+0x88
reaper(4008f8842f0, 4008f8842f0, 381, 100, 1c19860, 4000) at reaper+0xa0
proc_trampoline(0, 0, 0, 0, 0, 0) at proc_trampoline+0x10
ddb{0}> mach ddbcpu 1
Stopped at hv_cpu_mondo_send+0xc: nop
pmap_enter(40778204240, 294b78000, 7e16b5a44000, 407713f5a00, 21, 4) at pmap_en
ter+0x45c
uvm_fault_lower(407713f5d08, 407713f5cd0, 4076cb4f440, 407713f5bd0, 407713f5af0
, 1cb9440) at uvm_fault_lower+0x4a4
uvm_fault(0, 407713f5d08, 0, 0, 11782e0, 2) at uvm_fault+0x1b8
data_access_fault(407713f5ee0, 31, 49f8e0, 294b78dc9, 294b78000, 1) at data_acc
ess_fault+0x184
sun4v_datatrap(294b78000, ffffffff, 206260, 2042d8cd0, 100, 268) at sun4v_datat
rap+0x200
ddb{1}> mach ddbcpu 2
Stopped at hv_cons_putchar+0xc: nop
cnputc(74, 74, 0, 40787973b30, 11782e0, 3) at cnputc+0x30
db_putchar(74, 14, 1, 0, 40762b1b820, 0) at db_putchar+0x140
kprintf(27, 14, 0, 0, 0, 31) at kprintf+0x99c
db_printf(18c0208, 41b9ffe88ac, 19031a8, 40762b1b8e8, 0, 41b9ff388ac) at db_pri
ntf+0x40
panic(19031a8, 1915230, 4077ae3b6b0, 0, 104, 41b9ffe88ac) at panic+0xa8
rw_do_enter_write(4077ae3b6b0, 1, 40762b1bd30, 0, 0, 0) at rw_do_enter_write+0x
1e4
uvm_fault_lower_lookup(40762b1bd08, 40762b1bcd0, 40762b1bbd0, 0, 0, 1a06e90) at
uvm_fault_lower_lookup+0x2c
uvm_fault_lower(40762b1bd08, 40762b1bcd0, 0, 40762b1bbd0, 40762b1baf0, 1cb9440)
at uvm_fault_lower+0x44
uvm_fault(0, 40762b1bd08, 0, 40787973b30, 11782e0, 3) at uvm_fault+0x1b8
data_access_fault(40762b1bee0, 31, 22300b508, 221afae65, 221afa000, 1) at data_
access_fault+0x184
sun4v_datatrap(4a31, 2e, 1, a3, 2e29b2, 0) at sun4v_datatrap+0x200
ddb{2}> mach ddbcpu 4
Stopped at delay+0x40: rdpr %tick, %o2
pmap_remove(6a5220c000, 6a52200000, 6a5221e000, 7fffffffe000, 19470c8, 1cbf000)
at pmap_remove+0x1e0
uvm_unmap_kill_entry_withlock(40774793a10, 40786305010, 1, 4076265d728, 0, 1) a
t uvm_unmap_kill_entry_withlock+0xd0
uvm_unmap_remove(40774793a10, ffffffffffffe000, 40786305010, 4076265d728, 1, 0)
at uvm_unmap_remove+0x244
uvmspace_exec(4077ca59360, 2000, ffffffffffffe000, 24f0, 0, 6d4e144948) at uvms
pace_exec+0x154
sys_execve(c, 6d4e144940, 4008f8d6930, 4011cff6000, 3c, 40770f21b10) at sys_exe
cve+0x5ac
syscall(4076265dee0, 1a06e90, 4076265df40, 1c00, 40770f21f10, 17d06e0) at sysca
ll+0x3c0
syscall_setup(fffffea81d8d35e8, 6cea8ae000, 6d4e1448c0, 1002, ffffffffffffffff,
0) at syscall_setup+0x124
ddb{4}> show proc
PROC (make) tid=44218 pid=27987 tcnt=1 stat=onproc
flags process=101005<CONTROLT,INEXEC,SINGLEEXIT,PLEDGE> proc=0
runpri=36, usrpri=86, slppri=36, nice=20
wchan=0x0, wmesg=, ps_single=0x4077ca59360 scnt=0 ecnt=0
forw=0xffffffffffffffff, list=0x4077ca58090,0x4077ca58b60
process=0x40770f21b10 user=0x4076265a000, vmspace=0x40774793a10
estcpu=36, cpticks=5159913, pctcpu=0.0, user=0, sys=5159913, intr=0
ddb{4}> mach ddbcpu 9
Stopped at __mp_lock+0x64: nop
syscall_setup(ffffffffffffffff, fffffea81d8d3dd4, 1, 0, 17a8, 6a52530248) at sy
scall_setup+0x124
ddb{9}> show proc
PROC (make) tid=313747 pid=2638 tcnt=1 stat=onproc
flags process=10100003<CONTROLT,EXEC,PLEDGE,WAITEVENT> proc=0
runpri=32, usrpri=86, slppri=32, nice=20
wchan=0x0, wmesg=, ps_single=0x0 scnt=0 ecnt=0
forw=0xffffffffffffffff, list=0x4076ab0ee10,0x40774512890
process=0x4076ab428f0 user=0x4076093a000, vmspace=0x4008f606ff0
estcpu=36, cpticks=5163642, pctcpu=9.6, user=30, sys=5163608, intr=3