I ran an strace as well. Below is from the last question from lxd init until I killed the process. All I can see is a connection to the unix socket and then a HTTP 200. I can provide the full strace if that would be helpful to anyone:
futex(0x17e5628, FUTEX_WAIT, 0, NULLChoose the local disk or dataset for storage pool "btrfspool1" (empty for loop disk): /dev/sdj Would you like a YAML "lxd init" preseed to be printed? (yes/no) [default=no]: no ) = 0 futex(0xc4200d3548, FUTEX_WAKE, 1) = 1 futex(0x17e5628, FUTEX_WAIT, 0, NULL) = 0 sched_yield() = 0 futex(0x17e4af0, FUTEX_WAKE, 1) = 0 futex(0x17e5628, FUTEX_WAIT, 0, NULL) = 0 futex(0xc4203ff148, FUTEX_WAKE, 1) = 1 sched_yield() = 0 futex(0x17e5628, FUTEX_WAIT, 0, NULL) = 0 sched_yield() = 0 futex(0x17e4af0, FUTEX_WAIT, 2, NULL) = -1 EAGAIN (Resource temporarily unavailable) futex(0x17e4af0, FUTEX_WAKE, 1) = 0 futex(0x17e5628, FUTEX_WAIT, 0, NULL) = 0 futex(0xc42009cd48, FUTEX_WAKE, 1) = 1 sched_yield() = 0 futex(0x17e4af0, FUTEX_WAIT, 2, NULL) = -1 EAGAIN (Resource temporarily unavailable) futex(0x17e4af0, FUTEX_WAKE, 1) = 0 futex(0x17e5628, FUTEX_WAIT, 0, NULL) = -1 EAGAIN (Resource temporarily unavailable) sched_yield() = 0 futex(0x17e4af0, FUTEX_WAIT, 2, NULL) = 0 futex(0x17e4af0, FUTEX_WAKE, 1) = 1 futex(0x17e5628, FUTEX_WAIT, 0, NULL) = 0 futex(0xc4204e1548, FUTEX_WAKE, 1) = 1 futex(0x17e5628, FUTEX_WAIT, 0, NULL) = 0 sched_yield() = 0 futex(0x17e4af0, FUTEX_WAIT, 2, NULL) = -1 EAGAIN (Resource temporarily unavailable) futex(0x17e4af0, FUTEX_WAKE, 1) = 1 futex(0x17e5628, FUTEX_WAIT, 0, NULL) = 0 futex(0xc4204e1148, FUTEX_WAKE, 1) = 1 sched_yield() = 0 futex(0x17e4af0, FUTEX_WAIT, 2, NULL) = -1 EAGAIN (Resource temporarily unavailable) futex(0x17e4af0, FUTEX_WAKE, 1) = 1 futex(0x17e5628, FUTEX_WAIT, 0, NULL) = 0 sched_yield() = 0 futex(0x17e4af0, FUTEX_WAIT, 2, NULL) = 0 futex(0x17e4af0, FUTEX_WAKE, 1) = 0 futex(0x17e5628, FUTEX_WAIT, 0, NULL) = 0 futex(0xc4200d3948, FUTEX_WAKE, 1) = 1 sched_yield() = 0 futex(0x17e4af0, FUTEX_WAKE, 1) = 0 futex(0x17e4be8, FUTEX_WAKE, 1) = 0 futex(0x17e4af0, FUTEX_WAKE, 1) = 1 futex(0x17e4bc0, FUTEX_WAIT, 0, {tv_sec=0, tv_nsec=100000}) = -1 EAGAIN (Resource temporarily unavailable) futex(0xc42027a148, FUTEX_WAKE, 1) = 1 futex(0xc4200d3948, FUTEX_WAKE, 1) = 1 futex(0xc4200d2d48, FUTEX_WAKE, 1) = 1 futex(0xc4204e1d48, FUTEX_WAKE, 1) = 1 futex(0xc42027a548, FUTEX_WAKE, 1) = 1 futex(0xc4203ff948, FUTEX_WAKE, 1) = 1 futex(0xc42009dd48, FUTEX_WAKE, 1) = 1 futex(0xc42027b948, FUTEX_WAKE, 1) = 1 futex(0xc4203fe148, FUTEX_WAKE, 1) = 1 futex(0xc42009cd48, FUTEX_WAKE, 1) = 1 futex(0xc4203fed48, FUTEX_WAKE, 1) = 1 futex(0xc4203ff148, FUTEX_WAKE, 1) = 1 futex(0xc42009d548, FUTEX_WAKE, 1) = 1 futex(0xc4200d3148, FUTEX_WAKE, 1) = 1 futex(0xc4204e0148, FUTEX_WAKE, 1) = 1 futex(0xc4204e1148, FUTEX_WAKE, 1) = 1 futex(0xc4204e1948, FUTEX_WAKE, 1) = 1 futex(0xc4204e1548, FUTEX_WAKE, 1) = 1 futex(0xc42027a948, FUTEX_WAKE, 1) = 1 futex(0xc420628148, FUTEX_WAKE, 1) = 1 futex(0xc420628548, FUTEX_WAKE, 1) = 1 futex(0xc42027bd48, FUTEX_WAKE, 1) = 1 futex(0xc42009d148, FUTEX_WAKE, 1) = 1 futex(0xc4203ff548, FUTEX_WAKE, 1) = 1 futex(0xc4204e0948, FUTEX_WAKE, 1) = 1 futex(0xc4200d3548, FUTEX_WAKE, 1) = 1 futex(0xc4203ffd48, FUTEX_WAKE, 1) = 1 futex(0xc42027b148, FUTEX_WAKE, 1) = 1 futex(0xc4203fe548, FUTEX_WAKE, 1) = 1 futex(0xc42027b548, FUTEX_WAKE, 1) = 1 futex(0xc4204e0548, FUTEX_WAKE, 1) = 1 futex(0x17e4af0, FUTEX_WAKE, 1) = 1 epoll_pwait(4, [], 128, 0, NULL, 34) = 0 futex(0xc4200d2d48, FUTEX_WAKE, 1) = 1 rt_sigprocmask(SIG_SETMASK, ~[RTMIN RT_1], [], 8) = 0 mmap(NULL, 8392704, PROT_NONE, MAP_PRIVATE|MAP_ANONYMOUS|MAP_STACK, -1, 0) = 0x7fc751ffc000 mprotect(0x7fc751ffd000, 8388608, PROT_READ|PROT_WRITE) = 0 clone(child_stack=0x7fc7527fbe70, flags=CLONE_VM|CLONE_FS|CLONE_FILES|CLONE_SIGHAND|CLONE_THREAD|CLONE_SYSVSEM|CLONE_SETTLS|CLONE_PARENT_SETTID|CLONE_CHILD_CLEARTID, parent_tidptr=0x7fc7527fc9d0, tls=0x7fc7527fc700, child_tidptr=0x7fc7527fc9d0) = 13862 rt_sigprocmask(SIG_SETMASK, [], NULL, 8) = 0 futex(0xc420628548, FUTEX_WAKE, 1) = 1 futex(0x17e4af0, FUTEX_WAKE, 1) = 1 futex(0x17e5628, FUTEX_WAIT, 0, NULL) = 0 futex(0x17e5628, FUTEX_WAIT, 0, NULL) = 0 futex(0x17e5628, FUTEX_WAIT, 0, NULL) = 0 epoll_pwait(4, [], 128, 0, NULL, 0) = 0 epoll_pwait(4, [{EPOLLIN|EPOLLOUT, {u32=90537520, u64=140497060724272}}], 128, -1, NULL, 25054624) = 1 futex(0x17e4bd0, FUTEX_WAKE, 1) = 1 read(5, "\26\3\3\0001\2\0\0-\3\3[cp*\373\264A\34[\234\326\304\3104_yi,v\214\370"..., 1024) = 1024 read(5, "\"\372\347=\244\257\32\vxu\323J5\204\301'\3274\330\332\1\344\316\326,\342`\355\251\350E\334"..., 1078) = 1043 getrandom("\x74\xc4\x77\xb7\x69\xa7\x5f\xe2\x17\x03\x6c\x40\xfd\xb1\x71\xd5\x62\xc9\x02\xa1\x1f\xf0\xf9\xc4\x5b\xe9\x19\xc8\xe2\xb5\xf8\x10", 32, 0) = 32 write(5, "\26\3\3\0\7\v\0\0\3\0\0\0\26\3\3\0%\20\0\0! \33O%\336`\277\340\321\16\362"..., 105) = 105 read(5, 0xc42059e400, 1024) = -1 EAGAIN (Resource temporarily unavailable) epoll_pwait(4, [], 128, 0, NULL, 0) = 0 epoll_pwait(4, [{EPOLLIN|EPOLLOUT, {u32=90537520, u64=140497060724272}}], 128, -1, NULL, 0) = 1 futex(0x17e4bd0, FUTEX_WAKE, 1) = 1 futex(0x17e4af0, FUTEX_WAKE, 1) = 1 read(5, "\24\3\3\0\1\1\26\3\3\0(\0\0\0\0\0\0\0\0\235\203\332>S\214\214\nz]\211\215\4"..., 1024) = 51 futex(0xc42027ad48, FUTEX_WAKE, 1) = 1 write(5, "\27\3\3\0\243\0\0\0\0\0\0\0\1\354tY\204\0\272\36\302W\200\337S\270\315b\300\2231\201"..., 168) = 168 futex(0xc42027ad48, FUTEX_WAKE, 1) = 1 futex(0x17e5628, FUTEX_WAIT, 0, NULL) = 0 futex(0x17e5628, FUTEX_WAIT, 0, NULL) = 0 futex(0x17e5628, FUTEX_WAIT, 0, NULL) = 0 futex(0x17e5628, FUTEX_WAIT, 0, NULL) = 0 epoll_pwait(4, [], 128, 0, NULL, 0) = 0 epoll_pwait(4, [{EPOLLIN|EPOLLOUT, {u32=90537520, u64=140497060724272}}], 128, -1, NULL, 25054624) = 1 futex(0x17e4bd0, FUTEX_WAKE, 1) = 1 futex(0x17e4af0, FUTEX_WAKE, 1) = 1 read(5, "\26\3\3\0001\2\0\0-\3\0038E$W\267\2146\332\252\241\256$Hw\333\24\314@\f\v\337"..., 1024) = 1024 read(5, "\"\372\347=\244\257\32\vxu\323J5\204\301'\3274\330\332\1\344\316\326,\342`\355\251\350E\334"..., 1078) = 1043 getrandom("\x02\xb0\xb3\x20\xd4\x8d\x58\x56\x0b\x6f\x21\x5e\xe4\x29\x11\xd3\x50\x69\x62\x70\xbe\x6a\x09\x45\x50\xf7\x3a\xeb\xc7\x28\x5e\x2a", 32, 0) = 32 write(5, "\26\3\3\0\7\v\0\0\3\0\0\0\26\3\3\0%\20\0\0! \23\273\263nk\221\227>\305\337"..., 105) = 105 read(5, 0xc42028d000, 1024) = -1 EAGAIN (Resource temporarily unavailable) epoll_pwait(4, [], 128, 0, NULL, 0) = 0 epoll_pwait(4, [{EPOLLIN|EPOLLOUT, {u32=90537520, u64=140497060724272}}], 128, -1, NULL, 0) = 1 futex(0x17e4bd0, FUTEX_WAKE, 1) = 1 futex(0x17e4af0, FUTEX_WAKE, 1) = 1 read(5, "\24\3\3\0\1\1\26\3\3\0(\0\0\0\0\0\0\0\0005T\350\7F\326U\241?\246\7\365\346"..., 1024) = 51 futex(0xc42027ad48, FUTEX_WAKE, 1) = 1 read(5, 0xc420344800, 2048) = -1 EAGAIN (Resource temporarily unavailable) futex(0x17e5628, FUTEX_WAIT, 0, NULL) = 0 futex(0x17e5628, FUTEX_WAIT, 0, NULL) = 0 epoll_pwait(4, [], 128, 0, NULL, 0) = 0 epoll_pwait(4, [{EPOLLOUT, {u32=90537520, u64=140497060724272}}], 128, -1, NULL, 25054624) = 1 epoll_pwait(4, [{EPOLLOUT, {u32=90537520, u64=140497060724272}}], 128, -1, NULL, 25054624) = 1 epoll_pwait(4, [{EPOLLIN|EPOLLOUT, {u32=90537520, u64=140497060724272}}], 128, -1, NULL, 25054624) = 1 futex(0x17e4bd0, FUTEX_WAKE, 1) = 1 futex(0x17e4af0, FUTEX_WAKE, 1) = 1 read(5, "HTTP/1.1 101 Switching Protocols"..., 4096) = 311 futex(0xc4200d2d48, FUTEX_WAKE, 1) = 1 futex(0xc4200d2d48, FUTEX_WAKE, 1) = 1 socket(AF_UNIX, SOCK_STREAM|SOCK_CLOEXEC|SOCK_NONBLOCK, 0) = 6 setsockopt(6, SOL_SOCKET, SO_BROADCAST, [1], 4) = 0 connect(6, {sa_family=AF_UNIX, sun_path="/var/lib/lxd/unix.socket"}, 27) = 0 epoll_ctl(4, EPOLL_CTL_ADD, 6, {EPOLLIN|EPOLLOUT|EPOLLRDHUP|EPOLLET, {u32=90537312, u64=140497060724064}}) = 0 getsockname(6, {sa_family=AF_UNIX}, [112->2]) = 0 getpeername(6, {sa_family=AF_UNIX, sun_path="/var/lib/lxd/unix.socket"}, [112->27]) = 0 futex(0xc4200d2d48, FUTEX_WAKE, 1) = 1 read(6, 0xc4203f0000, 4096) = -1 EAGAIN (Resource temporarily unavailable) futex(0x17e5628, FUTEX_WAIT, 0, NULL) = -1 EAGAIN (Resource temporarily unavailable) futex(0x17e5628, FUTEX_WAIT, 0, NULL) = 0 epoll_pwait(4, [], 128, 0, NULL, 0) = 0 epoll_pwait(4, [{EPOLLOUT, {u32=90537312, u64=140497060724064}}], 128, -1, NULL, 25054624) = 1 epoll_pwait(4, [{EPOLLOUT, {u32=90537312, u64=140497060724064}}], 128, -1, NULL, 25054624) = 1 epoll_pwait(4, [{EPOLLIN|EPOLLOUT, {u32=90537312, u64=140497060724064}}], 128, -1, NULL, 25054624) = 1 futex(0x17e4bd0, FUTEX_WAKE, 1) = 1 futex(0x17e4af0, FUTEX_WAKE, 1) = 1 read(6, "HTTP/1.1 200 OK\r\nContent-Type: a"..., 4096) = 538 futex(0xc4204e0548, FUTEX_WAKE, 1) = 1 epoll_ctl(4, EPOLL_CTL_DEL, 6, 0xc4205d79d4) = 0 close(6) = 0 futex(0xc4200d2d48, FUTEX_WAKE, 1) = 1 futex(0x17e5628, FUTEX_WAIT, 0, NULL) = 0 futex(0xc42027b548, FUTEX_WAKE, 1) = 1 futex(0x17e5628, FUTEX_WAIT, 0, NULL) = -1 EAGAIN (Resource temporarily unavailable) futex(0x17e5628, FUTEX_WAIT, 0, NULL) = -1 EAGAIN (Resource temporarily unavailable) futex(0xc4200d2d48, FUTEX_WAKE, 1) = 1 sched_yield() = 0 futex(0x17e4af0, FUTEX_WAIT, 2, NULL) = -1 EAGAIN (Resource temporarily unavailable) futex(0x17e4af0, FUTEX_WAKE, 1) = 0 futex(0x17e4be8, FUTEX_WAKE, 1) = 1 futex(0x17e4af0, FUTEX_WAKE, 1) = 1 futex(0x17e4bc0, FUTEX_WAKE, 1) = 1 futex(0x17e4af0, FUTEX_WAKE, 1) = 1 sched_yield() = 0 futex(0x17e4af0, FUTEX_WAIT, 2, NULL) = 0 futex(0x17e4af0, FUTEX_WAKE, 1) = 1 futex(0x17e5628, FUTEX_WAIT, 0, NULL ^C) = ? ERESTARTSYS (To be restarted if SA_RESTART is set) strace: Process 13785 detached On 3/19/20 11:41, Joshua Schaeffer wrote: > Hey all, I'm trying to build a cluster on Ubuntu 18.04 with lxd 3.0.3. I was > able to bootstrap the first node without any issues, but when I try to add a > second node it just hangs and never returns the terminal prompt. Here is my > bootstrapped node: > > lxcuser@blllxc02:~$ lxc cluster list > +----------+----------------------------------------------+----------+--------+-------------------+ > | NAME | URL | DATABASE | STATE > | MESSAGE | > +----------+----------------------------------------------+----------+--------+-------------------+ > | blllxc02 | https://blllxc02-mgmt.harmonywave.cloud:8443 | YES | ONLINE > | fully operational | > +----------+----------------------------------------------+----------+--------+-------------------+ > > And here is the second node I am trying to add: > > lxcuser@blllxc01:~$ sudo lxd init > Would you like to use LXD clustering? (yes/no) [default=no]: yes > What name should be used to identify this node in the cluster? > [default=blllxc01]: > What IP address or DNS name should be used to reach this node? > [default=fe80::6a1c:a2ff:fe13:1ec6]: blllxc01-mgmt.harmonywave.cloud > Are you joining an existing cluster? (yes/no) [default=no]: yes > IP address or FQDN of an existing cluster node: > blllxc02-mgmt.harmonywave.cloud > Cluster fingerprint: > 20b51145761f3444278317331feeded8492c263920889f5dccd83772da0c42cf > You can validate this fingerpring by running "lxc info" locally on an > existing node. > Is this the correct fingerprint? (yes/no) [default=no]: yes > Cluster trust password: > All existing data is lost when joining a cluster, continue? (yes/no) > [default=no] yes > Choose the local disk or dataset for storage pool "btrfspool1" (empty for > loop disk): /dev/sdj > Would you like a YAML "lxd init" preseed to be printed? (yes/no) [default=no]: > > ^C > lxcuser@blllxc01:~$ lxc cluster list > Error: LXD server isn't part of a cluster > > After the last question from lxd init my terminal never returns. I've left it > like this overnight with no change. This is all I'm seeing in the logs as > well from the time I run lxd init to when I abort the process: > > Logs from the node trying to be added: > t=2020-03-18T20:17:07-0600 lvl=info msg="Creating BTRFS storage pool > \"btrfspool1\"" > t=2020-03-18T20:17:08-0600 lvl=warn msg="Failed to detect UUID by looking at > /dev/disk/by-uuid" > t=2020-03-18T20:17:08-0600 lvl=info msg="Created BTRFS storage pool > \"btrfspool1\"" > t=2020-03-19T02:12:27-0600 lvl=info msg="Updating images" > t=2020-03-19T02:12:27-0600 lvl=info msg="Done updating images" > t=2020-03-19T08:12:27-0600 lvl=info msg="Updating images" > t=2020-03-19T08:12:27-0600 lvl=info msg="Done updating images" > > Logs from the bootstrapped node: > t=2020-03-18T17:05:58-0600 lvl=info msg="Initializing global database" > t=2020-03-18T17:06:02-0600 lvl=warn msg="Raft: Heartbeat timeout from \"\" > reached, starting election" > t=2020-03-18T17:06:03-0600 lvl=info msg="Initializing storage pools" > t=2020-03-18T17:06:03-0600 lvl=info msg="Initializing networks" > t=2020-03-18T17:06:03-0600 lvl=info msg="Pruning leftover image files" > t=2020-03-18T17:06:03-0600 lvl=info msg="Done pruning leftover image files" > t=2020-03-18T17:06:03-0600 lvl=info msg="Loading daemon configuration" > t=2020-03-18T17:06:03-0600 lvl=info msg="Pruning expired images" > t=2020-03-18T17:06:03-0600 lvl=info msg="Done pruning expired images" > t=2020-03-18T17:06:03-0600 lvl=info msg="Expiring log files" > t=2020-03-18T17:06:03-0600 lvl=info msg="Done expiring log files" > t=2020-03-18T17:06:03-0600 lvl=info msg="Updating images" > t=2020-03-18T17:06:03-0600 lvl=info msg="Done updating images" > t=2020-03-18T17:06:03-0600 lvl=info msg="Updating instance types" > t=2020-03-18T17:06:03-0600 lvl=info msg="Done updating instance types" > t=2020-03-18T23:06:03-0600 lvl=info msg="Updating images" > t=2020-03-18T23:06:03-0600 lvl=info msg="Done updating images" > t=2020-03-19T05:06:03-0600 lvl=info msg="Updating images" > t=2020-03-19T05:06:03-0600 lvl=info msg="Done updating images" > t=2020-03-19T11:06:03-0600 lvl=info msg="Updating images" > t=2020-03-19T11:06:03-0600 lvl=info msg="Done updating images" > > Any idea where I can get more information about what is going on to > successfully add the node to the cluster? > -- > Thanks, > Joshua Schaeffer > > _______________________________________________ > lxc-users mailing list > lxc-users@lists.linuxcontainers.org > http://lists.linuxcontainers.org/listinfo/lxc-users -- Thanks, Joshua Schaeffer
_______________________________________________ lxc-users mailing list lxc-users@lists.linuxcontainers.org http://lists.linuxcontainers.org/listinfo/lxc-users