[OpenAFS-devel] fileserver crash on Solaris 2.6 with 1.2.7

Martin MOKREJŠ mmokrejs@natur.cuni.cz
Fri, 13 Dec 2002 03:21:31 +0100 (CET)


Hi,
  couldn't this be a problem with ptserver/vlserver on my Solaris box?


bash-2.04$ fs getserverprefs
wormhole                                           40011
pf-i400.natur.cuni.cz                              20014
nmrindy.natur.cuni.cz                              20004
bash-2.04$

The 'wormhole' entry used to be a second network card on this host.
It has been shut down for some years now, so it is unreachable.
To make it more difficult, the second Solaris machine has its
second ethernet card enabled, with wormhole as its hostname and the
same IP address. Is it possible that afsd on that second
machine propagates the information about vlserver running
on that IP address (10.0.0.1) to this problematic Solaris machine1?

Tracing the fileserver on server1 gives me:
time()                                          = 1039744101
lwp_sema_post(0xEF568590)                       = 0
sigprocmask(SIG_UNBLOCK, 0xEF568580, 0x00000000) = 0
lwp_sema_wait(0xEF568590)                       = 0
sigprocmask(SIG_BLOCK, 0xEF568580, 0x00000000)  = 0
setitimer(ITIMER_REAL, 0xEF103CC8, 0x00000000)  = 0
sigprocmask(SIG_UNBLOCK, 0xEF568580, 0x00000000) = 0
recvmsg(5, 0xEF305C80, 0)                       = 65
time()                                          = 1039744101
recvmsg(5, 0xEF305C80, 0)                       = 28
lwp_sema_post(0xEE386E78)                       = 0
lwp_sema_wait(0xEE386E78)                       = 0
time()                                          = 1039744101
lwp_sema_post(0xEE386E78)                       = 0
lwp_sema_wait(0xEE386E78)                       = 0
lwp_mutex_unlock(0xEF56B280)                    = 0
lwp_mutex_lock(0xEF56B280)                      = 0
stat("/usr/afs/local/sysid", 0xEE386BB8)        = 0
rename("/usr/afs/local/sysid", "/usr/afs/local/sysid.old") = 0
    Received signal #14, SIGALRM, in lwp_sema_wait() [caught]
open("/usr/afs/local/sysid", O_WRONLY|O_CREAT|O_TRUNC, 0666) = 12
write(12, "88AABBCC\0\0\001", 8)                = 8
lwp_sema_wait(0xEF568590)                       Err#91 ERESTART
write(12, "\0 -D2C8BEE719E5AAA8C3 q".., 16)     = 16
write(12, "\0\0\001", 4)                        = 4
write(12, "C3 q ; y", 4)                        = 4
sigprocmask(SIG_SETMASK, 0xEF103E28, 0x00000000) = 0
close(12)                                       = 0
lwp_sema_post(0xEF204E78)                       = 0
lwp_sema_wait(0xEF204E78)                       = 0
setitimer(ITIMER_REAL, 0xEF103880, 0x00000000)  = 0
lwp_sema_post(0xEF568590)                       = 0
sigprocmask(SIG_SETMASK, 0xEF570AA0, 0x00000000) = 0
setcontext(0xEF103B18)
sigprocmask(SIG_BLOCK, 0xEF568580, 0x00000000)  = 0
setitimer(ITIMER_REAL, 0xEF103CC8, 0x00000000)  = 0
sigprocmask(SIG_UNBLOCK, 0xEF568580, 0x00000000) = 0
lwp_sema_wait(0xEF568590)                       = 0
sigprocmask(SIG_BLOCK, 0xEF568580, 0x00000000)  = 0
setitimer(ITIMER_REAL, 0xEF103CC8, 0x00000000)  = 0
sigprocmask(SIG_UNBLOCK, 0xEF568580, 0x00000000) = 0
    Received signal #14, SIGALRM, in lwp_sema_wait() [caught]
lwp_sema_wait(0xEF568590)                       Err#91 ERESTART
sigprocmask(SIG_SETMASK, 0xEF103E28, 0x00000000) = 0
lwp_sema_post(0xEF204E78)                       = 0
lwp_sema_wait(0xEF204E78)                       = 0
setitimer(ITIMER_REAL, 0xEF103880, 0x00000000)  = 0
sigprocmask(SIG_SETMASK, 0xEF570AA0, 0x00000000) = 0
sendmsg(5, 0xEF204AA8, 0)                       = 65
setcontext(0xEF103B18)
time()                                          = 1039744102
sigprocmask(SIG_BLOCK, 0xEF568580, 0x00000000)  = 0
setitimer(ITIMER_REAL, 0xEF103CC8, 0x00000000)  = 0
lwp_sema_post(0xEF568590)                       = 0
sigprocmask(SIG_UNBLOCK, 0xEF568580, 0x00000000) = 0
lwp_sema_wait(0xEF568590)                       = 0
sigprocmask(SIG_BLOCK, 0xEF568580, 0x00000000)  = 0
setitimer(ITIMER_REAL, 0xEF103CC8, 0x00000000)  = 0
sigprocmask(SIG_UNBLOCK, 0xEF568580, 0x00000000) = 0
recvmsg(5, 0xEF305C80, 0)       (sleeping...)
    Received signal #14, SIGALRM, in lwp_sema_wait() [caught]
lwp_sema_wait(0xEF568590)                       Err#91 ERESTART
sigprocmask(SIG_SETMASK, 0xEF103E28, 0x00000000) = 0
lwp_sema_post(0xEF204E78)                       = 0
lwp_sema_wait(0xEF204E78)                       = 0
setitimer(ITIMER_REAL, 0xEF103880, 0x00000000)  = 0
sigprocmask(SIG_SETMASK, 0xEF570AA0, 0x00000000) = 0
lwp_sema_post(0xEF568590)                       = 0
setcontext(0xEF103B18)
sigprocmask(SIG_BLOCK, 0xEF568580, 0x00000000)  = 0
setitimer(ITIMER_REAL, 0xEF103CC8, 0x00000000)  = 0
sigprocmask(SIG_UNBLOCK, 0xEF568580, 0x00000000) = 0
lwp_sema_wait(0xEF568590)                       = 0
sigprocmask(SIG_BLOCK, 0xEF568580, 0x00000000)  = 0
sigprocmask(SIG_BLOCK, 0xEF568580, 0xEF103CB8)  = 0
lwp_sema_post(0xEF204E78)                       = 0
lwp_sema_wait(0xEF204E78)                       = 0
setitimer(ITIMER_REAL, 0xEF103B60, 0x00000000)  = 0
sigprocmask(SIG_SETMASK, 0xEF103CB8, 0x00000000) = 0
sigprocmask(SIG_UNBLOCK, 0xEF568580, 0x00000000) = 0
time()                                          = 1039744160
lwp_sema_post(0xEF568590)                       = 0
lwp_sema_wait(0xEF568590)                       = 0
sigprocmask(SIG_BLOCK, 0xEF568580, 0x00000000)  = 0
setitimer(ITIMER_REAL, 0xEF103CC8, 0x00000000)  = 0
sigprocmask(SIG_UNBLOCK, 0xEF568580, 0x00000000) = 0
recvmsg(5, 0xEF305C80, 0)       (sleeping...)
    Received signal #14, SIGALRM, in lwp_sema_wait() [caught]
lwp_sema_wait(0xEF568590)                       Err#91 ERESTART
sigprocmask(SIG_SETMASK, 0xEF103E28, 0x00000000) = 0
lwp_sema_post(0xEF204E78)                       = 0
lwp_sema_wait(0xEF204E78)                       = 0
setitimer(ITIMER_REAL, 0xEF103880, 0x00000000)  = 0
sigprocmask(SIG_SETMASK, 0xEF570AA0, 0x00000000) = 0
lwp_sema_post(0xEF568590)                       = 0
setcontext(0xEF103B18)
sigprocmask(SIG_BLOCK, 0xEF568580, 0x00000000)  = 0
setitimer(ITIMER_REAL, 0xEF103CC8, 0x00000000)  = 0
sigprocmask(SIG_UNBLOCK, 0xEF568580, 0x00000000) = 0
lwp_sema_wait(0xEF568590)                       = 0
sigprocmask(SIG_BLOCK, 0xEF568580, 0x00000000)  = 0
setitimer(ITIMER_REAL, 0xEF103CC8, 0x00000000)  = 0
sigprocmask(SIG_UNBLOCK, 0xEF568580, 0x00000000) = 0
recvmsg(5, 0xEF305C80, 0)       (sleeping...)
    Received signal #14, SIGALRM, in lwp_sema_wait() [caught]
lwp_sema_wait(0xEF568590)                       Err#91 ERESTART
sigprocmask(SIG_SETMASK, 0xEF103E28, 0x00000000) = 0
lwp_sema_post(0xEF204E78)                       = 0
lwp_sema_wait(0xEF204E78)                       = 0
setitimer(ITIMER_REAL, 0xEF103880, 0x00000000)  = 0
sigprocmask(SIG_SETMASK, 0xEF570AA0, 0x00000000) = 0
setcontext(0xEF103B18)
sigprocmask(SIG_BLOCK, 0xEF568580, 0x00000000)  = 0
setitimer(ITIMER_REAL, 0xEF103CC8, 0x00000000)  = 0
sigprocmask(SIG_UNBLOCK, 0xEF568580, 0x00000000) = 0
recvmsg(5, 0xEF305C80, 0)       (sleeping...)
lwp_cond_wait(0xEF56B270, 0xEF56B280, 0xEF514C48) Err#62 ETIME
time()                                          = 1039744399
    Received signal #14, SIGALRM, in lwp_sema_wait() [caught]
lwp_sema_wait(0xEF568590)                       Err#91 ERESTART
sigprocmask(SIG_SETMASK, 0xEF103E28, 0x00000000) = 0
lwp_sema_post(0xEE386E78)                       = 0
lwp_sema_wait(0xEE386E78)                       = 0
lwp_mutex_unlock(0xEF56B280)                    = 0
lwp_mutex_lock(0xEF56B280)                      = 0
setitimer(ITIMER_REAL, 0xEF103880, 0x00000000)  = 0
sigprocmask(SIG_SETMASK, 0xEF570AA0, 0x00000000) = 0
setcontext(0xEF103B18)
sigprocmask(SIG_BLOCK, 0xEF568580, 0x00000000)  = 0
setitimer(ITIMER_REAL, 0xEF103CC8, 0x00000000)  = 0
sigprocmask(SIG_UNBLOCK, 0xEF568580, 0x00000000) = 0
    Received signal #14, SIGALRM, in lwp_sema_wait() [caught]
lwp_sema_wait(0xEF568590)                       Err#91 ERESTART
sigprocmask(SIG_SETMASK, 0xEF103E28, 0x00000000) = 0
lwp_sema_post(0xEF204E78)                       = 0
lwp_sema_wait(0xEF204E78)                       = 0
setitimer(ITIMER_REAL, 0xEF103880, 0x00000000)  = 0
sigprocmask(SIG_SETMASK, 0xEF570AA0, 0x00000000) = 0
access("/usr/afs/logs/FileLog", 0)              = 0
setcontext(0xEF103B18)
sigprocmask(SIG_BLOCK, 0xEF568580, 0x00000000)  = 0
setitimer(ITIMER_REAL, 0xEF103CC8, 0x00000000)  = 0
sigprocmask(SIG_UNBLOCK, 0xEF568580, 0x00000000) = 0
statvfs("/vicepa", 0xEE386B2C)                  = 0
recvmsg(5, 0xEF305C80, 0)       (sleeping...)
    Received signal #14, SIGALRM, in lwp_sema_wait() [caught]
lwp_sema_wait(0xEF568590)                       Err#91 ERESTART
sigprocmask(SIG_SETMASK, 0xEF103E28, 0x00000000) = 0
lwp_sema_post(0xEE285E78)                       = 0
lwp_sema_wait(0xEE285E78)                       = 0
lwp_mutex_unlock(0xEF56B280)                    = 0
lwp_mutex_lock(0xEF56B280)                      = 0
setitimer(ITIMER_REAL, 0xEF103880, 0x00000000)  = 0
lwp_sema_post(0xEF568590)                       = 0
sigprocmask(SIG_SETMASK, 0xEF570AA0, 0x00000000) = 0
setcontext(0xEF103B18)
sigprocmask(SIG_BLOCK, 0xEF568580, 0x00000000)  = 0
setitimer(ITIMER_REAL, 0xEF103CC8, 0x00000000)  = 0
sigprocmask(SIG_UNBLOCK, 0xEF568580, 0x00000000) = 0
lwp_sema_wait(0xEF568590)                       = 0
sigprocmask(SIG_BLOCK, 0xEF568580, 0x00000000)  = 0
setitimer(ITIMER_REAL, 0xEF103CC8, 0x00000000)  = 0
sigprocmask(SIG_UNBLOCK, 0xEF568580, 0x00000000) = 0
recvmsg(5, 0xEF305C80, 0)       (sleeping...)

-- 
Martin Mokrejs <mmokrejs@natur.cuni.cz>, <m.mokrejs@gsf.de>
PGP5.0i key is at http://www.natur.cuni.cz/~mmokrejs
MIPS / Institute for Bioinformatics <http://mips.gsf.de>
GSF - National Research Center for Environment and Health
Ingolstaedter Landstrasse 1, D-85764 Neuherberg, Germany
tel.: +49-89-3187 3683 , fax: +49-89-3187 3585