Coda File System

venus instability and crash

From: Steffen Neumann <sneumann_at_TechFak.Uni-Bielefeld.DE>
Date: 20 Feb 2002 14:31:26 +0100
Hi,

for the last two days venus has been crashing
shortly after any access. Some diagnostic output is attached.

It only worked again after running venus -init; all volumes
were connected, so no data was lost.

Yours,
Steffen


=========================================================================
console.log:
----------------------------------------------------------
Coda Venus, version 5.3.17

Date: Tue 02/19/2002

08:58:57 /opt/coda/coda_client/LOG size is 6483456 bytes
08:58:57 /opt/coda/coda_client/DATA size is 25927736 bytes
08:58:57 Loading RVM data
08:58:58 Last init was Fri Dec  7 15:15:56 2001
08:58:58 Last shutdown was dirty
08:58:58 starting VDB scan
08:58:58        42 volume replicas
08:58:58        41 replicated volumes
08:58:58        0 CML entries allocated
08:58:58        32 CML entries on free-list
08:58:58 starting FSDB scan (10416, 250000) (25, 75, 4)
08:58:58        9915 cache files in table (60886 blocks)
08:58:58        501 cache files on free-list
08:58:59 starting HDB scan
08:58:59        0 hdb entries in table
08:58:59        0 hdb entries on free-list
08:58:59 Getting Root Volume information...
08:58:59 Venus starting...
08:58:59 /coda now mounted.

09:45:00 root acquiring Coda tokens!
...
22:45:00 root acquiring Coda tokens!
RVMLIB_ASSERT: error in rvmlib_malloc

Assertion failed: 0, file "rvmlib.c", line 209
Sleeping forever.  You may use gdb to attach to process 27386.
----------------------------------------------------------
venus.log:
----------------------------------------------------------
...
[ W(21) : 0000 : 23:24:03 ] Cachefile::SetLength 512
[ W(21) : 0000 : 23:24:03 ] Cachefile::SetLength 512
[ W(21) : 0000 : 23:24:03 ] Cachefile::SetLength 512
[ W(21) : 0000 : 23:24:03 ] Cachefile::SetLength 512
[ W(21) : 0000 : 23:24:03 ] Cachefile::SetLength 512
[ W(21) : 0000 : 23:24:03 ] Cachefile::SetLength 512
[ W(21) : 0000 : 23:24:03 ] Cachefile::SetLength 512
[ W(21) : 0000 : 23:24:03 ] Cachefile::SetLength 512
[ W(21) : 0000 : 23:24:03 ] Cachefile::SetLength 512
[ W(21) : 0000 : 23:24:03 ] Cachefile::SetLength 512
[ W(21) : 0000 : 23:24:03 ] Cachefile::SetLength 10752
----------------------------------------------------------
gdb venus:
----------------------------------------------------------
(gdb) where
#0  0x401783a1 in nanosleep () from /lib/libc.so.6
#1  0x401782dc in __sleep (seconds=1) at ../sysdeps/unix/sysv/linux/sleep.c:67
#2  0x80cf5ca in coda_assert (pred=0x80f3053 "0", file=0x80f2fe4 "rvmlib.c", line=209) at coda_assert.c:46
#3  0x80b6352 in rvmlib_malloc (size=24576, file=0x80f34ea "codadir.c", line=222) at rvmlib.c:209
#4  0x80b8a6c in DH_Alloc (dh=0x2132cf88, size=24576, in_rvm=1) at codadir.c:222
#5  0x805c466 in fsobj::Fetch (this=0x21540d88, vuid=0) at fso_cfscalls0.cc:204
#6  0x8053064 in fsdb::Get (this=0x218b5c88, f_addr=0x151d9dcc, key=0x151dbe34, vuid=0, rights=12, 
    comp=0x0, rcode=0x0, GetInconsistent=0) at fso0.cc:876
#7  0x80ac8f8 in vproc::open (this=0x81e5528, cp=0x151dbe30, flags=1) at vproc_vfscalls.cc:193
#8  0x80b16e9 in worker::main (this=0x81e5528) at worker.cc:1301
#9  0x80a7cd2 in VprocPreamble (init_lock=0x81e5568) at vproc.cc:146
#10 0x4008d2d0 in Create_Process_Part2 () at lwp.c:792

(gdb) up 3
#3  0x80b6352 in rvmlib_malloc (size=24576, file=0x80f34ea "codadir.c", line=222) at rvmlib.c:209
209     rvmlib.c: No such file or directory.
(gdb) p err
$13 = -9
(gdb) p RvmType
$9 = UFS
(gdb) p size
$10 = 24576
(gdb) p _rvm_data
$11 = (rvm_perthread_t *) 0x0
(gdb) p *rvmlib_thread_data()
$12 = {tid = 0x81e5544, tids = {struct_id = rvm_tid_id, from_heap = rvm_false, uname = {
      tv_sec = 1014157444, tv_usec = 666708}, tid = 0x8112108, reserved = 0}, list = {size = 0, count = 0, 
    table = 0x0}}

(gdb) up       
#4  0x80b8a6c in DH_Alloc (dh=0x2132cf88, size=24576, in_rvm=1) at codadir.c:222
222     codadir.c: No such file or directory.
(gdb) p *dh
$15 = {dh_lock = {wait_states = 0 '\000', excl_locked = 2 '\002', readers_reading = 0 '\000', 
    num_waiting = 0 '\000', excl_locker = 0x811a5d8}, dh_data = 0x0, dh_dirty = 1}

(gdb) up
#5  0x805c466 in fsobj::Fetch (this=0x21540d88, vuid=0) at fso_cfscalls0.cc:204
204     fso_cfscalls0.cc: No such file or directory.
(gdb) p *this
$21 = {MagicNumber = 2687694, fid = {Volume = 2130706477, Vnode = 309, Unique = 3195}, 
  comp = 0x20da08c8 "html", vol = 0x20e8a288, primary_handle = {next = 0x216362e0}, vol_handle = {
    next = 0x21746164, _vptr. = 0x0}, prio_handle = {mytree = 0x8116b50, parent = 0x21491dac, 
    leftchild = 0x0, rightchild = 0x0, _vptr. = 0x0}, del_handle = {next = 0x0, prev = 0x0, _vptr. = 0x0}, 
  owrite_handle = {next = 0x0, _vptr. = 0x0}, state = FsoNormal, stat = {VnodeType = Directory, 
    LinkCount = 2 '\002', Length = 24576, DataVersion = 593, VV = {Versions = {Site0 = 593, Site1 = 0, 
        Site2 = 0, Site3 = 0, Site4 = 0, Site5 = 0, Site6 = 0, Site7 = 0}, StoreId = {Host = 1015241729, 
        Uniquifier = 27918}, Flags = 0}, Date = 980442462, Author = 4294967295, Owner = 10157, Mode = 493}, 
  GotThisData = 0, RcRights = 3, AnyUser = {uid = 4294967295, rights = 9 '\t', inuse = 1, valid = 1}, 
  SpecificUser = {{uid = 4294967295, rights = 0 '\000', inuse = 0, valid = 0}, {uid = 4294967295, 
      rights = 0 '\000', inuse = 0, valid = 0}, {uid = 4294967295, rights = 0 '\000', inuse = 0, 
      valid = 0}, {uid = 4294967295, rights = 0 '\000', inuse = 0, valid = 0}, {uid = 4294967295, 
      rights = 0 '\000', inuse = 0, valid = 0}, {uid = 4294967295, rights = 0 '\000', inuse = 0, 
      valid = 0}, {uid = 4294967295, rights = 0 '\000', inuse = 0, valid = 0}, {uid = 0, rights = 9 '\t', 
      inuse = 1, valid = 1}}, flags = {random = 10755, fake = 0, owrite = 0, dirty = 0, local = 0, 
    ckmtpt = 0, fetching = 1, padding = 0}, mvstat = NORMAL, u = {root = 0x0, mtpoint = 0x0}, pfid = {
    Volume = 2130706477, Vnode = 305, Unique = 3193}, pfso = 0x2172a148, children = 0x0, child_link = {
    next = 0x21755914, prev = 0x218521d4, _vptr. = 0x0}, priority = 25000, HoardPri = 0, 
  HoardVuid = 4294967294, hdb_bindings = 0x0, FetchAllowed = 1, AskingAllowed = 0, mle_bindings = 0x0, 
  CleanStat = {Length = -1, Date = 4294967295}, tSid = {Host = 0, Uniquifier = 0}, shadow = 0x0, data = {
    havedata = 556978056, file = 0x2132cf88, dir = 0x2132cf88, symlink = 0x2132cf88 ""}, ix = 7960, cf = {
    length = 0, validdata = 0, refcnt = 1, inode = 1956393, name = "00/00/1F/18", numopens = 0}, 
  fso_sync = 0 '\000', readers = 0, writers = 1, openers = 0, Writers = 0, Execers = 0, refcnt = 1, 
  lastresolved = 0}
(gdb) p *data.dir
$19 = {dh = {dh_lock = {wait_states = 0 '\000', excl_locked = 2 '\002', readers_reading = 0 '\000', 
      num_waiting = 0 '\000', excl_locker = 0x811a5d8}, dh_data = 0x0, dh_dirty = 1}, udcfvalid = 0, 
  udcf = 0x0, padding = 0}
(gdb) p *sei
$20 = {TransmissionDirection = SERVERTOCLIENT, hashmark = 0 '\000', SeekOffset = 0, BytesTransferred = 0, 
  ByteQuota = -1, QuotaExceeded = 0, Tag = 0, FileInfo = {ByName = {ProtectionBits = 0, 
      LocalFileName = '\000' <repeats 255 times>}, ByInode = {Device = 0, Inode = 0}, ByFD = {fd = 0}, 
    ByAddr = {vmfile = {MaxSeqLen = 0, SeqLen = 0, SeqBody = 0x0}, vmfilep = 0}}}

Received on 2002-02-20 08:31:43