[Lustre-discuss] mkfs.lustre hangs the system (SUSE Linux 11 sp1, Lustre MGS/MDT)

Jon Zhu jon.zhu at gmail.com
Sat Jun 11 08:02:59 PDT 2011


Hi,

Does anyone know why mkfs.lustre hangs the system? The problem occurred with
Lustre 1.8.5 on SUSE Linux 11 (x86_64); the hardware platform is Amazon EC2.
Here's the full strace log:

ldiskfs # strace mkfs.lustre --fsname=temp --mgs --mdt /dev/sdf
execve("/usr/sbin/mkfs.lustre", ["mkfs.lustre", "--fsname=temp", "--mgs", "--mdt", "/dev/sdf"], [/* 51 vars */]) = 0
brk(0)                                  = 0x612000
mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1, 0) = 0x7f30124b4000
access("/etc/ld.so.preload", R_OK)      = -1 ENOENT (No such file or directory)
open("/etc/ld.so.cache", O_RDONLY)      = 3
fstat(3, {st_mode=S_IFREG|0644, st_size=50926, ...}) = 0
mmap(NULL, 50926, PROT_READ, MAP_PRIVATE, 3, 0) = 0x7f30124a7000
close(3)                                = 0
open("/lib64/libc.so.6", O_RDONLY)      = 3
read(3, "\177ELF\2\1\1\0\0\0\0\0\0\0\0\0\3\0>\0\1\0\0\0\340\354\1\0\0\0\0\0"..., 832) = 832
fstat(3, {st_mode=S_IFREG|0755, st_size=1661454, ...}) = 0
mmap(NULL, 3528776, PROT_READ|PROT_EXEC, MAP_PRIVATE|MAP_DENYWRITE, 3, 0) = 0x7f3011f39000
fadvise64(3, 0, 3528776, POSIX_FADV_WILLNEED) = 0
mprotect(0x7f301208d000, 2097152, PROT_NONE) = 0
mmap(0x7f301228d000, 20480, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x154000) = 0x7f301228d000
mmap(0x7f3012292000, 18504, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_ANONYMOUS, -1, 0) = 0x7f3012292000
close(3)                                = 0
mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1, 0) = 0x7f30124a6000
mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1, 0) = 0x7f30124a5000
mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1, 0) = 0x7f30124a4000
arch_prctl(ARCH_SET_FS, 0x7f30124a5700) = 0
mprotect(0x7f301228d000, 16384, PROT_READ) = 0
mprotect(0x608000, 4096, PROT_READ)     = 0
mprotect(0x7f30124b5000, 4096, PROT_READ) = 0
munmap(0x7f30124a7000, 50926)           = 0
open("/proc/sys/kernel/osrelease", O_RDONLY) = 3
read(3, "2.6.", 4)                      = 4
close(3)                                = 0
access("/dev/sdf", F_OK)                = 0
stat("/dev/sdf", {st_mode=S_IFBLK|0660, st_rdev=makedev(8, 80), ...}) = 0
access("/usr/sbin/l_getgroups", R_OK|X_OK) = 0
fstat(1, {st_mode=S_IFCHR|0620, st_rdev=makedev(136, 0), ...}) = 0
mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1, 0) = 0x7f30124b3000
write(1, "\n", 1
)                       = 1
write(1, "   Permanent disk data:\n", 24   Permanent disk data:
) = 24
write(1, "Target:     temp-MDTffff\n", 25Target:     temp-MDTffff
) = 25
write(1, "Index:      unassigned\n", 23Index:      unassigned
) = 23
write(1, "Lustre FS:  temp\n", 17Lustre FS:  temp
)      = 17
write(1, "Mount type: ldiskfs\n", 20Mount type: ldiskfs
)   = 20
write(1, "Flags:      0x75\n", 17Flags:      0x75
)      = 17
write(1, "              (MDT MGS needs_ind"..., 55              (MDT MGS needs_index first_time update )
) = 55
write(1, "Persistent mount opts: iopen_nop"..., 65Persistent mount opts: iopen_nopriv,user_xattr,errors=remount-ro
) = 65
write(1, "Parameters: mdt.group_upcall=/us"..., 51Parameters: mdt.group_upcall=/usr/sbin/l_getgroups
) = 51
write(1, "\n", 1
)                       = 1
brk(0)                                  = 0x612000
brk(0x633000)                           = 0x633000
open("/etc/mtab", O_RDONLY)             = 3
fstat(3, {st_mode=S_IFREG|0644, st_size=349, ...}) = 0
mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1, 0) = 0x7f30124b2000
read(3, "/dev/sda1 / ext3 rw,acl,user_xat"..., 4096) = 349
read(3, "", 4096)                       = 0
close(3)                                = 0
munmap(0x7f30124b2000, 4096)            = 0
syscall_293(0x7fff65afd9c0, 0x80000, 0x406af9, 0x7f30124a5700, 0, 0x612100,
0x61                                             1820, 0x611820, 0x611820,
0x611820, 0x611820, 0x611820, 0x611820, 0x611820, 0x61
                      1820, 0x611820, 0x611820, 0x611820, 0x611820,
0x611820, 0x611820, 0x611820, 0x61
  1820, 0x611820, 0x611820, 0x611820, 0x611820, 0x611820, 0x611820,
0x611820, 0x61                                             1820, 0x611820) =
0
clone(child_stack=0, flags=CLONE_CHILD_CLEARTID|CLONE_CHILD_SETTID|SIGCHLD,
chil                                             d_tidptr=0x7f30124a59d0) =
3978
close(4)                                = 0
fcntl(3, F_SETFD, 0)                    = 0
fstat(3, {st_mode=S_IFIFO|0600, st_size=0, ...}) = 0
mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1, 0) = 0x7f30124b2000
read(3, "", 4096)                       = 0
--- SIGCHLD (Child exited) @ 0 (0) ---
read(3, "", 4096)                       = 0
close(3)                                = 0
wait4(3978, [{WIFEXITED(s) && WEXITSTATUS(s) == 1}], 0, NULL) = 3978
munmap(0x7f30124b2000, 4096)            = 0
syscall_293(0x7fff65afd9c0, 0x80000, 0x406af9, 0x7f30124a5700, 0x1,
0x612100, 0x                                             611820, 0x611820,
0x611820, 0x611820, 0x611820, 0x611820, 0x611820, 0x611820, 0x
                              611820, 0x611820, 0x611820, 0x611820,
0x611820, 0x611820, 0x611820, 0x611820, 0x
          611820, 0x611820, 0x611820, 0x611820, 0x611820, 0x611820,
0x611820, 0x611820, 0x                                             611820,
0x611820) = 0
clone(child_stack=0, flags=CLONE_CHILD_CLEARTID|CLONE_CHILD_SETTID|SIGCHLD,
chil                                             d_tidptr=0x7f30124a59d0) =
3981
close(4)                                = 0
fcntl(3, F_SETFD, 0)                    = 0
fstat(3, {st_mode=S_IFIFO|0600, st_size=0, ...}) = 0
mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1, 0) = 0x7f30124b2000
read(3, "", 4096)                       = 0
--- SIGCHLD (Child exited) @ 0 (0) ---
read(3, "", 4096)                       = 0
close(3)                                = 0
wait4(3981, [{WIFEXITED(s) && WEXITSTATUS(s) == 1}], 0, NULL) = 3981
munmap(0x7f30124b2000, 4096)            = 0
write(1, "checking for existing Lustre dat"..., 45checking for existing Lustre data: not found
) = 45
open("/dev/sdf", O_RDONLY)              = 3
ioctl(3, BLKGETSIZE64, 0x7fff65afc910)  = 0
close(3)                                = 0
write(1, "device size = 5120MB\n", 21device size = 5120MB
)  = 21
syscall_293(0x7fff65afb870, 0x80000, 0x406af9, 0x7f30124a5700, 0x1,
0x612100, 0x                                             609210, 0x609210,
0x609210, 0x609210, 0x609210, 0x609210, 0x609210, 0x609210, 0x
                              609210, 0x609210, 0x609210, 0x609210,
0x609210, 0x609210, 0x609210, 0x609210, 0x
          609210, 0x609210, 0x609210, 0x609210, 0x609210, 0x609210,
0x609210, 0x609210, 0x                                             609210,
0x609210) = 0
clone(child_stack=0, flags=CLONE_CHILD_CLEARTID|CLONE_CHILD_SETTID|SIGCHLD,
chil                                             d_tidptr=0x7f30124a59d0) =
3984
close(4)                                = 0
fcntl(3, F_SETFD, 0)                    = 0
fstat(3, {st_mode=S_IFIFO|0600, st_size=0, ...}) = 0
mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1, 0) = 0x7f30124b2000
read(3, "debugfs 1.41.9 (22-Aug-2009)\n", 4096) = 29
read(3, "Supported feature: uninit_groups"..., 4096) = 33
read(3, "", 4096)                       = 0
uname({sys="Linux", node="ip-10-196-34-143", ...}) = 0
write(1, "2 6 32\n", 72 6 32
)                 = 7
write(1, "formatting backing filesystem ld"..., 50formatting backing filesystem ldiskfs on /dev/sdf
) = 50
write(1, "\ttarget name  temp-MDTffff\n", 27    target name  temp-MDTffff
) = 27
write(1, "\t4k blocks     1310720\n", 23        4k blocks     1310720
) = 23
write(1, "\toptions        -J size=204 -i 4"..., 76     options        -J size=204 -i 4096 -I 512 -q -O dir_index,uninit_groups -F
) = 76
write(1, "mkfs_cmd = mke2fs -j -b 4096 -L "..., 123mkfs_cmd = mke2fs -j -b 4096  -L temp-MDTffff  -J size=204 -i 4096 -I 512 -q -O dir_index,uninit_groups -F /dev/sdf 1310720
) = 123
gettimeofday({1307462203, 738431}, NULL) = 0
getpid()                                = 3977
open("/tmp/run_command_logiIQsXq", O_RDWR|O_CREAT|O_EXCL, 0600) = 4
close(4)                                = 0
rt_sigaction(SIGINT, {0x1, [], SA_RESTORER, 0x7f3011f6b9e0}, {SIG_DFL, [], 0}, 8) = 0
rt_sigaction(SIGQUIT, {0x1, [], SA_RESTORER, 0x7f3011f6b9e0}, {SIG_DFL, [], 0}, 8) = 0
rt_sigprocmask(SIG_BLOCK, [CHLD], [], 8) = 0
clone(child_stack=0, flags=CLONE_PARENT_SETTID|SIGCHLD, parent_tidptr=0x7fff65afc828) = 3986
wait4(3986, [{WIFEXITED(s) && WEXITSTATUS(s) == 0}], 0, NULL) = 3986
rt_sigaction(SIGINT, {SIG_DFL, [], SA_RESTORER, 0x7f3011f6b9e0}, NULL, 8) = 0
rt_sigaction(SIGQUIT, {SIG_DFL, [], SA_RESTORER, 0x7f3011f6b9e0}, NULL, 8) = 0
rt_sigprocmask(SIG_SETMASK, [], NULL, 8) = 0
--- SIGCHLD (Child exited) @ 0 (0) ---
unlink("/tmp/run_command_logiIQsXq")    = 0
mkdir("/tmp/mntFdZiJN", 0700)           = 0
mount("/dev/sdf", "/tmp/mntFdZiJN", "ldiskfs", 0, "iopen_nopriv,user_xattr,errors=r"...


Thanks,
-Jon
jon.zhu at gmail.com
-------------- next part --------------
An HTML attachment was scrubbed...
URL: <http://lists.lustre.org/pipermail/lustre-discuss-lustre.org/attachments/20110611/f1e8afaa/attachment.htm>


More information about the lustre-discuss mailing list