Hi folks. I've just updated our cluster, formerly based
on RedHat 7.2 + openmosix to Red Hat Enterprise Linux
AS 3 + openmosix (2.4.26-om1). The cluster works but I
can see *many* seg faults in *many* programs, from the
Intel Fortran Compiler, to make, to host or... it seems to
be anything! I've been crawling the Internet for 3 days, with
no clues, so I'm posting here. If I strace a call to
plain "host", I get:
# strace host
execve("/usr/bin/host", ["host"], [/* 33 vars */]) = 0
uname({sys="Linux", node="knot02.elettra.trieste.it",
...}) = 0
brk(0) = 0x8056588
open("/etc/ld.so.preload", O_RDONLY) = -1 ENOENT (No
such file or directory)
open("/opt/intel_fc_80/lib/tls/i686/mmx/libdns.so.16",
O_RDONLY) = -1 ENOENT (No such file or directory)
stat64("/opt/intel_fc_80/lib/tls/i686/mmx", 0xbfffefa0)
= -1 ENOENT (No such file or directory)
open("/opt/intel_fc_80/lib/tls/i686/libdns.so.16",
O_RDONLY) = -1 ENOENT (No such file or directory)
stat64("/opt/intel_fc_80/lib/tls/i686", 0xbfffefa0) =
-1 ENOENT (No such file or directory)
open("/opt/intel_fc_80/lib/tls/mmx/libdns.so.16",
O_RDONLY) = -1 ENOENT (No such file or directory)
stat64("/opt/intel_fc_80/lib/tls/mmx", 0xbfffefa0) = -1
ENOENT (No such file or directory)
open("/opt/intel_fc_80/lib/tls/libdns.so.16", O_RDONLY)
= -1 ENOENT (No such file or directory)
stat64("/opt/intel_fc_80/lib/tls", 0xbfffefa0) = -1
ENOENT (No such file or directory)
open("/opt/intel_fc_80/lib/i686/mmx/libdns.so.16",
O_RDONLY) = -1 ENOENT (No such file or directory)
stat64("/opt/intel_fc_80/lib/i686/mmx", 0xbfffefa0) =
-1 ENOENT (No such file or directory)
open("/opt/intel_fc_80/lib/i686/libdns.so.16",
O_RDONLY) = -1 ENOENT (No such file or directory)
stat64("/opt/intel_fc_80/lib/i686", 0xbfffefa0) = -1
ENOENT (No such file or directory)
open("/opt/intel_fc_80/lib/mmx/libdns.so.16", O_RDONLY)
= -1 ENOENT (No such file or directory)
stat64("/opt/intel_fc_80/lib/mmx", 0xbfffefa0) = -1
ENOENT (No such file or directory)
open("/opt/intel_fc_80/lib/libdns.so.16", O_RDONLY) =
-1 ENOENT (No such file or directory)
stat64("/opt/intel_fc_80/lib", {st_mode=S_IFDIR|0755,
st_size=64, ...}) = 0
open("/etc/ld.so.cache", O_RDONLY) = 3
fstat64(3, {st_mode=S_IFREG|0644, st_size=88703, ...}) = 0
old_mmap(NULL, 88703, PROT_READ, MAP_PRIVATE, 3, 0) =
0x40016000
close(3) = 0
open("/usr/lib/libdns.so.16", O_RDONLY) = 3
read(3,
"\177ELF\1\1\1\0\0\0\0\0\0\0\0\0\3\0\3\0\1\0\0\0\320\"\1"...,
512) = 512
fstat64(3, {st_mode=S_IFREG|0755, st_size=1026680,
...}) = 0
old_mmap(NULL, 4096, PROT_READ|PROT_WRITE,
MAP_PRIVATE|MAP_ANONYMOUS, -1, 0) = 0x4002c000
old_mmap(NULL, 1030972, PROT_READ|PROT_EXEC,
MAP_PRIVATE, 3, 0) = 0x4002d000
old_mmap(0x40125000, 16384, PROT_READ|PROT_WRITE,
MAP_PRIVATE|MAP_FIXED, 3, 0xf7000) = 0x40125000
close(3) = 0
open("/opt/intel_fc_80/lib/libisc.so.7", O_RDONLY) = -1
ENOENT (No such file or directory)
open("/usr/lib/libisc.so.7", O_RDONLY) = 3
read(3,
"\177ELF\1\1\1\0\0\0\0\0\0\0\0\0\3\0\3\0\1\0\0\0\200z\0"...,
512) = 512
fstat64(3, {st_mode=S_IFREG|0755, st_size=221592, ...}) = 0
old_mmap(NULL, 224824, PROT_READ|PROT_EXEC,
MAP_PRIVATE, 3, 0) = 0x40129000
old_mmap(0x4015f000, 4096, PROT_READ|PROT_WRITE,
MAP_PRIVATE|MAP_FIXED, 3, 0x35000) = 0x4015f000
close(3) = 0
open("/opt/intel_fc_80/lib/libcrypto.so.4", O_RDONLY) =
-1 ENOENT (No such file or directory)
open("/lib/libcrypto.so.4", O_RDONLY) = 3
read(3,
"\177ELF\1\1\1\0\0\0\0\0\0\0\0\0\3\0\3\0\1\0\0\0\360\252"...,
512) = 512
fstat64(3, {st_mode=S_IFREG|0755, st_size=976284, ...}) = 0
old_mmap(NULL, 989496, PROT_READ|PROT_EXEC,
MAP_PRIVATE, 3, 0) = 0x40160000
old_mmap(0x4023d000, 73728, PROT_READ|PROT_WRITE,
MAP_PRIVATE|MAP_FIXED, 3, 0xdd000) = 0x4023d000
old_mmap(0x4024f000, 10552, PROT_READ|PROT_WRITE,
MAP_PRIVATE|MAP_FIXED|MAP_ANONYMOUS, -1, 0) =
0x4024f000
close(3) = 0
open("/opt/intel_fc_80/lib/libnsl.so.1", O_RDONLY) = -1
ENOENT (No such file or directory)
open("/lib/libnsl.so.1", O_RDONLY) = 3
read(3,
"\177ELF\1\1\1\0\0\0\0\0\0\0\0\0\3\0\3\0\1\0\0\0
<\0\000"..., 512) = 512
fstat64(3, {st_mode=S_IFREG|0755, st_size=91040, ...}) = 0
old_mmap(NULL, 84864, PROT_READ|PROT_EXEC, MAP_PRIVATE,
3, 0) = 0x40252000
old_mmap(0x40264000, 4096, PROT_READ|PROT_WRITE,
MAP_PRIVATE|MAP_FIXED, 3, 0x11000) = 0x40264000
old_mmap(0x40265000, 7040, PROT_READ|PROT_WRITE,
MAP_PRIVATE|MAP_FIXED|MAP_ANONYMOUS, -1, 0) = 0x40265000
close(3) = 0
open("/opt/intel_fc_80/lib/libpthread.so.0", O_RDONLY)
= -1 ENOENT (No such file or directory)
open("/lib/tls/libpthread.so.0", O_RDONLY) = 3
read(3,
"\177ELF\1\1\1\0\0\0\0\0\0\0\0\0\3\0\3\0\1\0\0\0\20G\0\000"...,
512) = 512
fstat64(3, {st_mode=S_IFREG|0755, st_size=97712, ...}) = 0
old_mmap(NULL, 64820, PROT_READ|PROT_EXEC, MAP_PRIVATE,
3, 0) = 0x40267000
old_mmap(0x40274000, 4096, PROT_READ|PROT_WRITE,
MAP_PRIVATE|MAP_FIXED, 3, 0xc000) = 0x40274000
old_mmap(0x40275000, 7476, PROT_READ|PROT_WRITE,
MAP_PRIVATE|MAP_FIXED|MAP_ANONYMOUS, -1, 0) = 0x40275000
close(3) = 0
open("/opt/intel_fc_80/lib/libc.so.6", O_RDONLY) = -1
ENOENT (No such file or directory)
open("/lib/tls/libc.so.6", O_RDONLY) = 3
read(3,
"\177ELF\1\1\1\0\0\0\0\0\0\0\0\0\3\0\3\0\1\0\0\0pX\1\000"...,
512) = 512
fstat64(3, {st_mode=S_IFREG|0755, st_size=1571824,
...}) = 0
old_mmap(NULL, 1275340, PROT_READ|PROT_EXEC,
MAP_PRIVATE, 3, 0) = 0x40277000
old_mmap(0x403a9000, 12288, PROT_READ|PROT_WRITE,
MAP_PRIVATE|MAP_FIXED, 3, 0x132000) = 0x403a9000
old_mmap(0x403ac000, 9676, PROT_READ|PROT_WRITE,
MAP_PRIVATE|MAP_FIXED|MAP_ANONYMOUS, -1, 0) = 0x403ac000
close(3) = 0
open("/opt/intel_fc_80/lib/libgssapi_krb5.so.2",
O_RDONLY) = -1 ENOENT (No such file or directory)
open("/usr/kerberos/lib/libgssapi_krb5.so.2", O_RDONLY) = 3
read(3,
"\177ELF\1\1\1\0\0\0\0\0\0\0\0\0\3\0\3\0\1\0\0\0\340H\0"...,
512) = 512
fstat64(3, {st_mode=S_IFREG|0755, st_size=76712, ...}) = 0
old_mmap(NULL, 4096, PROT_READ|PROT_WRITE,
MAP_PRIVATE|MAP_ANONYMOUS, -1, 0) = 0x403af000
old_mmap(NULL, 75588, PROT_READ|PROT_EXEC, MAP_PRIVATE,
3, 0) = 0x403b0000
old_mmap(0x403c2000, 4096, PROT_READ|PROT_WRITE,
MAP_PRIVATE|MAP_FIXED, 3, 0x12000) = 0x403c2000
close(3) = 0
open("/opt/intel_fc_80/lib/libkrb5.so.3", O_RDONLY) =
-1 ENOENT (No such file or directory)
open("/usr/kerberos/lib/libkrb5.so.3", O_RDONLY) = 3
read(3,
"\177ELF\1\1\1\0\0\0\0\0\0\0\0\0\3\0\3\0\1\0\0\0\320\362"...,
512) = 512
fstat64(3, {st_mode=S_IFREG|0755, st_size=385252, ...}) = 0
old_mmap(NULL, 384636, PROT_READ|PROT_EXEC,
MAP_PRIVATE, 3, 0) = 0x403c3000
old_mmap(0x4041f000, 8192, PROT_READ|PROT_WRITE,
MAP_PRIVATE|MAP_FIXED, 3, 0x5c000) = 0x4041f000
close(3) = 0
open("/opt/intel_fc_80/lib/libcom_err.so.3", O_RDONLY)
= -1 ENOENT (No such file or directory)
open("/usr/kerberos/lib/libcom_err.so.3", O_RDONLY) = 3
read(3,
"\177ELF\1\1\1\0\0\0\0\0\0\0\0\0\3\0\3\0\1\0\0\0\240\t\0"...,
512) = 512
fstat64(3, {st_mode=S_IFREG|0755, st_size=5540, ...}) = 0
old_mmap(NULL, 4520, PROT_READ|PROT_EXEC, MAP_PRIVATE,
3, 0) = 0x40421000
old_mmap(0x40422000, 4096, PROT_READ|PROT_WRITE,
MAP_PRIVATE|MAP_FIXED, 3, 0x1000) = 0x40422000
close(3) = 0
open("/opt/intel_fc_80/lib/libk5crypto.so.3", O_RDONLY)
= -1 ENOENT (No such file or directory)
open("/usr/kerberos/lib/libk5crypto.so.3", O_RDONLY) = 3
read(3,
"\177ELF\1\1\1\0\0\0\0\0\0\0\0\0\3\0\3\0\1\0\0\0\0&\0\000"...,
512) = 512
fstat64(3, {st_mode=S_IFREG|0755, st_size=72552, ...}) = 0
old_mmap(NULL, 73108, PROT_READ|PROT_EXEC, MAP_PRIVATE,
3, 0) = 0x40423000
old_mmap(0x40434000, 4096, PROT_READ|PROT_WRITE,
MAP_PRIVATE|MAP_FIXED, 3, 0x11000) = 0x40434000
close(3) = 0
open("/opt/intel_fc_80/lib/libresolv.so.2", O_RDONLY) =
-1 ENOENT (No such file or directory)
open("/lib/libresolv.so.2", O_RDONLY) = 3
read(3,
"\177ELF\1\1\1\0\0\0\0\0\0\0\0\0\3\0\3\0\1\0\0\0\20*\0\000"...,
512) = 512
fstat64(3, {st_mode=S_IFREG|0755, st_size=76540, ...}) = 0
old_mmap(NULL, 73604, PROT_READ|PROT_EXEC, MAP_PRIVATE,
3, 0) = 0x40435000
old_mmap(0x40444000, 4096, PROT_READ|PROT_WRITE,
MAP_PRIVATE|MAP_FIXED, 3, 0xf000) = 0x40444000
old_mmap(0x40445000, 8068, PROT_READ|PROT_WRITE,
MAP_PRIVATE|MAP_FIXED|MAP_ANONYMOUS, -1, 0) = 0x40445000
close(3) = 0
open("/opt/intel_fc_80/lib/libdl.so.2", O_RDONLY) = -1
ENOENT (No such file or directory)
open("/lib/libdl.so.2", O_RDONLY) = 3
read(3,
"\177ELF\1\1\1\0\0\0\0\0\0\0\0\0\3\0\3\0\1\0\0\0\260\32"...,
512) = 512
fstat64(3, {st_mode=S_IFREG|0755, st_size=14868, ...}) = 0
old_mmap(NULL, 12244, PROT_READ|PROT_EXEC, MAP_PRIVATE,
3, 0) = 0x40447000
old_mmap(0x40449000, 4096, PROT_READ|PROT_WRITE,
MAP_PRIVATE|MAP_FIXED, 3, 0x1000) = 0x40449000
close(3) = 0
open("/opt/intel_fc_80/lib/libz.so.1", O_RDONLY) = -1
ENOENT (No such file or directory)
open("/usr/lib/libz.so.1", O_RDONLY) = 3
read(3,
"\177ELF\1\1\1\0\0\0\0\0\0\0\0\0\3\0\3\0\1\0\0\0\340\31"...,
512) = 512
fstat64(3, {st_mode=S_IFREG|0755, st_size=52584, ...}) = 0
old_mmap(NULL, 4096, PROT_READ|PROT_WRITE,
MAP_PRIVATE|MAP_ANONYMOUS, -1, 0) = 0x4044a000
old_mmap(NULL, 55564, PROT_READ|PROT_EXEC, MAP_PRIVATE,
3, 0) = 0x4044b000
old_mmap(0x40457000, 8192, PROT_READ|PROT_WRITE,
MAP_PRIVATE|MAP_FIXED, 3, 0xb000) = 0x40457000
close(3) = 0
old_mmap(NULL, 4096, PROT_READ|PROT_WRITE,
MAP_PRIVATE|MAP_ANONYMOUS, -1, 0) = 0x40459000
set_thread_area({entry_number:-1 -> -1,
base_addr:0x40459080, limit:1048575, seg_32bit:1,
contents:0, read_exec_only:0, limit_in_pages:1,
seg_not_present:0, useable:1}) = -1 ENOSYS (Function
not implemented)
modify_ldt(1, {entry_number:0, base_addr:0x40459080,
limit:1048575, seg_32bit:1, contents:0,
read_exec_only:0, limit_in_pages:1, seg_not_present:0,
useable:1}, 16) = 0
munmap(0x40016000, 88703) = 0
set_tid_address(0x404590c8) = -1 ENOSYS
(Function not implemented)
rt_sigaction(SIGRTMIN, {0x4026b670, [],
SA_RESTORER|SA_SIGINFO, 0x40271e40}, NULL, 8) = 0
rt_sigprocmask(SIG_UNBLOCK, [RTMIN], NULL, 8) = 0
getrlimit(RLIMIT_STACK, {rlim_cur=8192*1024,
rlim_max=RLIM_INFINITY}) = 0
rt_sigaction(SIGINT, {0x40148a50, ~[RTMIN],
SA_RESTORER, 0x40271e48}, NULL, 8) = 0
rt_sigaction(SIGTERM, {0x40148a50, ~[RTMIN],
SA_RESTORER, 0x40271e48}, NULL, 8) = 0
rt_sigaction(SIGPIPE, {SIG_IGN}, NULL, 8) = 0
rt_sigaction(SIGHUP, {SIG_DFL}, NULL, 8) = 0
rt_sigprocmask(SIG_BLOCK, [HUP INT TERM], NULL, 8) = 0
socket(PF_INET, SOCK_STREAM, IPPROTO_IP) = 3
close(3) = 0
socket(PF_INET6, SOCK_STREAM, IPPROTO_IP) = -1
EAFNOSUPPORT (Address family not supported by protocol)
futex(0x4015f6b0, FUTEX_WAKE, 2147483647) = -1 ENOSYS
(Function not implemented)
brk(0) = 0x8056588
brk(0x8077588) = 0x8077588
brk(0) = 0x8077588
brk(0x8078000) = 0x8078000
mmap2(NULL, 8392704, PROT_READ|PROT_WRITE,
MAP_PRIVATE|MAP_ANONYMOUS, -1, 0) = 0x4045a000
mprotect(0x4045a000, 4096, PROT_NONE) = 0
clone(child_stack=0x40c5ab04,
flags=CLONE_VM|CLONE_FS|CLONE_FILES|CLONE_SIGHAND|CLONE_THREAD|CLONE_SYSVSEM|CLONE_SETTLS|CLONE_PARENT_SETTID|CLONE_CHILD_CLEARTID|CLONE_DETACHED,
parent_tidptr=0x40c5abf8, {entry_number:0,
base_addr:0x40c5abb0, limit:1048575, seg_32bit:1,
contents:0, read_exec_only:0, limit_in_pages:1,
seg_not_present:0, useable:1}, child_tidptr=0x40c5abf8)
= 1133
mmap2(NULL, 8392704, PROT_READ|PROT_WRITE,
MAP_PRIVATE|MAP_ANONYMOUS, -1, 0) = 0x40c5b000
mprotect(0x40c5b000, 4096, PROT_NONE) = 0
clone(child_stack=0x4145bb04,
flags=CLONE_VM|CLONE_FS|CLONE_FILES|CLONE_SIGHAND|CLONE_THREAD|CLONE_SYSVSEM|CLONE_SETTLS|CLONE_PARENT_SETTID|CLONE_CHILD_CLEARTID|CLONE_DETACHED,
parent_tidptr=0x4145bbf8, {entry_number:0,
base_addr:0x4145bbb0, limit:1048575, seg_32bit:1,
contents:0, read_exec_only:0, limit_in_pages:1,
seg_not_present:0, useable:1}, child_tidptr=0x4145bbf8)
= 1134
--- SIGSEGV (Segmentation fault) @ 0 (0) ---
+++ killed by SIGSEGV +++
I've tried all the openMosix (om) kernels from 2.4.21 to
2.4.26, both UP and SMP, with the same results. Obviously,
the system kernel (kernel-2.4.21-32.0.1.EL) works...
Ivan <ivan.andrian@elettra.trieste.it>