Ok, here is the output from "strace xrx n0000\!6667 /bin/ls":
execve("/usr/local/bin/xrx", ["xrx", "n0000!6667", "/bin/ls"], [/* 31
vars */]) = 0
brk(0) = 0x622000
mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1,
0) = 0x7f732c539000
mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1,
0) = 0x7f732c538000
access("/etc/ld.so.preload", R_OK) = -1 ENOENT (No such file or directory)
open("/etc/ld.so.cache", O_RDONLY) = 3
fstat(3, {st_mode=S_IFREG|0644, st_size=170055, ...}) = 0
mmap(NULL, 170055, PROT_READ, MAP_PRIVATE, 3, 0) = 0x7f732c50e000
close(3) = 0
open("/lib64/libcrypto.so.6", O_RDONLY) = 3
read(3, "\177ELF\2\1\1\0\0\0\0\0\0\0\0\0\3\0>\0\1\0\0\0\320b\205\3768\0\0\0"...,
832) = 832
fstat(3, {st_mode=S_IFREG|0755, st_size=1329816, ...}) = 0
mmap(0x38fe800000, 3437784, PROT_READ|PROT_EXEC,
MAP_PRIVATE|MAP_DENYWRITE, 3, 0) = 0x38fe800000
mprotect(0x38fe925000, 2097152, PROT_NONE) = 0
mmap(0x38feb25000, 126976, PROT_READ|PROT_WRITE,
MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x125000) = 0x38feb25000
mmap(0x38feb44000, 13528, PROT_READ|PROT_WRITE,
MAP_PRIVATE|MAP_FIXED|MAP_ANONYMOUS, -1, 0) = 0x38feb44000
close(3) = 0
open("/lib64/libm.so.6", O_RDONLY) = 3
read(3, "\177ELF\2\1\1\0\0\0\0\0\0\0\0\0\3\0>\0\1\0\0\0`>\240\3206\0\0\0"...,
832) = 832
fstat(3, {st_mode=S_IFREG|0755, st_size=615136, ...}) = 0
mmap(0x36d0a00000, 2629848, PROT_READ|PROT_EXEC,
MAP_PRIVATE|MAP_DENYWRITE, 3, 0) = 0x36d0a00000
mprotect(0x36d0a82000, 2093056, PROT_NONE) = 0
mmap(0x36d0c81000, 8192, PROT_READ|PROT_WRITE,
MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x81000) = 0x36d0c81000
close(3) = 0
open("/lib64/libc.so.6", O_RDONLY) = 3
read(3, "\177ELF\2\1\1\0\0\0\0\0\0\0\0\0\3\0>\0\1\0\0\0\260\331a\3206\0\0\0"...,
832) = 832
fstat(3, {st_mode=S_IFREG|0755, st_size=1699912, ...}) = 0
mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1,
0) = 0x7f732c50d000
mmap(0x36d0600000, 3481848, PROT_READ|PROT_EXEC,
MAP_PRIVATE|MAP_DENYWRITE, 3, 0) = 0x36d0600000
mprotect(0x36d074a000, 2093056, PROT_NONE) = 0
mmap(0x36d0949000, 20480, PROT_READ|PROT_WRITE,
MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x149000) = 0x36d0949000
mmap(0x36d094e000, 16632, PROT_READ|PROT_WRITE,
MAP_PRIVATE|MAP_FIXED|MAP_ANONYMOUS, -1, 0) = 0x36d094e000
close(3) = 0
open("/lib64/libdl.so.2", O_RDONLY) = 3
read(3,
"\177ELF\2\1\1\0\0\0\0\0\0\0\0\0\3\0>\0\1\0\0\0\20\16\340\3206\0\0\0"...,
832) = 832
fstat(3, {st_mode=S_IFREG|0755, st_size=23360, ...}) = 0
mmap(0x36d0e00000, 2109696, PROT_READ|PROT_EXEC,
MAP_PRIVATE|MAP_DENYWRITE, 3, 0) = 0x36d0e00000
mprotect(0x36d0e02000, 2097152, PROT_NONE) = 0
mmap(0x36d1002000, 8192, PROT_READ|PROT_WRITE,
MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x2000) = 0x36d1002000
close(3) = 0
open("/usr/lib64/libz.so.1", O_RDONLY) = 3
read(3, "\177ELF\2\1\1\0\0\0\0\0\0\0\0\0\3\0>\0\1\0\0\0\320\37`\3216\0\0\0"...,
832) = 832
fstat(3, {st_mode=S_IFREG|0755, st_size=85928, ...}) = 0
mmap(0x36d1600000, 2178920, PROT_READ|PROT_EXEC,
MAP_PRIVATE|MAP_DENYWRITE, 3, 0) = 0x36d1600000
mprotect(0x36d1614000, 2093056, PROT_NONE) = 0
mmap(0x36d1813000, 4096, PROT_READ|PROT_WRITE,
MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x13000) = 0x36d1813000
close(3) = 0
mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1,
0) = 0x7f732c50c000
mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1,
0) = 0x7f732c50b000
arch_prctl(ARCH_SET_FS, 0x7f732c50b6e0) = 0
mprotect(0x36d1002000, 4096, PROT_READ) = 0
mprotect(0x36d0949000, 16384, PROT_READ) = 0
mprotect(0x36d0c81000, 4096, PROT_READ) = 0
mprotect(0x36d041a000, 4096, PROT_READ) = 0
munmap(0x7f732c50e000, 170055) = 0
geteuid() = 0
brk(0) = 0x622000
brk(0x643000) = 0x643000
socket(PF_FILE, SOCK_STREAM, 0) = 3
fcntl(3, F_GETFL) = 0x2 (flags O_RDWR)
fcntl(3, F_SETFL, O_RDWR|O_NONBLOCK) = 0
connect(3, {sa_family=AF_FILE, path="/var/run/nscd/socket"}, 110) = -1
ENOENT (No such file or directory)
close(3) = 0
socket(PF_FILE, SOCK_STREAM, 0) = 3
fcntl(3, F_GETFL) = 0x2 (flags O_RDWR)
fcntl(3, F_SETFL, O_RDWR|O_NONBLOCK) = 0
connect(3, {sa_family=AF_FILE, path="/var/run/nscd/socket"}, 110) = -1
ENOENT (No such file or directory)
close(3) = 0
open("/etc/nsswitch.conf", O_RDONLY) = 3
fstat(3, {st_mode=S_IFREG|0644, st_size=1722, ...}) = 0
mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1,
0) = 0x7f732c537000
read(3, "#\n# /etc/nsswitch.conf\n#\n# An ex"..., 4096) = 1722
read(3, "", 4096) = 0
close(3) = 0
munmap(0x7f732c537000, 4096) = 0
open("/etc/ld.so.cache", O_RDONLY) = 3
fstat(3, {st_mode=S_IFREG|0644, st_size=170055, ...}) = 0
mmap(NULL, 170055, PROT_READ, MAP_PRIVATE, 3, 0) = 0x7f732c50e000
close(3) = 0
open("/lib64/libnss_files.so.2", O_RDONLY) = 3
read(3, "\177ELF\2\1\1\0\0\0\0\0\0\0\0\0\3\0>\0\1\0\0\0\340\37\0\0\0\0\0\0"...,
832) = 832
fstat(3, {st_mode=S_IFREG|0755, st_size=53880, ...}) = 0
mmap(NULL, 2139432, PROT_READ|PROT_EXEC, MAP_PRIVATE|MAP_DENYWRITE, 3,
0) = 0x7f732c300000
mprotect(0x7f732c30a000, 2093056, PROT_NONE) = 0
mmap(0x7f732c509000, 8192, PROT_READ|PROT_WRITE,
MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x9000) = 0x7f732c509000
close(3) = 0
mprotect(0x7f732c509000, 4096, PROT_READ) = 0
munmap(0x7f732c50e000, 170055) = 0
open("/etc/passwd", O_RDONLY) = 3
fcntl(3, F_GETFD) = 0
fcntl(3, F_SETFD, FD_CLOEXEC) = 0
fstat(3, {st_mode=S_IFREG|0644, st_size=1672, ...}) = 0
mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1,
0) = 0x7f732c537000
read(3, "root:x:0:0:root:/root:/bin/bash\n"..., 4096) = 1672
close(3) = 0
munmap(0x7f732c537000, 4096) = 0
socket(PF_FILE, SOCK_STREAM, 0) = 3
fcntl(3, F_GETFL) = 0x2 (flags O_RDWR)
fcntl(3, F_SETFL, O_RDWR|O_NONBLOCK) = 0
connect(3, {sa_family=AF_FILE, path="/var/run/nscd/socket"}, 110) = -1
ENOENT (No such file or directory)
close(3) = 0
socket(PF_FILE, SOCK_STREAM, 0) = 3
fcntl(3, F_GETFL) = 0x2 (flags O_RDWR)
fcntl(3, F_SETFL, O_RDWR|O_NONBLOCK) = 0
connect(3, {sa_family=AF_FILE, path="/var/run/nscd/socket"}, 110) = -1
ENOENT (No such file or directory)
close(3) = 0
open("/etc/group", O_RDONLY) = 3
fcntl(3, F_GETFD) = 0
fcntl(3, F_SETFD, FD_CLOEXEC) = 0
fstat(3, {st_mode=S_IFREG|0644, st_size=720, ...}) = 0
mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1,
0) = 0x7f732c537000
read(3, "root:x:0:root\nbin:x:1:root,bin,d"..., 4096) = 720
close(3) = 0
munmap(0x7f732c537000, 4096) = 0
open("/etc/group", O_RDONLY) = 3
fcntl(3, F_GETFD) = 0
fcntl(3, F_SETFD, FD_CLOEXEC) = 0
fstat(3, {st_mode=S_IFREG|0644, st_size=720, ...}) = 0
mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1,
0) = 0x7f732c537000
lseek(3, 0, SEEK_CUR) = 0
read(3, "root:x:0:root\nbin:x:1:root,bin,d"..., 4096) = 720
read(3, "", 4096) = 0
open("/etc/ld.so.cache", O_RDONLY) = 4
fstat(4, {st_mode=S_IFREG|0644, st_size=170055, ...}) = 0
mmap(NULL, 170055, PROT_READ, MAP_PRIVATE, 4, 0) = 0x7f732c2d6000
close(4) = 0
open("/lib64/libnss_nis.so.2", O_RDONLY) = 4
read(4, "\177ELF\2\1\1\0\0\0\0\0\0\0\0\0\3\0>\0\1\0\0\0\300\37\0\0\0\0\0\0"...,
832) = 832
fstat(4, {st_mode=S_IFREG|0755, st_size=53432, ...}) = 0
mmap(NULL, 2139320, PROT_READ|PROT_EXEC, MAP_PRIVATE|MAP_DENYWRITE, 4,
0) = 0x7f732c0cb000
mprotect(0x7f732c0d4000, 2097152, PROT_NONE) = 0
mmap(0x7f732c2d4000, 8192, PROT_READ|PROT_WRITE,
MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 4, 0x9000) = 0x7f732c2d4000
close(4) = 0
open("/lib64/libnsl.so.1", O_RDONLY) = 4
read(4, "\177ELF\2\1\1\0\0\0\0\0\0\0\0\0\3\0>[EMAIL PROTECTED]"...,
832) = 832
fstat(4, {st_mode=S_IFREG|0755, st_size=114352, ...}) = 0
mmap(0x36da800000, 2194096, PROT_READ|PROT_EXEC,
MAP_PRIVATE|MAP_DENYWRITE, 4, 0) = 0x36da800000
mprotect(0x36da815000, 2093056, PROT_NONE) = 0
mmap(0x36daa14000, 8192, PROT_READ|PROT_WRITE,
MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 4, 0x14000) = 0x36daa14000
mmap(0x36daa16000, 6832, PROT_READ|PROT_WRITE,
MAP_PRIVATE|MAP_FIXED|MAP_ANONYMOUS, -1, 0) = 0x36daa16000
close(4) = 0
mprotect(0x36daa14000, 4096, PROT_READ) = 0
mprotect(0x7f732c2d4000, 4096, PROT_READ) = 0
munmap(0x7f732c2d6000, 170055) = 0
open("/etc/default/nss", O_RDONLY) = 4
fstat(4, {st_mode=S_IFREG|0644, st_size=1302, ...}) = 0
mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1,
0) = 0x7f732c536000
read(4, "# /etc/default/nss\n# This file c"..., 4096) = 1302
read(4, "", 4096) = 0
close(4) = 0
munmap(0x7f732c536000, 4096) = 0
uname({sys="Linux", node="dgk3.chem.utoronto.ca", ...}) = 0
close(3) = 0
munmap(0x7f732c537000, 4096) = 0
open("/root/.ssh/id_rsa", O_RDONLY) = 3
fstat(3, {st_mode=S_IFREG|0600, st_size=1675, ...}) = 0
mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1,
0) = 0x7f732c537000
read(3, "-----BEGIN RSA PRIVATE KEY-----\n"..., 4096) = 1675
close(3) = 0
munmap(0x7f732c537000, 4096) = 0
uname({sys="Linux", node="dgk3.chem.utoronto.ca", ...}) = 0
getcwd("/root", 1024) = 6
getpid() = 4467
open("/etc/resolv.conf", O_RDONLY) = 3
fstat(3, {st_mode=S_IFREG|0644, st_size=103, ...}) = 0
mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1,
0) = 0x7f732c537000
read(3, "search chem.utoronto.ca\nnameserv"..., 4096) = 103
read(3, "", 4096) = 0
close(3) = 0
munmap(0x7f732c537000, 4096) = 0
socket(PF_FILE, SOCK_STREAM, 0) = 3
fcntl(3, F_GETFL) = 0x2 (flags O_RDWR)
fcntl(3, F_SETFL, O_RDWR|O_NONBLOCK) = 0
connect(3, {sa_family=AF_FILE, path="/var/run/nscd/socket"}, 110) = -1
ENOENT (No such file or directory)
close(3) = 0
socket(PF_FILE, SOCK_STREAM, 0) = 3
fcntl(3, F_GETFL) = 0x2 (flags O_RDWR)
fcntl(3, F_SETFL, O_RDWR|O_NONBLOCK) = 0
connect(3, {sa_family=AF_FILE, path="/var/run/nscd/socket"}, 110) = -1
ENOENT (No such file or directory)
close(3) = 0
open("/etc/host.conf", O_RDONLY) = 3
fstat(3, {st_mode=S_IFREG|0644, st_size=17, ...}) = 0
mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1,
0) = 0x7f732c537000
read(3, "order hosts,bind\n", 4096) = 17
read(3, "", 4096) = 0
close(3) = 0
munmap(0x7f732c537000, 4096) = 0
open("/etc/hosts", O_RDONLY) = 3
fcntl(3, F_GETFD) = 0
fcntl(3, F_SETFD, FD_CLOEXEC) = 0
fstat(3, {st_mode=S_IFREG|0644, st_size=267, ...}) = 0
mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1,
0) = 0x7f732c537000
read(3, "# Do not remove the following li"..., 4096) = 267
read(3, "", 4096) = 0
close(3) = 0
munmap(0x7f732c537000, 4096) = 0
uname({sys="Linux", node="dgk3.chem.utoronto.ca", ...}) = 0
open("/etc/ld.so.cache", O_RDONLY) = 3
fstat(3, {st_mode=S_IFREG|0644, st_size=170055, ...}) = 0
mmap(NULL, 170055, PROT_READ, MAP_PRIVATE, 3, 0) = 0x7f732c50e000
close(3) = 0
open("/lib64/libnss_dns.so.2", O_RDONLY) = 3
read(3, "\177ELF\2\1\1\0\0\0\0\0\0\0\0\0\3\0>\0\1\0\0\0\240\17\0\0\0\0\0\0"...,
832) = 832
fstat(3, {st_mode=S_IFREG|0755, st_size=23632, ...}) = 0
mmap(NULL, 2113792, PROT_READ|PROT_EXEC, MAP_PRIVATE|MAP_DENYWRITE, 3,
0) = 0x7f732bec6000
mprotect(0x7f732beca000, 2093056, PROT_NONE) = 0
mmap(0x7f732c0c9000, 8192, PROT_READ|PROT_WRITE,
MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x3000) = 0x7f732c0c9000
close(3) = 0
open("/lib64/libresolv.so.2", O_RDONLY) = 3
read(3, "\177ELF\2\1\1\0\0\0\0\0\0\0\0\0\3\0>[EMAIL PROTECTED]"...,
832) = 832
fstat(3, {st_mode=S_IFREG|0755, st_size=92736, ...}) = 0
mmap(0x36db400000, 2181864, PROT_READ|PROT_EXEC,
MAP_PRIVATE|MAP_DENYWRITE, 3, 0) = 0x36db400000
mprotect(0x36db411000, 2097152, PROT_NONE) = 0
mmap(0x36db611000, 8192, PROT_READ|PROT_WRITE,
MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x11000) = 0x36db611000
mmap(0x36db613000, 6888, PROT_READ|PROT_WRITE,
MAP_PRIVATE|MAP_FIXED|MAP_ANONYMOUS, -1, 0) = 0x36db613000
close(3) = 0
mprotect(0x36db611000, 4096, PROT_READ) = 0
mprotect(0x7f732c0c9000, 4096, PROT_READ) = 0
munmap(0x7f732c50e000, 170055) = 0
socket(PF_INET, SOCK_DGRAM, IPPROTO_IP) = 3
connect(3, {sa_family=AF_INET, sin_port=htons(53),
sin_addr=inet_addr("142.150.224.224")}, 28) = 0
fcntl(3, F_GETFL) = 0x2 (flags O_RDWR)
fcntl(3, F_SETFL, O_RDWR|O_NONBLOCK) = 0
poll([{fd=3, events=POLLOUT, revents=POLLOUT}], 1, 0) = 1
sendto(3, "\313\303\1\0\0\1\0\0\0\0\0\0\nn0000!6667\4chem\10uto"...,
45, MSG_NOSIGNAL, NULL, 0) = 45
poll([{fd=3, events=POLLIN, revents=POLLIN}], 1, 5000) = 1
ioctl(3, FIONREAD, [94]) = 0
recvfrom(3, "\313\303\205\203\0\1\0\0\0\1\0\0\nn0000!6667\4chem\10uto"...,
1024, 0, {sa_family=AF_INET, sin_port=htons(53),
sin_addr=inet_addr("142.150.224.224")}, [16]) = 94
close(3) = 0
socket(PF_INET, SOCK_STREAM, IPPROTO_IP) = 3
open("/etc/hosts", O_RDONLY) = 4
fcntl(4, F_GETFD) = 0
fcntl(4, F_SETFD, FD_CLOEXEC) = 0
fstat(4, {st_mode=S_IFREG|0644, st_size=267, ...}) = 0
mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1,
0) = 0x7f732c537000
read(4, "# Do not remove the following li"..., 4096) = 267
close(4) = 0
munmap(0x7f732c537000, 4096) = 0
connect(3, {sa_family=AF_INET, sin_port=htons(6667),
sin_addr=inet_addr("10.10.0.10")}, 16) = 0
fcntl(3, F_SETFL, O_RDONLY|O_NONBLOCK) = 0
poll([{fd=3, events=POLLIN|POLLOUT, revents=POLLOUT}], 1, 300000) = 1
write(3, "\25\0\0\0d\377\377\30\200\0\0\10\0009P2000.u", 21) = 21
poll([{fd=3, events=POLLIN|POLLOUT, revents=POLLOUT}], 1, 300000) = 1
poll([{fd=3, events=POLLIN, revents=POLLIN}], 1, 300000) = 1
read(3, "\25\0\0\0e\377\377\30\200\0\0\10\0009P2000.u", 32792) = 21
write(3, "\27\0\0\0f\0\0\0\0\0\0\4\0root\0\0\0\0\0\0", 23) = 23
poll([{fd=3, events=POLLIN|POLLOUT, revents=POLLOUT}], 1, 300000) = 1
poll([{fd=3, events=POLLIN, revents=POLLIN}], 1, 300000) = 1
read(3, "\24\0\0\0g\0\0\10\0\0\0\0\0\0\0\0\0\0\0\0", 32792) = 20
write(3, "\27\0\0\0t\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\20\0\0", 23) = 23
poll([{fd=3, events=POLLIN|POLLOUT, revents=POLLOUT}], 1, 300000) = 1
poll([{fd=3, events=POLLIN, revents=POLLIN}], 1, 300000) = 1
read(3, "\33\0\0\0u\0\0\20\0\0\0|%V\3211\275\354\351o:\373\365Q\336:\33",
32792) = 27
brk(0x669000) = 0x669000
write(3, "\27\0\0\0t\0\0\0\0\0\0\20\0\0\0\0\0\0\0\360\17\0\0", 23) = 23
poll([{fd=3, events=POLLIN|POLLOUT, revents=POLLOUT}], 1, 300000) = 1
poll([{fd=3, events=POLLIN, revents=POLLIN}], 1, 300000) = 1
read(3, "\v\0\0\0u\0\0\0\0\0\0", 32792) = 11
brk(0x661000) = 0x661000
open("/dev/urandom", O_RDONLY|O_NOCTTY|O_NONBLOCK) = 4
fstat(4, {st_mode=S_IFCHR|0444, st_rdev=makedev(1, 9), ...}) = 0
poll([{fd=4, events=POLLIN, revents=POLLIN}], 1, 10) = 1
read(4,
"\362\353D\226\276\10\357]\273M\375\343k\204\235\367\204\235\231\377C\30\10\237\233\344\337B\324l\216\177",
32) = 32
close(4) = 0
getuid() = 0
write(3,
"\27\1\0\0v\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\1\0\0\233?\16\323q\26\207\366\356"...,
279) = 279
poll([{fd=3, events=POLLIN|POLLOUT, revents=POLLOUT}], 1, 300000) = 1
poll([{fd=3, events=POLLIN, revents=POLLIN}], 1, 300000) = 1
read(3, "\v\0\0\0w\0\0\0\1\0\0", 32792) = 11
write(3, "\33\0\0\0h\0\0\1\0\0\0\0\0\0\0\4\0root\0\0\0\0\0\0", 27) = 27
poll([{fd=3, events=POLLIN|POLLOUT, revents=POLLOUT}], 1, 300000) = 1
poll([{fd=3, events=POLLIN, revents=POLLIN}], 1, 300000) = 1
read(3, "\24\0\0\0i\0\0\200\0\0\0\0\1\0\0\0\0\0\0\0", 32792) = 20
brk(0x654000) = 0x654000
getsockname(3, {sa_family=AF_INET, sin_port=htons(55574),
sin_addr=inet_addr("10.10.0.1")}, [12884901904]) = 0
write(3, "\27\0\0\0n\0\0\1\0\0\0\2\0\0\0\1\0\4\0arch", 23) = 23
poll([{fd=3, events=POLLIN|POLLOUT, revents=POLLOUT}], 1, 300000) = 1
poll([{fd=3, events=POLLIN, revents=POLLIN}], 1, 300000) = 1
read(3, "\26\0\0\0o\0\0\1\0\0\0\0\0\0\4\0\0\0\0\0\0\0", 32792) = 22
write(3, "\f\0\0\0p\0\0\2\0\0\0\0", 12) = 12
poll([{fd=3, events=POLLIN|POLLOUT, revents=POLLOUT}], 1, 300000) = 1
poll([{fd=3, events=POLLIN, revents=POLLIN}], 1, 300000) = 1
read(3, "\30\0\0\0q\0\0\0\0\0\0\0\4\0\0\0\0\0\0\0\0\0\0\0", 32792) = 24
write(3, "\27\0\0\0t\0\0\2\0\0\0\0\0\0\0\0\0\0\0?\0\0\0", 23) = 23
poll([{fd=3, events=POLLIN|POLLOUT, revents=POLLOUT}], 1, 300000) = 1
poll([{fd=3, events=POLLIN, revents=POLLIN}], 1, 300000) = 1
read(3, "\30\0\0\0u\0\0\r\0\0\0/Linux/x86_64", 32792) = 24
write(3, "\27\0\0\0t\0\0\2\0\0\0\r\0\0\0\0\0\0\0002\0\0\0", 23) = 23
poll([{fd=3, events=POLLIN|POLLOUT, revents=POLLOUT}], 1, 300000) = 1
poll([{fd=3, events=POLLIN, revents=POLLIN}], 1, 300000) = 1
read(3, "\v\0\0\0u\0\0\0\0\0\0", 32792) = 11
write(3, "\v\0\0\0x\0\0\2\0\0\0", 11) = 11
poll([{fd=3, events=POLLIN|POLLOUT, revents=POLLOUT}], 1, 300000) = 1
poll([{fd=3, events=POLLIN, revents=POLLIN}], 1, 300000) = 1
read(3, "\7\0\0\0y\0\0", 32792) = 7
write(3, "\30\0\0\0n\0\0\1\0\0\0\2\0\0\0\1\0\5\0clone", 24) = 24
poll([{fd=3, events=POLLIN|POLLOUT, revents=POLLOUT}], 1, 300000) = 1
poll([{fd=3, events=POLLIN, revents=POLLIN}], 1, 300000) = 1
read(3, "\26\0\0\0o\0\0\1\0\0\0\0\0\0\2\0\0\0\0\0\0\0", 32792) = 22
write(3, "\f\0\0\0p\0\0\2\0\0\0\0", 12) = 12
poll([{fd=3, events=POLLIN|POLLOUT, revents=POLLOUT}], 1, 300000) = 1
poll([{fd=3, events=POLLIN, revents=POLLIN}], 1, 300000) = 1
read(3, "\30\0\0\0q\0\0\0\0\0\0\0\2\0\0\0\0\0\0\0\0\0\0\0", 32792) = 24
write(3, "\27\0\0\0t\0\0\2\0\0\0\0\0\0\0\0\0\0\0?\0\0\0", 23) = 23
poll([{fd=3, events=POLLIN|POLLOUT, revents=POLLOUT}], 1, 300000) = 1
poll([{fd=3, events=POLLIN, revents=POLLIN}], 1, 300000) = 1
read(3, "\f\0\0\0u\0\0\1\0\0\0006", 32792) = 12
write(3, "\27\0\0\0t\0\0\2\0\0\0\1\0\0\0\0\0\0\0>\0\0\0", 23) = 23
poll([{fd=3, events=POLLIN|POLLOUT, revents=POLLOUT}], 1, 300000) = 1
poll([{fd=3, events=POLLIN, revents=POLLIN}], 1, 300000) = 1
read(3, "\v\0\0\0u\0\0\0\0\0\0", 32792) = 11
write(3, "\31\0\0\0n\0\0\1\0\0\0\3\0\0\0\2\0\1\0006\3\0ctl", 25) = 25
poll([{fd=3, events=POLLIN|POLLOUT, revents=POLLOUT}], 1, 300000) = 1
poll([{fd=3, events=POLLIN, revents=POLLIN}], 1, 300000) = 1
read(3, "#\0\0\0o\0\0\2\0\200\0\0\0\0\0\0\0\7\0\0\0\0\0\0\0\0\0\1\0\0\7\0"...,
32792) = 35
write(3, "\f\0\0\0p\0\0\3\0\0\0\1", 12) = 12
poll([{fd=3, events=POLLIN|POLLOUT, revents=POLLOUT}], 1, 300000) = 1
poll([{fd=3, events=POLLIN, revents=POLLIN}], 1, 300000) = 1
read(3, "\30\0\0\0q\0\0\0\0\0\0\0\1\0\0\7\0\0\0\0\0\0\0\0", 32792) = 24
write(3, "\32\0\0\0n\0\0\1\0\0\0\4\0\0\0\2\0\1\0006\4\0wait", 26) = 26
poll([{fd=3, events=POLLIN|POLLOUT, revents=POLLOUT}], 1, 300000) = 1
poll([{fd=3, events=POLLIN, revents=POLLIN}], 1, 300000) = 1
read(3, "#\0\0\0o\0\0\2\0\200\0\0\0\0\0\0\0\7\0\0\0\0\0\0\0\0\0\t\0\0\7\0"...,
32792) = 35
write(3, "\f\0\0\0p\0\0\4\0\0\0\0", 12) = 12
poll([{fd=3, events=POLLIN|POLLOUT, revents=POLLOUT}], 1, 300000) = 1
poll([{fd=3, events=POLLIN, revents=POLLIN}], 1, 300000) = 1
read(3, "\30\0\0\0q\0\0\0\0\0\0\0\t\0\0\7\0\0\0\0\0\0\0\0", 32792) = 24
write(3, "\33\0\0\0n\0\0\1\0\0\0\5\0\0\0\2\0\1\0006\5\0stdin", 27) = 27
poll([{fd=3, events=POLLIN|POLLOUT, revents=POLLOUT}], 1, 300000) = 1
poll([{fd=3, events=POLLIN, revents=POLLIN}], 1, 300000) = 1
read(3, "#\0\0\0o\0\0\2\0\200\0\0\0\0\0\0\0\7\0\0\0\0\0\0\0\0\0\5\0\0\7\0"...,
32792) = 35
write(3, "\f\0\0\0p\0\0\5\0\0\0\1", 12) = 12
poll([{fd=3, events=POLLIN|POLLOUT, revents=POLLOUT}], 1, 300000) = 1
poll([{fd=3, events=POLLIN, revents=POLLIN}], 1, 300000) = 1
read(3, "\30\0\0\0q\0\0\0\0\0\0\0\5\0\0\7\0\0\0\0\0\0\0\0", 32792) = 24
write(3, "\34\0\0\0n\0\0\1\0\0\0\6\0\0\0\2\0\1\0006\6\0stdout", 28) = 28
poll([{fd=3, events=POLLIN|POLLOUT, revents=POLLOUT}], 1, 300000) = 1
poll([{fd=3, events=POLLIN, revents=POLLIN}], 1, 300000) = 1
read(3, "#\0\0\0o\0\0\2\0\200\0\0\0\0\0\0\0\7\0\0\0\0\0\0\0\0\0\6\0\0\7\0"...,
32792) = 35
write(3, "\f\0\0\0p\0\0\6\0\0\0\0", 12) = 12
poll([{fd=3, events=POLLIN|POLLOUT, revents=POLLOUT}], 1, 300000) = 1
poll([{fd=3, events=POLLIN, revents=POLLIN}], 1, 300000) = 1
read(3, "\7\0\0\0y\0\0", 32792) = 7
stat("//Linux/x86_64", 0x7fff345357b0) = -1 ENOENT (No such file or directory)
socket(PF_INET, SOCK_STREAM, IPPROTO_IP) = 4
setsockopt(4, SOL_SOCKET, SO_REUSEADDR, [1], 4) = 0
socket(PF_INET, SOCK_STREAM, IPPROTO_IP) = 5
fcntl(5, F_SETFD, FD_CLOEXEC) = 0
bind(5, {sa_family=AF_INET, sin_port=htons(0),
sin_addr=inet_addr("0.0.0.0")}, 16) = 0
listen(5, 128) = 0
getsockname(5, {sa_family=AF_INET, sin_port=htons(39140),
sin_addr=inet_addr("0.0.0.0")}, [16]) = 0
fcntl(5, F_SETFL, O_RDONLY|O_NONBLOCK) = 0
write(3, "\31\0\0\0n\0\0\1\0\0\0\2\0\0\0\2\0\1\0006\3\0env", 25) = 25
poll([{fd=3, events=POLLIN|POLLOUT, revents=POLLOUT}, {fd=5,
events=POLLIN|POLLOUT}], 2, 300000) = 1
poll([{fd=3, events=POLLIN, revents=POLLIN}, {fd=5,
events=POLLIN|POLLOUT}], 2, 300000) = 1
read(3, "#\0\0\0o\0\0\2\0\200\0\0\0\0\0\0\0\7\0\0\0\0\0\0\0\0\0\4\0\0\7\0"...,
32792) = 35
write(3, "\f\0\0\0p\0\0\2\0\0\0\201", 12) = 12
poll([{fd=3, events=POLLIN|POLLOUT, revents=POLLOUT}, {fd=5,
events=POLLIN|POLLOUT}], 2, 300000) = 1
poll([{fd=3, events=POLLIN, revents=POLLIN}, {fd=5,
events=POLLIN|POLLOUT}], 2, 300000) = 1
read(3, "\30\0\0\0q\0\0\0\0\0\0\0\4\0\0\7\0\0\0\0\0\0\0\0", 32792) = 24
write(3, "\32\0\0\0n\0\0\1\0\0\0\10\0\0\0\2\0\1\0006\4\0argv", 26) = 26
poll([{fd=3, events=POLLIN|POLLOUT, revents=POLLOUT}, {fd=5,
events=POLLIN|POLLOUT}], 2, 300000) = 1
poll([{fd=3, events=POLLIN, revents=POLLIN}, {fd=5,
events=POLLIN|POLLOUT}], 2, 300000) = 1
read(3, "#\0\0\0o\0\0\2\0\200\0\0\0\0\0\0\0\7\0\0\0\0\0\0\0\0\0\3\0\0\7\0"...,
32792) = 35
write(3, "\f\0\0\0p\0\0\10\0\0\0\21", 12) = 12
poll([{fd=3, events=POLLIN|POLLOUT, revents=POLLOUT}], 1, 300000) = 1
poll([{fd=3, events=POLLIN, revents=POLLIN}], 1, 300000) = 1
read(3, "\30\0\0\0q\0\0\0\0\0\0\0\7\0\0\7\0\0\0\0\0\0\0\0", 32792) = 24
write(3, "\v\0\0\0x\0\0\2\0\0\0", 11) = 11
poll([{fd=3, events=POLLIN|POLLOUT, revents=POLLOUT}, {fd=5,
events=POLLIN|POLLOUT}], 2, 300000) = 1
poll([{fd=3, events=POLLIN, revents=POLLIN}, {fd=5,
events=POLLIN|POLLOUT}], 2, 300000) = 1
read(3, "\30\0\0\0q\0\0\0\0\0\0\0\3\0\0\7\0\0\0\0\0\0\0\0", 32792) = 24
write(3, "\30\0\0\0n\0\0\1\0\0\0\t\0\0\0\2\0\1\0006\2\0ns", 24) = 24
poll([{fd=3, events=POLLIN|POLLOUT, revents=POLLOUT}, {fd=5,
events=POLLIN|POLLOUT}], 2, 300000) = 1
poll([{fd=3, events=POLLIN, revents=POLLIN}, {fd=5,
events=POLLIN|POLLOUT}], 2, 300000) = 1
read(3, "\26\0\0\0o\0\0\1\0\200\0\0\0\0\0\0\0\7\0\0\0\0", 32792) = 22
write(3, "\v\0\0\0x\0\0\t\0\0\0", 11) = 11
poll([{fd=3, events=POLLIN|POLLOUT, revents=POLLOUT}, {fd=5,
events=POLLIN|POLLOUT}], 2, 300000) = 1
poll([{fd=3, events=POLLIN, revents=POLLIN}, {fd=5,
events=POLLIN|POLLOUT}], 2, 300000) = 1
read(3, "\7\0\0\0y\0\0", 32792) = 7
poll( <unfinished ...>
On Fri, Aug 29, 2008 at 8:29 PM, Daniel Gruner <[EMAIL PROTECTED]> wrote:
> Yes, I used the xrx command as normal. The back-slash is to escape
> the '!', which the shell
> (bash) interprets. That is not the problem. I will try to do the
> debug bit and/or strace, and post
> it for you guys to decipher...
>
> Daniel
>
> On Fri, Aug 29, 2008 at 6:11 PM, Abhishek Kulkarni <[EMAIL PROTECTED]> wrote:
>>
>>
>> On Fri, Aug 29, 2008 at 12:45 PM, Daniel Gruner <[EMAIL PROTECTED]> wrote:
>>>
>>> On 8/29/08, Abhishek Kulkarni <[EMAIL PROTECTED]> wrote:
>>> >
>>> >
>>> >
>>> > On Fri, Aug 29, 2008 at 10:13 AM, Daniel Gruner <[EMAIL PROTECTED]>
>>> > wrote:
>>> > >
>>> > > Hi Ab
>>> > >
>>> > >
>>> > > On 8/29/08, Abhishek Kulkarni <[EMAIL PROTECTED]> wrote:
>>> > > > Hi Daniel,
>>> > > >
>>> > > > Understand the way in which XCPU is supposed to integrate with
>>> > > > oneSIS
>>> > and/or
>>> > > > Perceus. It uses these as a "launch vehicle" to build minimal images
>>> > with
>>> > > > xcpufs running on them, and provision the nodes with these images.
>>> > > > In
>>> > the
>>> > > > best case, that's all that you need to be running on the compute
>>> > > > nodes.
>>> > >
>>> > > I understand.
>>> > >
>>> > >
>>> > > >
>>> > > > On Fri, Aug 29, 2008 at 8:46 AM, Daniel Gruner <[EMAIL PROTECTED]>
>>> > wrote:
>>> > > > >
>>> > > > > Hi Greg,
>>> > > > >
>>> > > > > I definitely have additional questions! :-)
>>> > > > >
>>> > > > > Ok, here we go:
>>> > > > >
>>> > > > > - assume I am totally new to this - what would one do in order to
>>> > > > > set
>>> > > > > up a perceus/xcpu cluster?
>>> > > >
>>> > > > As Greg said, you have two ways to go about it. You could choose
>>> > > > either
>>> > of
>>> > > > them or try both to see what works for ya. It's just a matter of
>>> > > > playing
>>> > > > with different configurations and rebooting your nodes to try them.
>>> > > >
>>> > > > >
>>> > > > >
>>> > > > > - now, I am not totally new to this game, and my background is
>>> > > > > with
>>> > > > > bproc clusters, so I would like to have a replacement for these,
>>> > > > > but
>>> > > > > with the same basic principle of having a minimal node
>>> > > > > installation,
>>> > > > > and basically no management of nodes needed. I definitely do not
>>> > > > > want
>>> > > > > to go to a model where the nodes have password files, and you ssh
>>> > > > > into
>>> > > > > them in order to run your codes.
>>> > > > >
>>> > > > > - in the caos-NSA installation, the warewulfd is started by
>>> > > > > default.
>>> > > > > I assume it needs to be stopped and perceus started, correct?
>>> > > >
>>> > > > You can enable Perceus from "sidekick" in NSA. Warewulf focuses on
>>> > cluster
>>> > > > monitoring starting with 3.0.
>>> > >
>>> > > Ok, I am concentrating on my RHEL5 machine for now. It seems to be
>>> > > working, at least insofar as the nodes boot. I haven't been able to
>>> > > contact them to try to do anything, other than running xstat with a
>>> > > positive response:
>>> > >
>>> > > n0000 tcp!10.10.0.170!6667 /Linux/x86_64 up 0
>>> > > n0001 tcp!10.10.0.185!6667 /Linux/x86_64 up 0
>>> > >
>>> > > I'd like the nodes to get sequential IP addresses, for ease of
>>> > > identification and management, and I have yet to find out how you do
>>> > > that in perceus.
>>> >
>>> > Take a look at the ipaddr module in Perceus.
>>>
>>> Thanks for the pointer. I am looking at it, but the manual leaves a
>>> lot to be desired in terms of describing what each module does and how
>>> to configure them. I'll try the perceus list if I keep getting stuck
>>> on this.
>>>
>>> >
>>> > >
>>> > >
>>> > > Now, when I try to do anything on the nodes I get, for example:
>>> > >
>>> > > xgroupset 10.10.0.170 root 0
>>> > > xgroupset: Error: Connection refused:10.10.0.170
>>> >
>>> > Whoops! What about telnet 10.10.0.170 6667?
>>> > Perceus might possibly be running xcpufs on some non-standard port. I'm
>>> > not
>>> > sure about that but I remember seeing something like that a while back.
>>>
>>> You seem to have hit it! I can in fact telnet using port 6667
>>> explicitly (can't do anything while in there...:-). I thought that
>>> was the default port anyway, correct?
>>>
>>> >
>>> > >
>>> > >
>>> > > similarly with xrx.
>>> > >
>>> > > xrx 10.10.0.170 /bin/date
>>> > > Error: Connection refused:10.10.0.170
>>> >
>>> > Ditto with this, if it's running on a different port you would want to
>>> > do
>>> > xrx 10.10.0.170!port /bin/date
>>> >
>>> > Alternatively you could specify the "-a" flag to retrieve the nodes from
>>> > the
>>> > statfs.
>>>
>>> I can get xgroupset and xuserset to work with the -a flag, with no
>>> complaints. However, when I try to run anything on the nodes using
>>> xrx, whether I use the -a flag or explicitly set the port (xrx
>>> 10.10.0.170\!6667 /bin/date) the command just hangs. I realize this
>>> is some progress, but no cigar yet.
>>
>> Weird. Did you use the above xrx command as-is? If yes, notice the
>> back-slash in your command.
>> I have not ever seen xrx hang that way. Try passing the "-d" switch
>> along with -a, to enable the debug mode.
>> If not, do the strace and post the output. It's not that tough. Really. It
>> should just work.
>>
>>>
>>> >
>>> > >
>>> > >
>>> > > I also don't get name resolution for the nXXXX names assigned to the
>>> > > nodes by perceus.
>>> > >
>>> > >
>>> >
>>> > Check your /etc/resolv.conf.
>>> > Probably try adding the following to it.
>>> > nameserver 127.0.0.1
>>> >
>>> > If that doesn't work, the right place to ask this would be the Perceus
>>> > ML.
>>>
>>> Doesn't work. I'll try the perceus gurus...
>>>
>>> >
>>> > >
>>> > >
>>> > >
>>> > > >
>>> > > > >
>>> > > > >
>>> > > > > - what initialization of perceus needs to be done (the first time
>>> > > > > it
>>> > > > > runs)? I know about the network interface specification, and that
>>> > > > > I
>>> > > > > want it to use xget (the default), but is running the "perceus
>>> > > > > module
>>> > > > > activate xcpu" enough to get the nodes booting into xcpu?
>>> > > >
>>> > > > Yes, it is enough to get xcpufs running on the compute nodes.
>>> > > >
>>> > > > >
>>> > > > >
>>> > > > > - what about configuring the resource manager (e.g. slurm) for use
>>> > > > > in
>>> > > > > the perceus/xcpu environment?
>>> > > >
>>> > > > XCPU only supports Moab Torque for now.
>>> > >
>>> > > Is this the open source torque, or just the commercial product?
>>>
>>>
>>> Who would know about which version of Torque this is? I can't afford
>>> the commercial Moab right now...
>>>
>>>
>>> > >
>>> > >
>>> > >
>>> > >
>>> > > >
>>> > > > >
>>> > > > >
>>> > > > > - I don't see the xcpufs and statfs daemons running on the master
>>> > > > > after starting perceus even though I told it to activate xcpu. I
>>> > > > > haven't tried to boot nodes yet, but I'd like to understand what I
>>> > > > > am
>>> > > > > doing first (I hate black boxes...).
>>> > > > >
>>> > > >
>>> > > > You shouldn't need to run xcpufs on the master. As for statfs, you
>>> > > > can
>>> > start
>>> > > > it manually if it is not running already.
>>> > > >
>>> > > > Again, considering that you have fully configured the master and
>>> > > > have
>>> > the
>>> > > > nodes provisioned to the init state, this is what I would do to
>>> > > > generate
>>> > my
>>> > > > statfs.conf --
>>> > > >
>>> > > > perceus node status | awk 'NR > 2 {print $1 "=tcp!" $3 "!6667"}' >
>>> > > > /etc/xcpu/statfs.conf
>>> > >
>>> > > I had to replace the part "NR>2" with "NR>0" for the above incantation
>>> > > to work (??).
>>> >
>>> > Strange, I am probably running a different version of Perceus.
>>>
>>> Actually, what happens is that the first two lines of output from the
>>> "perceus node status" command are output to stderr, and the rest to
>>> stdout. If your '|' redirection included stderr then the command as
>>> you wrote it would work. What shell are you using?
>>
>> Ahh, maybe. I'm using bash. I didn't realize that.
>>
>> Thanks,
>> -- Abhishek
>>
>>>
>>> Thanks,
>>>
>>> Daniel
>>>
>>>
>>>
>>> >
>>> > >
>>> > >
>>> > >
>>> > > >
>>> > > > And then,
>>> > > >
>>> > > > statfs -c /etc/xcpu/statfs.conf
>>> > >
>>> > > statfs seems to work. Here is the output from xstat:
>>> > >
>>> > > n0000 tcp!10.10.0.170!6667 /Linux/x86_64 up 0
>>> > > n0001 tcp!10.10.0.185!6667 /Linux/x86_64 up 0
>>> > >
>>> > > In any case, there is some progress, but it is not quite there yet...
>>> >
>>> > I'm glad you are almost there.
>>> >
>>> > Thanks,
>>> > -- Abhishek
>>> >
>>> >
>>> > >
>>> > >
>>> > > Thanks,
>>> > > Daniel
>>> > >
>>> > >
>>> > >
>>> > >
>>> > >
>>> > >
>>> > >
>>> > >
>>> > >
>>> > > >
>>> > > >
>>> > > > >
>>> > > > > etc.
>>> > > > >
>>> > > > > I guess the main problem I have is not with perceus itself (I have
>>> > > > > read the manual), but rather with its integration and provisioning
>>> > > > > for
>>> > > > > xcpu, and for the subsequent configuration of those pieces that
>>> > > > > make
>>> > > > > the cluster useable in a production environment.
>>> > > > >
>>> > > > >
>>> > > > > Thanks for your help,
>>> > > > > Daniel
>>> > > >
>>> > > > Thanks
>>> > > > -- Abhishek
>>> > > >
>>> > > > >
>>> > > > >
>>> > > > >
>>> > > > >
>>> > > > >
>>> > > > >
>>> > > > > On 8/29/08, Greg Kurtzer <[EMAIL PROTECTED]> wrote:
>>> > > > > >
>>> > > > > > You have multiple choices on how to move forward.
>>> > > > > >
>>> > > > > > First you can run the xcpu Perceus module like:
>>> > > > > >
>>> > > > > > # perceus module activate xcpu
>>> > > > > >
>>> > > > > > That will interrupt the node provisioning process and instead
>>> > > > > > of
>>> > > > > > copying the VNFS to the node it will just start up xcpu and
>>> > > > > > start
>>> > > > > > accepting connections.
>>> > > > > >
>>> > > > > > The second option would be to run xcpu from within the VNFS of
>>> > > > > > your
>>> > > > > > choice. That mechanism basically involves installing xcpu into
>>> > > > > > the
>>> > > > > > mounted VNFS image and then provision your nodes with that.
>>> > > > > >
>>> > > > > > Let me know if that helps or if you have additional questions.
>>> > > > > > :)
>>> > > > > >
>>> > > > > >
>>> > > > > > Greg
>>> > > > > >
>>> > > > > >
>>> > > > > >
>>> > > > > >
>>> > > > > > On Fri, Aug 29, 2008 at 6:45 AM, Daniel Gruner
>>> > > > > > <[EMAIL PROTECTED]>
>>> > > > wrote:
>>> > > > > > >
>>> > > > > > > Hi Kevin,
>>> > > > > > >
>>> > > > > > > Well, I've just completed installing xcpu2 and perceus into my RHEL5
>>> > > > > > > machine, but now I am stumped with the configuration. How do you tell
>>> > > > > > > perceus that you want your cluster to run xcpu? I sure don't
>>> > > > > > > understand where this is configured (I assume somewhere in the
>>> > > > > > > /etc/perceus .conf files), and there is no mention of that in the
>>> > > > > > > manual other than saying that xcpu works.
>>> > > > > > >
>>> > > > > > > If you install xcpu2 you surely would need 9p, right?
>>> > > > > > >
>>> > > > > > > Also, how does slurm integrate into the perceus/xcpu world?
>>> > > > > > >
>>> > > > > > > I have also installed this on a caos-NSA test machine, but
>>> > > > > > again
>>> > I
>>> > > > > > > don't know how to configure the provisioning.
>>> > > > > > >
>>> > > > > > > Any help with this would be much appreciated...
>>> > > > > > >
>>> > > > > > > Daniel
>>> > > > > > >
>>> > > > > > >
>>> > > > > > > On 8/28/08, Kevin Tegtmeier <[EMAIL PROTECTED]> wrote:
>>> > > > > > >> We used RHEL5 + perceus successfully. I had to modify the
>>> > perceus
>>> > > > boot
>>> > > > > > >> image for x86_64, but it may have been a kexec/hardware
>>> > > > > > specific
>>> > > > issue I ran
>>> > > > > > >> into. If you run into an issue with it I can help you
>>> > > > > > along.
>>> > > > > > >>
>>> > > > > > >> I don't think the 9P module was built in, but I don't think
>>> > > > > > you
>>> > > > would use
>>> > > > > > >> it.
>>> > > > > > >>
>>> > > > > > >>
>>> > > > > > >> On Thu, Aug 28, 2008 at 11:31 AM, Daniel Gruner
>>> > <[EMAIL PROTECTED]>
>>> > > > wrote:
>>> > > > > > >>
>>> > > > > > >> >
>>> > > > > > >> > Thanks, Abhishek.
>>> > > > > > >> >
>>> > > > > > >> > I will try it and report on my success/lack thereof.
>>> > > > > > >> >
>>> > > > > > >> > Just for info, I am using a RHEL5 distribution, but with
>>> > > > > > the
>>> > > > 2.6.26
>>> > > > > > >> > kernel so that it supports 9p. Has anybody been
>>> > > > > > successful
>>> > with
>>> > > > this
>>> > > > > > >> > distribution? Otherwise, is there a preferred one?
>>> > > > > > >> >
>>> > > > > > >> > Daniel
>>> > > > > > >> >
>>> > > > > > >> >
>>> > > > > > >> >
>>> > > > > > >> >
>>> > > > > > >> > On 8/28/08, Abhishek Kulkarni <[EMAIL PROTECTED]> wrote:
>>> > > > > > >> > >
>>> > > > > > >> > > Daniel,
>>> > > > > > >> > >
>>> > > > > > >> > > It is _not_ necessary to install cAos Linux to use
>>> > > > > > Perceus.
>>> > > > Perceus
>>> > > > > > >> > > supports most, if not all, distributions.
>>> > > > > > >> > >
>>> > > > > > >> > > XCPU is bundled up as a module within Perceus. The documentation at
>>> > > > > > >> > > http://www.perceus.org/docs/perceus-userguide-1.4.0.pdf is quite
>>> > > > > > >> > > extensive at that and has details on importing and activating modules.
>>> > > > > > >> > > It's quite simple even if you find yourself wanting to tinker with the
>>> > > > > > >> > > XCPU Perceus module (it's just a shell script that runs at a specified
>>> > > > > > >> > > provisioning state/level)
>>> > > > > > >> > >
>>> > > > > > >> > >
>>> > > > > > >> > > -- Abhishek
>>> > > > > > >> > >
>>> > > > > > >> > >
>>> > > > > > >> > > On Thu, 2008-08-28 at 14:17 -0400, Daniel Gruner wrote:
>>> > > > > > >> > > > Yes, that is a possibility. Instructions on that,
>>> > please?
>>> > > > > > >> > > > I tried installing caos linux, but it doesn't quite
>>> > finish
>>> > > > doing the
>>> > > > > > >> install.
>>> > > > > > >> > > >
>>> > > > > > >> > > > Daniel
>>> > > > > > >> > > >
>>> > > > > > >> > > > On 8/28/08, ron minnich <[EMAIL PROTECTED]> wrote:
>>> > > > > > >> > > > >
>>> > > > > > >> > > > > Use perceus.
>>> > > > > > >> > > > >
>>> > > > > > >> > > > > Ron
>>> > > > > > >> > > > >
>>> > > > > > >> > > > >
>>> > > > > > >> > > > > On 8/28/08, Daniel Gruner <[EMAIL PROTECTED]>
>>> > > > > > wrote:
>>> > > > > > >> > > > > >
>>> > > > > > >> > > > > > Hi All,
>>> > > > > > >> > > > > >
>>> > > > > > >> > > > > > The list has been very quiet lately... :-)
>>> > > > > > >> > > > > >
>>> > > > > > >> > > > > > I've been trying, yet again, to install the latest xcpu2 in a test
>>> > > > > > >> > > > > > cluster. Ron's instructions on the xcpu.org site seem to be outdated,
>>> > > > > > >> > > > > > and partly buggy too. For instance, here are a couple of points:
>>> > > > > > >> > > > > >
>>> > > > > > >> > > > > > - After doing:
>>> > > > > > >> > > > > >
>>> > > > > > >> > > > > > make xcpu-tarball
>>> > > > > > >> > > > > >
>>> > > > > > >> > > > > > make ramfs-tarball
>>> > > > > > >> > > > > >
>>> > > > > > >> > > > > > make install
>>> > > > > > >> > > > > >
>>> > > > > > >> > > > > > I don't know whether xcpu2 has actually been built (I suspect not),
>>> > > > > > >> > > > > > and it certainly has not been installed (e.g. no xrx, or xcpufs, or
>>> > > > > > >> > > > > > any of that stuff has been installed).
>>> > > > > > >> > > > > >
>>> > > > > > >> > > > > > - The command
>>> > > > > > >> > > > > >
>>> > > > > > >> > > > > > export u=`uname -r`
>>> > > > > > >> > > > > > ./mk-initramfs-oneSIS -f initrd-$u.img $u -nn -rr \
>>> > > > > > >> > > > > > -o ../overlays/xcpu-64 \
>>> > > > > > >> > > > > > -w e1000 \
>>> > > > > > >> > > > > > -w forcedeth \
>>> > > > > > >> > > > > > -w ext3
>>> > > > > > >> > > > > >
>>> > > > > > >> > > > > > should really be
>>> > > > > > >> > > > > >
>>> > > > > > >> > > > > > ./mk-xcpu-oneSIS ....
>>> > > > > > >> > > > > >
>>> > > > > > >> > > > > > in order that the 9p and 9pnet modules get
>>> > > > > > loaded
>>> > into
>>> > > > the
>>> > > > > > >> initrd.
>>> > > > > > >> > > > > >
>>> > > > > > >> > > > > > Can someone please take a look and revise the
>>> > > > instructions (and
>>> > > > > > >> let us
>>> > > > > > >> > > > > > mere mortals know what to do)?
>>> > > > > > >> > > > > >
>>> > > > > > >> > > > > >
>>> > > > > > >> > > > > > Furthermore, is xcpu2 actually usable for production work? What about
>>> > > > > > >> > > > > > its integration with a scheduler/resource manager? What about MPI?
>>> > > > > > >> > > > > >
>>> > > > > > >> > > > > > Regards,
>>> > > > > > >> > > > > > Daniel
>>> > > > > > >> > > > > >
>>> > > > > > >> > > > >
>>> > > > > > >> > > > >
>>> > > > > > >> > > > > --
>>> > > > > > >> > > > > Sent from Gmail for mobile | mobile.google.com
>>> > > > > > >> > > > >
>>> > > > > > >> > >
>>> > > > > > >> > >
>>> > > > > > >> >
>>> > > > > > >>
>>> > > > > > >>
>>> > > > > > >
>>> > > > > >
>>> > > > > >
>>> > > > > >
>>> > > > > >
>>> > > > > > --
>>> > > > > > Greg Kurtzer
>>> > > > > > http://www.infiscale.com/
>>> > > > > > http://www.runlevelzero.net/
>>> > > > > > http://www.perceus.org/
>>> > > > > > http://www.caoslinux.org/
>>> > > > > >
>>> > > > >
>>> > > >
>>> > > >
>>> > >
>>> >
>>> >
>>
>>
>