Hi, thank t35t0r!
I have tried your script, but still got the same problem.

> Then I run iozone on node73:
> /***********************************************************/
> d...@node73 ~ $ iozone -s 1m -Rb log.xls  -t 1 -+m clientlist
>        Iozone: Performance Test of File I/O
>                Version $Revision: 3.242 $
>                Compiled for 64 bit mode.
>                Build: linux-AMD64
[...]
>        Run began: Thu Jan  8 23:11:13 2009
>
>        File size set to 1024 KB
>        Excel chart generation enabled
>        Network distribution mode enabled.
>        Command line used: iozone -s 1m -Rb log.xls -t 1 -+m clientlist
>        Output is in Kbytes/sec
>        Time Resolution = 0.000001 seconds.
>        Processor cache size set to 1024 Kbytes.
>        Processor cache line size set to 32 bytes.
>        File stride size set to 17 * record size.
>        Throughput test with 1 process
>        Each process writes a 1024 Kbyte file in 4 Kbyte records
> /******************************************************/
> Then iozone stoped here.
>
> I still use strace to see what happend:
> /******************************************************/
> d...@node73 ~ $ strace iozone -s 1m -Rb log.xls  -t 1 -+m clientlist
> execve("/usr/bin/iozone", ["iozone", "-s", "1m", "-Rb", "log.xls",
> "-t", "1", "-+m", "clientlist"], [/* 45 vars */]) = 0
> brk(0)                                  = 0x7cb000
> mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1,
> 0) = 0x7f67f3639000
> mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1,
> 0) = 0x7f67f3638000
> access("/etc/ld.so.preload", R_OK)      = -1 ENOENT (No such file or 
> directory)
> open("/etc/ld.so.cache", O_RDONLY)      = 3
> fstat(3, {st_mode=S_IFREG|0644, st_size=48606, ...}) = 0
> mmap(NULL, 48606, PROT_READ, MAP_PRIVATE, 3, 0) = 0x7f67f362c000
> close(3)                                = 0
> open("/lib/librt.so.1", O_RDONLY)       = 3
> read(3, "\177ELF\2\1\1\0\0\0\0\0\0\0\0\0\3\0>\0\1\0\0\0\300\"\0\0\0\0\0\0"...,
> 832) = 832
> fstat(3, {st_mode=S_IFREG|0755, st_size=35688, ...}) = 0
> mmap(NULL, 2132968, PROT_READ|PROT_EXEC, MAP_PRIVATE|MAP_DENYWRITE, 3,
> 0) = 0x7f67f3217000
> mprotect(0x7f67f321f000, 2093056, PROT_NONE) = 0
> mmap(0x7f67f341e000, 8192, PROT_READ|PROT_WRITE,
> MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x7000) = 0x7f67f341e000
> close(3)                                = 0
> open("/lib/libpthread.so.0", O_RDONLY)  = 3
> read(3, "\177ELF\2\1\1\0\0\0\0\0\0\0\0\0\3\0>\0\1\0\0\0\240W\0\0\0\0\0\0"...,
> 832) = 832
> fstat(3, {st_mode=S_IFREG|0755, st_size=131577, ...}) = 0
> mmap(NULL, 2204528, PROT_READ|PROT_EXEC, MAP_PRIVATE|MAP_DENYWRITE, 3,
> 0) = 0x7f67f2ffc000
> mprotect(0x7f67f3011000, 2097152, PROT_NONE) = 0
> mmap(0x7f67f3211000, 8192, PROT_READ|PROT_WRITE,
> MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x15000) = 0x7f67f3211000
> mmap(0x7f67f3213000, 13168, PROT_READ|PROT_WRITE,
> MAP_PRIVATE|MAP_FIXED|MAP_ANONYMOUS, -1, 0) = 0x7f67f3213000
> close(3)                                = 0
> open("/lib/libc.so.6", O_RDONLY)        = 3
> read(3, 
> "\177ELF\2\1\1\0\0\0\0\0\0\0\0\0\3\0>\0\1\0\0\0\220\334\1\0\0\0\0\0"...,
> 832) = 832
> fstat(3, {st_mode=S_IFREG|0755, st_size=1293456, ...}) = 0
> mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1,
> 0) = 0x7f67f362b000
> mmap(NULL, 3399928, PROT_READ|PROT_EXEC, MAP_PRIVATE|MAP_DENYWRITE, 3,
> 0) = 0x7f67f2cbd000
> mprotect(0x7f67f2df3000, 2093056, PROT_NONE) = 0
> mmap(0x7f67f2ff2000, 20480, PROT_READ|PROT_WRITE,
> MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x135000) = 0x7f67f2ff2000
> mmap(0x7f67f2ff7000, 16632, PROT_READ|PROT_WRITE,
> MAP_PRIVATE|MAP_FIXED|MAP_ANONYMOUS, -1, 0) = 0x7f67f2ff7000
> close(3)                                = 0
> mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1,
> 0) = 0x7f67f362a000
> arch_prctl(ARCH_SET_FS, 0x7f67f362a6f0) = 0
> mprotect(0x7f67f2ff2000, 16384, PROT_READ) = 0
> mprotect(0x7f67f3211000, 4096, PROT_READ) = 0
> mprotect(0x7f67f341e000, 4096, PROT_READ) = 0
> mprotect(0x62a000, 4096, PROT_READ)     = 0
> mprotect(0x7f67f363a000, 4096, PROT_READ) = 0
> munmap(0x7f67f362c000, 48606)           = 0
> set_tid_address(0x7f67f362a780)         = 31886
> set_robust_list(0x7f67f362a790, 0x18)   = 0
> rt_sigaction(SIGRTMIN, {0x7f67f3001310, [], SA_RESTORER|SA_SIGINFO,
> 0x7f67f3009ec0}, NULL, 8) = 0
> rt_sigaction(SIGRT_1, {0x7f67f3001390, [],
> SA_RESTORER|SA_RESTART|SA_SIGINFO, 0x7f67f3009ec0}, NULL, 8) = 0
> rt_sigprocmask(SIG_UNBLOCK, [RTMIN RT_1], NULL, 8) = 0
> getrlimit(RLIMIT_STACK, {rlim_cur=8192*1024, rlim_max=RLIM_INFINITY}) = 0
> uname({sys="Linux", node="Gentoo-F312-73", ...}) = 0
> brk(0)                                  = 0x7cb000
> brk(0x7ec000)                           = 0x7ec000
> open("/etc/localtime", O_RDONLY)        = 3
> fstat(3, {st_mode=S_IFREG|0644, st_size=405, ...}) = 0
> fstat(3, {st_mode=S_IFREG|0644, st_size=405, ...}) = 0
> mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1,
> 0) = 0x7f67f3637000
> read(3, "TZif2\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\3\0\0\0\3\0\0\0\0"...,
> 4096) = 405
> lseek(3, -240, SEEK_CUR)                = 165
> read(3, "TZif2\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\0\3\0\0\0\3\0\0\0\0"...,
> 4096) = 240
> close(3)                                = 0
> munmap(0x7f67f3637000, 4096)            = 0
> rt_sigaction(SIGINT, {0x408b2c, [INT], SA_RESTORER|SA_RESTART,
> 0x7f67f2ced430}, {SIG_DFL}, 8) = 0
> rt_sigaction(SIGTERM, {0x408b2c, [TERM], SA_RESTORER|SA_RESTART,
> 0x7f67f2ced430}, {SIG_DFL}, 8) = 0
> mmap(NULL, 18878464, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS,
> -1, 0) = 0x7f67f1abc000
> open("clientlist", O_RDONLY)            = 3
> fstat(3, {st_mode=S_IFREG|0644, st_size=30, ...}) = 0
> mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1,
> 0) = 0x7f67f3637000
> read(3, "node74 /home/dnfs /tmp/iozone\n", 4096) = 30
> read(3, "", 4096)                       = 0
> close(3)                                = 0
> munmap(0x7f67f3637000, 4096)            = 0
> write(1, "\tIozone: Performance Test of Fil"..., 38     Iozone:
> Performance Test of File I/O
> ) = 38
> write(1, "\t        Version $Revision: 3.24"..., 64
> Version $Revision: 3.242 $
>                Compiled for 64 bit mode.
> ) = 64
> write(1, "\t\tBuild: linux-AMD64 \n\n", 23              Build: linux-AMD64
>
> ) = 23
> write(1, "\tContributors:William Norcott, D"..., 71
> Contributors:William Norcott, Don Capps, Isom Crawford, Kirby Collins
> ) = 71
> write(1, "\t             Al Slater, Scott R"..., 60
> Al Slater, Scott Rhine, Mike Wisner, Ken Goss
> ) = 60
> write(1, "\t             Steve Landherr, Br"..., 69
> Steve Landherr, Brad Smith, Mark Kelly, Dr. Alain CYR,
> ) = 69
> write(1, "\t             Randy Dunlap, Mark"..., 57
> Randy Dunlap, Mark Montague, Dan Million,
> ) = 57
> write(1, "\t             Jean-Marc Zucconi,"..., 48
> Jean-Marc Zucconi, Jeff Blomberg,
> ) = 48
> write(1, "\t             Erik Habbinga, Kri"..., 58
> Erik Habbinga, Kris Strecker, Walter Wong.
>
> ) = 58
> write(1, "\tRun began: Thu Jan  8 23:12:20 "..., 38     Run began: Thu
> Jan  8 23:12:20 2009
>
> ) = 38
> write(1, "\tFile size set to 1024 KB\n", 26     File size set to 1024 KB
> ) = 26
> write(1, "\tExcel chart generation enabled\n", 32       Excel chart
> generation enabled
> ) = 32
> write(1, "\tNetwork distribution mode enabl"..., 36     Network
> distribution mode enabled.
> ) = 36
> write(1, "\tCommand line used:", 19     Command line used    = 19
> write(1, " iozone", 7 iozone)                  = 7
> write(1, " -s", 3 -s)                      = 3
> write(1, " 1m", 3 1m)                      = 3
> write(1, " -Rb", 4 -Rb)                     = 4
> write(1, " log.xls", 8 log.xls)                 = 8
> write(1, " -t", 3 -t)                      = 3
> write(1, " 1", 2 1)                       = 2
> write(1, " -+m", 4 -+m)                     = 4
> write(1, " clientlist", 11 clientlist)             = 11
> write(1, "\n", 1
> )                       = 1
> write(1, "\tOutput is in Kbytes/sec", 24        Output is in Kbytes/sec) = 24
> write(1, "\n", 1
> )                       = 1
> write(1, "\tTime Resolution = 0.000001 seco"..., 37     Time
> Resolution = 0.000001 seconds.
> ) = 37
> write(1, "\tProcessor cache size set to 102"..., 42     Processor
> cache size set to 1024 Kbytes.
> ) = 42
> write(1, "\tProcessor cache line size set t"..., 44     Processor
> cache line size set to 32 bytes.
> ) = 44
> write(1, "\tFile stride size set to 17 * re"..., 43     File stride
> size set to 17 * record size.
> ) = 43
> write(1, "\tThroughput test with 1 process\n", 32       Throughput
> test with 1 process
> ) = 32
> shmget(IPC_PRIVATE, 16384, IPC_CREAT|0666) = 1376256
> shmat(1376256, 0, 0)                    = ?
> shmctl(1376256, IPC_RMID, 0)            = 0
> write(1, "\tEach process writes a 1024 Kbyt"..., 58     Each process
> writes a 1024 Kbyte file in 4 Kbyte records
> ) = 58
> socket(PF_INET, SOCK_DGRAM, IPPROTO_IP) = 3
> setsockopt(3, SOL_SOCKET, SO_RCVBUF, [262144], 4) = 0
> bind(3, {sa_family=AF_INET, sin_port=htons(20000),
> sin_addr=inet_addr("0.0.0.0")}, 16) = 0
> rt_sigaction(SIGINT, {SIG_IGN}, {0x408b2c, [INT],
> SA_RESTORER|SA_RESTART, 0x7f67f2ced430}, 8) = 0
> rt_sigaction(SIGQUIT, {SIG_IGN}, {SIG_DFL}, 8) = 0
> rt_sigprocmask(SIG_BLOCK, [CHLD], [], 8) = 0
> clone(child_stack=0, flags=CLONE_PARENT_SETTID|SIGCHLD,
> parent_tidptr=0x7ffffb6398b8) = 31887
> wait4(31887, [{WIFEXITED(s) && WEXITSTATUS(s) == 0}], 0, NULL) = 31887
> rt_sigaction(SIGINT, {0x408b2c, [INT], SA_RESTORER|SA_RESTART,
> 0x7f67f2ced430}, NULL, 8) = 0
> rt_sigaction(SIGQUIT, {SIG_DFL}, NULL, 8) = 0
> rt_sigprocmask(SIG_SETMASK, [], NULL, 8) = 0
> --- SIGCHLD (Child exited) @ 0 (0) ---
> recvfrom(3,
> /******************************************************/

I still have the output of tcpdump when the command above executed:
/******************************************************/
node74 ~ # tcpdump host node73 -vv and not arp
tcpdump: listening on eth0, link-type EN10MB (Ethernet), capture size 68 bytes
23:37:17.048678 IP (tos 0x0, ttl 64, id 28484, offset 0, flags [DF],
proto TCP (6), length 60) node73.36691 > node74.ssh: S
1224275785:1224275785(0) win 5840 <mss 1460,sackOK,timestamp
415078413[|tcp]>
23:37:17.049350 IP (tos 0x0, ttl 64, id 0, offset 0, flags [DF], proto
TCP (6), length 60) node74.ssh > node73.36691: S
2873253591:2873253591(0) ack 1224275786 win 5792 <mss
1460,sackOK,timestamp 414802723[|tcp]>
23:37:17.048719 IP (tos 0x0, ttl 64, id 28485, offset 0, flags [DF],
proto TCP (6), length 52) node73.36691 > node74.ssh: ., cksum 0xee0e
(correct), 1:1(0) ack 1 win 92 <nop,nop,timestamp 415078413 414802723>
23:37:17.054017 IP (tos 0x0, ttl 64, id 15867, offset 0, flags [DF],
proto TCP (6), length 72) node74.ssh > node73.36691: P 1:21(20) ack 1
win 91 <nop,nop,timestamp 414802724 415078413>
23:37:17.054077 IP (tos 0x0, ttl 64, id 28486, offset 0, flags [DF],
proto TCP (6), length 52) node73.36691 > node74.ssh: ., cksum 0xedf8
(correct), 1:1(0) ack 21 win 92 <nop,nop,timestamp 415078414
414802724>
23:37:17.054163 IP (tos 0x0, ttl 64, id 28487, offset 0, flags [DF],
proto TCP (6), length 72) node73.36691 > node74.ssh: P 1:21(20) ack 21
win 92 <nop,nop,timestamp 415078414 414802724>
23:37:17.054182 IP (tos 0x0, ttl 64, id 15868, offset 0, flags [DF],
proto TCP (6), length 52) node74.ssh > node73.36691: ., cksum 0xede5
(correct), 21:21(0) ack 21 win 91 <nop,nop,timestamp 414802724
415078414>
23:37:17.054387 IP (tos 0x0, ttl 64, id 28488, offset 0, flags [DF],
proto TCP (6), length 844) node73.36691 > node74.ssh: P 21:813(792)
ack 21 win 92 <nop,nop,timestamp 415078414 414802724>
23:37:17.054403 IP (tos 0x0, ttl 64, id 15869, offset 0, flags [DF],
proto TCP (6), length 52) node74.ssh > node73.36691: ., cksum 0xeab4
(correct), 21:21(0) ack 813 win 116 <nop,nop,timestamp 414802724
415078414>
23:37:17.055050 IP (tos 0x0, ttl 64, id 15870, offset 0, flags [DF],
proto TCP (6), length 836) node74.ssh > node73.36691: P 21:805(784)
ack 813 win 116 <nop,nop,timestamp 414802725 415078414>
23:37:17.055274 IP (tos 0x0, ttl 64, id 28489, offset 0, flags [DF],
proto TCP (6), length 76) node73.36691 > node74.ssh: P 813:837(24) ack
805 win 116 <nop,nop,timestamp 415078414 414802725>
23:37:17.057803 IP (tos 0x0, ttl 64, id 15871, offset 0, flags [DF],
proto TCP (6), length 204) node74.ssh > node73.36691: P 805:957(152)
ack 837 win 116 <nop,nop,timestamp 414802725 415078414>
23:37:17.059087 IP (tos 0x0, ttl 64, id 28490, offset 0, flags [DF],
proto TCP (6), length 196) node73.36691 > node74.ssh: P 837:981(144)
ack 957 win 141 <nop,nop,timestamp 415078415 414802725>
23:37:17.068091 IP (tos 0x0, ttl 64, id 15872, offset 0, flags [DF],
proto TCP (6), length 772) node74.ssh > node73.36691: P 957:1677(720)
ack 981 win 140 <nop,nop,timestamp 414802728 415078415>
23:37:17.069761 IP (tos 0x0, ttl 64, id 28491, offset 0, flags [DF],
proto TCP (6), length 68) node73.36691 > node74.ssh: P 981:997(16) ack
1677 win 165 <nop,nop,timestamp 415078418 414802728>
23:37:17.107120 IP (tos 0x0, ttl 64, id 15873, offset 0, flags [DF],
proto TCP (6), length 52) node74.ssh > node73.36691: ., cksum 0xe35a
(correct), 1677:1677(0) ack 997 win 140 <nop,nop,timestamp 414802738
415078418>
23:37:17.107161 IP (tos 0x0, ttl 64, id 28492, offset 0, flags [DF],
proto TCP (6), length 100) node73.36691 > node74.ssh: P 997:1045(48)
ack 1677 win 165 <nop,nop,timestamp 415078427 414802738>
23:37:17.107169 IP (tos 0x0, ttl 64, id 15874, offset 0, flags [DF],
proto TCP (6), length 52) node74.ssh > node73.36691: ., cksum 0xe321
(correct), 1677:1677(0) ack 1045 win 140 <nop,nop,timestamp 414802738
415078427>
23:37:17.107206 IP (tos 0x0, ttl 64, id 15875, offset 0, flags [DF],
proto TCP (6), length 100) node74.ssh > node73.36691: P 1677:1725(48)
ack 1045 win 140 <nop,nop,timestamp 414802738 415078427>
23:37:17.107383 IP (tos 0x0, ttl 64, id 28493, offset 0, flags [DF],
proto TCP (6), length 116) node73.36691 > node74.ssh: P 1045:1109(64)
ack 1725 win 165 <nop,nop,timestamp 415078427 414802738>
23:37:17.109273 IP (tos 0x0, ttl 64, id 15876, offset 0, flags [DF],
proto TCP (6), length 132) node74.ssh > node73.36691: P 1725:1805(80)
ack 1109 win 140 <nop,nop,timestamp 414802738 415078427>
23:37:17.109407 IP (tos 0x0, ttl 64, id 28494, offset 0, flags [DF],
proto TCP (6), length 420) node73.36691 > node74.ssh: P 1109:1477(368)
ack 1805 win 165 <nop,nop,timestamp 415078428 414802738>
23:37:17.109920 IP (tos 0x0, ttl 64, id 15877, offset 0, flags [DF],
proto TCP (6), length 372) node74.ssh > node73.36691: P 1805:2125(320)
ack 1477 win 165 <nop,nop,timestamp 414802738 415078428>
23:37:17.119287 IP (tos 0x0, ttl 64, id 28495, offset 0, flags [DF],
proto TCP (6), length 692) node73.36691 > node74.ssh: P 1477:2117(640)
ack 2125 win 190 <nop,nop,timestamp 415078430 414802738>
23:37:17.119941 IP (tos 0x0, ttl 64, id 15878, offset 0, flags [DF],
proto TCP (6), length 84) node74.ssh > node73.36691: P 2125:2157(32)
ack 2117 win 190 <nop,nop,timestamp 414802741 415078430>
23:37:17.120157 IP (tos 0x0, ttl 64, id 28496, offset 0, flags [DF],
proto TCP (6), length 116) node73.36691 > node74.ssh: P 2117:2181(64)
ack 2157 win 190 <nop,nop,timestamp 415078431 414802741>
23:37:17.121928 IP (tos 0x0, ttl 64, id 15879, offset 0, flags [DF],
proto TCP (6), length 100) node74.ssh > node73.36691: P 2157:2205(48)
ack 2181 win 190 <nop,nop,timestamp 414802741 415078431>
23:37:17.122090 IP (tos 0x8, ttl 64, id 28497, offset 0, flags [DF],
proto TCP (6), length 148) node73.36691 > node74.ssh: P 2181:2277(96)
ack 2205 win 190 <nop,nop,timestamp 415078431 414802741>
23:37:17.124942 IP (tos 0x8, ttl 64, id 15880, offset 0, flags [DF],
proto TCP (6), length 100) node74.ssh > node73.36691: P 2205:2253(48)
ack 2277 win 190 <nop,nop,timestamp 414802742 415078431>
23:37:17.125095 IP (tos 0x8, ttl 64, id 28498, offset 0, flags [DF],
proto TCP (6), length 84) node73.36691 > node74.ssh: P 2277:2309(32)
ack 2253 win 190 <nop,nop,timestamp 415078432 414802742>
23:37:17.127056 IP (tos 0x8, ttl 64, id 15881, offset 0, flags [DF],
proto TCP (6), length 180) node74.ssh > node73.36691: P 2253:2381(128)
ack 2309 win 190 <nop,nop,timestamp 414802742 415078432>
23:37:17.127219 IP (tos 0x8, ttl 64, id 28499, offset 0, flags [DF],
proto TCP (6), length 84) node73.36691 > node74.ssh: P 2309:2341(32)
ack 2381 win 214 <nop,nop,timestamp 415078432 414802742>
23:37:17.127340 IP (tos 0x8, ttl 64, id 28500, offset 0, flags [DF],
proto TCP (6), length 52) node73.36691 > node74.ssh: F, cksum 0xdafd
(correct), 2341:2341(0) ack 2381 win 214 <nop,nop,timestamp 415078432
414802742>
23:37:17.127902 IP (tos 0x8, ttl 64, id 15882, offset 0, flags [DF],
proto TCP (6), length 52) node74.ssh > node73.36691: F, cksum 0xdb13
(correct), 2381:2381(0) ack 2342 win 190 <nop,nop,timestamp 414802743
415078432>
23:37:17.127954 IP (tos 0x8, ttl 64, id 28501, offset 0, flags [DF],
proto TCP (6), length 52) node73.36691 > node74.ssh: ., cksum 0xdafb
(correct), 2342:2342(0) ack 2382 win 214 <nop,nop,timestamp 415078432
414802743>
/************************************************/

I have tried iozone3_242 and iozone3_303 on gentoo and RHEL4, all the
result is similar. I guess maybe process I configed and ran iozone is
incorrect.
Anybody have the details of how to run iozone across multiple nodes?
-- 
wcw

Reply via email to