[ https://issues.apache.org/jira/browse/YARN-687?page=com.atlassian.jira.plugin.system.issuetabpanels:comment-tabpanel&focusedCommentId=13658843#comment-13658843 ]

Steve Loughran commented on YARN-687:
-------------------------------------

Thread dump from the hanging test run:
{code}
Running org.apache.hadoop.yarn.server.nodemanager.TestNMAuditLogger
2013-05-15 21:21:39
Full thread dump OpenJDK 64-Bit Server VM (20.0-b12 mixed mode):
"IPC Server handler 4 on 32868" daemon prio=10 tid=0x00007fc9ec4da000 
nid=0x359e waiting on condition [0x00007fc9e8af9000]
   java.lang.Thread.State: WAITING (parking)
        at sun.misc.Unsafe.park(Native Method)
        - parking to wait for  <0x00000000ebaf1720> (a 
java.util.concurrent.locks.AbstractQueuedSynchronizer$ConditionObject)
        at java.util.concurrent.locks.LockSupport.park(LockSupport.java:186)
        at 
java.util.concurrent.locks.AbstractQueuedSynchronizer$ConditionObject.await(AbstractQueuedSynchronizer.java:2043)
        at 
java.util.concurrent.LinkedBlockingQueue.take(LinkedBlockingQueue.java:386)
        at org.apache.hadoop.ipc.Server$Handler.run(Server.java:1817)
"IPC Server handler 3 on 32868" daemon prio=10 tid=0x00007fc9ec4b8000 
nid=0x359d waiting on condition [0x00007fc9e8bfa000]
   java.lang.Thread.State: WAITING (parking)
        at sun.misc.Unsafe.park(Native Method)
        - parking to wait for  <0x00000000ebaf1720> (a 
java.util.concurrent.locks.AbstractQueuedSynchronizer$ConditionObject)
        at java.util.concurrent.locks.LockSupport.park(LockSupport.java:186)
        at 
java.util.concurrent.locks.AbstractQueuedSynchronizer$ConditionObject.await(AbstractQueuedSynchronizer.java:2043)
        at 
java.util.concurrent.LinkedBlockingQueue.take(LinkedBlockingQueue.java:386)
        at org.apache.hadoop.ipc.Server$Handler.run(Server.java:1817)
"IPC Server handler 2 on 32868" daemon prio=10 tid=0x00007fc9ec4b7000 
nid=0x359c waiting on condition [0x00007fc9e8cfb000]
   java.lang.Thread.State: WAITING (parking)
        at sun.misc.Unsafe.park(Native Method)
        - parking to wait for  <0x00000000ebaf1720> (a 
java.util.concurrent.locks.AbstractQueuedSynchronizer$ConditionObject)
        at java.util.concurrent.locks.LockSupport.park(LockSupport.java:186)
        at 
java.util.concurrent.locks.AbstractQueuedSynchronizer$ConditionObject.await(AbstractQueuedSynchronizer.java:2043)
        at 
java.util.concurrent.LinkedBlockingQueue.take(LinkedBlockingQueue.java:386)
        at org.apache.hadoop.ipc.Server$Handler.run(Server.java:1817)
"IPC Server handler 1 on 32868" daemon prio=10 tid=0x00007fc9ec41b800 
nid=0x359b waiting on condition [0x00007fc9e8dfc000]
   java.lang.Thread.State: WAITING (parking)
        at sun.misc.Unsafe.park(Native Method)
        - parking to wait for  <0x00000000ebaf1720> (a 
java.util.concurrent.locks.AbstractQueuedSynchronizer$ConditionObject)
        at java.util.concurrent.locks.LockSupport.park(LockSupport.java:186)
        at 
java.util.concurrent.locks.AbstractQueuedSynchronizer$ConditionObject.await(AbstractQueuedSynchronizer.java:2043)
        at 
java.util.concurrent.LinkedBlockingQueue.take(LinkedBlockingQueue.java:386)
        at org.apache.hadoop.ipc.Server$Handler.run(Server.java:1817)
"IPC Server handler 0 on 32868" daemon prio=10 tid=0x00007fc9ec414000 
nid=0x359a waiting on condition [0x00007fc9e8efd000]
   java.lang.Thread.State: WAITING (parking)
        at sun.misc.Unsafe.park(Native Method)
        - parking to wait for  <0x00000000ebaf1720> (a 
java.util.concurrent.locks.AbstractQueuedSynchronizer$ConditionObject)
        at java.util.concurrent.locks.LockSupport.park(LockSupport.java:186)
        at 
java.util.concurrent.locks.AbstractQueuedSynchronizer$ConditionObject.await(AbstractQueuedSynchronizer.java:2043)
        at 
java.util.concurrent.LinkedBlockingQueue.take(LinkedBlockingQueue.java:386)
        at org.apache.hadoop.ipc.Server$Handler.run(Server.java:1817)
"IPC Server listener on 32868" daemon prio=10 tid=0x00007fc9ec3eb000 nid=0x3599 
runnable [0x00007fc9e8ffe000]
   java.lang.Thread.State: RUNNABLE
        at sun.nio.ch.EPollArrayWrapper.epollWait(Native Method)
        at sun.nio.ch.EPollArrayWrapper.poll(EPollArrayWrapper.java:228)
        at sun.nio.ch.EPollSelectorImpl.doSelect(EPollSelectorImpl.java:83)
        at sun.nio.ch.SelectorImpl.lockAndDoSelect(SelectorImpl.java:87)
        - locked <0x00000000ebaf2800> (a sun.nio.ch.Util$1)
        - locked <0x00000000ebaf27f0> (a java.util.Collections$UnmodifiableSet)
        - locked <0x00000000ebaf2380> (a sun.nio.ch.EPollSelectorImpl)
        at sun.nio.ch.SelectorImpl.select(SelectorImpl.java:98)
        at sun.nio.ch.SelectorImpl.select(SelectorImpl.java:102)
        at org.apache.hadoop.ipc.Server$Listener.run(Server.java:678)
"IPC Server Responder" daemon prio=10 tid=0x00007fc9ec4bb000 nid=0x3598 
runnable [0x00007fc9f0172000]
   java.lang.Thread.State: RUNNABLE
        at sun.nio.ch.EPollArrayWrapper.epollWait(Native Method)
        at sun.nio.ch.EPollArrayWrapper.poll(EPollArrayWrapper.java:228)
        at sun.nio.ch.EPollSelectorImpl.doSelect(EPollSelectorImpl.java:83)
        at sun.nio.ch.SelectorImpl.lockAndDoSelect(SelectorImpl.java:87)
        - locked <0x00000000ebaf35f0> (a sun.nio.ch.Util$1)
        - locked <0x00000000ebaf35e0> (a java.util.Collections$UnmodifiableSet)
        - locked <0x00000000ebaf33c8> (a sun.nio.ch.EPollSelectorImpl)
        at sun.nio.ch.SelectorImpl.select(SelectorImpl.java:98)
        at org.apache.hadoop.ipc.Server$Responder.doRunLoop(Server.java:862)
        at org.apache.hadoop.ipc.Server$Responder.run(Server.java:845)
"Socket Reader #1 for port 32868" prio=10 tid=0x00007fc9ec44f000 nid=0x3597 
runnable [0x00007fc9f0273000]
   java.lang.Thread.State: RUNNABLE
        at sun.nio.ch.EPollArrayWrapper.epollWait(Native Method)
        at sun.nio.ch.EPollArrayWrapper.poll(EPollArrayWrapper.java:228)
        at sun.nio.ch.EPollSelectorImpl.doSelect(EPollSelectorImpl.java:83)
        at sun.nio.ch.SelectorImpl.lockAndDoSelect(SelectorImpl.java:87)
        - locked <0x00000000ebaf2ed8> (a sun.nio.ch.Util$1)
        - locked <0x00000000ebaf2ec8> (a java.util.Collections$UnmodifiableSet)
        - locked <0x00000000ebaf2cb0> (a sun.nio.ch.EPollSelectorImpl)
        at sun.nio.ch.SelectorImpl.select(SelectorImpl.java:98)
        at sun.nio.ch.SelectorImpl.select(SelectorImpl.java:102)
        at 
org.apache.hadoop.ipc.Server$Listener$Reader.doRunLoop(Server.java:565)
        - locked <0x00000000ebaf2a10> (a 
org.apache.hadoop.ipc.Server$Listener$Reader)
        at org.apache.hadoop.ipc.Server$Listener$Reader.run(Server.java:551)
"Low Memory Detector" daemon prio=10 tid=0x00007fc9ec099800 nid=0x3595 runnable 
[0x0000000000000000]
   java.lang.Thread.State: RUNNABLE
"C2 CompilerThread1" daemon prio=10 tid=0x00007fc9ec097800 nid=0x3594 waiting 
on condition [0x0000000000000000]
   java.lang.Thread.State: RUNNABLE
"C2 CompilerThread0" daemon prio=10 tid=0x00007fc9ec094800 nid=0x3593 waiting 
on condition [0x0000000000000000]
   java.lang.Thread.State: RUNNABLE
"Signal Dispatcher" daemon prio=10 tid=0x00007fc9ec086800 nid=0x3592 waiting on 
condition [0x0000000000000000]
   java.lang.Thread.State: RUNNABLE
"Finalizer" daemon prio=10 tid=0x00007fc9ec074800 nid=0x3591 in Object.wait() 
[0x00007fc9f1430000]
   java.lang.Thread.State: WAITING (on object monitor)
        at java.lang.Object.wait(Native Method)
        - waiting on <0x00000000ebaf5d40> (a java.lang.ref.ReferenceQueue$Lock)
        at java.lang.ref.ReferenceQueue.remove(ReferenceQueue.java:133)
        - locked <0x00000000ebaf5d40> (a java.lang.ref.ReferenceQueue$Lock)
        at java.lang.ref.ReferenceQueue.remove(ReferenceQueue.java:149)
        at java.lang.ref.Finalizer$FinalizerThread.run(Finalizer.java:177)
"Reference Handler" daemon prio=10 tid=0x00007fc9ec072800 nid=0x3590 in 
Object.wait() [0x00007fc9f1531000]
   java.lang.Thread.State: WAITING (on object monitor)
        at java.lang.Object.wait(Native Method)
        - waiting on <0x00000000ebaf5d70> (a java.lang.ref.Reference$Lock)
        at java.lang.Object.wait(Object.java:502)
        at java.lang.ref.Reference$ReferenceHandler.run(Reference.java:133)
        - locked <0x00000000ebaf5d70> (a java.lang.ref.Reference$Lock)
"main" prio=10 tid=0x00007fc9ec008000 nid=0x358c runnable [0x00007fc9f5369000]
   java.lang.Thread.State: RUNNABLE
        at sun.nio.ch.EPollArrayWrapper.epollWait(Native Method)
        at sun.nio.ch.EPollArrayWrapper.poll(EPollArrayWrapper.java:228)
        at sun.nio.ch.EPollSelectorImpl.doSelect(EPollSelectorImpl.java:83)
        at sun.nio.ch.SelectorImpl.lockAndDoSelect(SelectorImpl.java:87)
        - locked <0x00000000eab2e198> (a sun.nio.ch.Util$1)
        - locked <0x00000000eab2e188> (a java.util.Collections$UnmodifiableSet)
        - locked <0x00000000eab2df80> (a sun.nio.ch.EPollSelectorImpl)
        at sun.nio.ch.SelectorImpl.select(SelectorImpl.java:98)
        at 
org.apache.hadoop.net.SocketIOWithTimeout$SelectorPool.select(SocketIOWithTimeout.java:335)
        at 
org.apache.hadoop.net.SocketIOWithTimeout.connect(SocketIOWithTimeout.java:203)
        at org.apache.hadoop.net.NetUtils.connect(NetUtils.java:530)
        at org.apache.hadoop.net.NetUtils.connect(NetUtils.java:494)
        at 
org.apache.hadoop.ipc.Client$Connection.setupConnection(Client.java:512)
        - locked <0x00000000ebaf63d8> (a 
org.apache.hadoop.ipc.Client$Connection)
        at 
org.apache.hadoop.ipc.Client$Connection.setupIOstreams(Client.java:607)
        - locked <0x00000000ebaf63d8> (a 
org.apache.hadoop.ipc.Client$Connection)
        at org.apache.hadoop.ipc.Client$Connection.access$2100(Client.java:255)
        at org.apache.hadoop.ipc.Client.getConnection(Client.java:1356)
        at org.apache.hadoop.ipc.Client.call(Client.java:1274)
        at org.apache.hadoop.ipc.Client.call(Client.java:1255)
        at 
org.apache.hadoop.ipc.WritableRpcEngine$Invoker.invoke(WritableRpcEngine.java:231)
        at sun.proxy.$Proxy9.ping(Unknown Source)
        at 
org.apache.hadoop.yarn.server.nodemanager.TestNMAuditLogger.testNMAuditLoggerWithIP(TestNMAuditLogger.java:219)
        at sun.reflect.NativeMethodAccessorImpl.invoke0(Native Method)
        at 
sun.reflect.NativeMethodAccessorImpl.invoke(NativeMethodAccessorImpl.java:57)
        at 
sun.reflect.DelegatingMethodAccessorImpl.invoke(DelegatingMethodAccessorImpl.java:43)
        at java.lang.reflect.Method.invoke(Method.java:616)
        at 
org.junit.runners.model.FrameworkMethod$1.runReflectiveCall(FrameworkMethod.java:44)
        at 
org.junit.internal.runners.model.ReflectiveCallable.run(ReflectiveCallable.java:15)
        at 
org.junit.runners.model.FrameworkMethod.invokeExplosively(FrameworkMethod.java:41)
        at 
org.junit.internal.runners.statements.InvokeMethod.evaluate(InvokeMethod.java:20)
        at 
org.junit.internal.runners.statements.RunBefores.evaluate(RunBefores.java:28)
        at 
org.junit.runners.BlockJUnit4ClassRunner.runNotIgnored(BlockJUnit4ClassRunner.java:79)
        at 
org.junit.runners.BlockJUnit4ClassRunner.runChild(BlockJUnit4ClassRunner.java:71)
        at 
org.junit.runners.BlockJUnit4ClassRunner.runChild(BlockJUnit4ClassRunner.java:49)
        at org.junit.runners.ParentRunner$3.run(ParentRunner.java:193)
        at org.junit.runners.ParentRunner$1.schedule(ParentRunner.java:52)
        at org.junit.runners.ParentRunner.runChildren(ParentRunner.java:191)
        at org.junit.runners.ParentRunner.access$000(ParentRunner.java:42)
        at org.junit.runners.ParentRunner$2.evaluate(ParentRunner.java:184)
        at org.junit.runners.ParentRunner.run(ParentRunner.java:236)
        at 
org.apache.maven.surefire.junit4.JUnit4Provider.execute(JUnit4Provider.java:252)
        at 
org.apache.maven.surefire.junit4.JUnit4Provider.executeTestSet(JUnit4Provider.java:141)
        at 
org.apache.maven.surefire.junit4.JUnit4Provider.invoke(JUnit4Provider.java:112)
        at sun.reflect.NativeMethodAccessorImpl.invoke0(Native Method)
        at 
sun.reflect.NativeMethodAccessorImpl.invoke(NativeMethodAccessorImpl.java:57)
        at 
sun.reflect.DelegatingMethodAccessorImpl.invoke(DelegatingMethodAccessorImpl.java:43)
        at java.lang.reflect.Method.invoke(Method.java:616)
        at 
org.apache.maven.surefire.util.ReflectionUtils.invokeMethodWithArray(ReflectionUtils.java:189)
        at 
org.apache.maven.surefire.booter.ProviderFactory$ProviderProxy.invoke(ProviderFactory.java:165)
        at 
org.apache.maven.surefire.booter.ProviderFactory.invokeProvider(ProviderFactory.java:85)
        at 
org.apache.maven.surefire.booter.ForkedBooter.runSuitesInProcess(ForkedBooter.java:115)
        at 
org.apache.maven.surefire.booter.ForkedBooter.main(ForkedBooter.java:75)
"VM Thread" prio=10 tid=0x00007fc9ec06d800 nid=0x358f runnable 
"GC task thread#0 (ParallelGC)" prio=10 tid=0x00007fc9ec013000 nid=0x358d 
runnable 
"GC task thread#1 (ParallelGC)" prio=10 tid=0x00007fc9ec015000 nid=0x358e 
runnable 
"VM Periodic Task Thread" prio=10 tid=0x00007fc9ec09c000 nid=0x3596 waiting on 
condition 
JNI global references: 1016

{code}
                
> TestNMAuditLogger hang
> ----------------------
>
>                 Key: YARN-687
>                 URL: https://issues.apache.org/jira/browse/YARN-687
>             Project: Hadoop YARN
>          Issue Type: Bug
>          Components: nodemanager
>    Affects Versions: 3.0.0
>         Environment: Linux stevel-dev 3.2.0-24-virtual #39-Ubuntu SMP Mon May 
> 21 18:44:18 UTC 2012 x86_64 x86_64 x86_64 GNU/Linux
> java version "1.6.0_27"
> OpenJDK Runtime Environment (IcedTea6 1.12.3) (6b27-1.12.3-0ubuntu1~12.04.1)
> OpenJDK 64-Bit Server VM (build 20.0-b12, mixed mode)
>            Reporter: Steve Loughran
>            Priority: Minor
>
> TestNMAuditLogger hangs repeatedly on a test VM.

--
This message is automatically generated by JIRA.
If you think it was sent incorrectly, please contact your JIRA administrators.
For more information on JIRA, see: http://www.atlassian.com/software/jira

Reply via email to