[ https://issues.apache.org/jira/browse/SLIDER-1034?page=com.atlassian.jira.plugin.system.issuetabpanels:comment-tabpanel&focusedCommentId=15117694#comment-15117694 ]
Steve Loughran commented on SLIDER-1034: ---------------------------------------- Seen again, locally. {code} Failed tests: TestAgentAAEcho.testAgentEcho:88->postLaunchActions:186 assert cd.getRoleOptInt(rolename, RoleKeys.ROLE_PENDING_AA_INSTANCES, -1) == 0 | | | | | | 49 echo role.pending.aa.instances false { "version" : "1.0", "name" : "testagentaaecho", "type" : "agent", "state" : 3, "createTime" : 1453828499575, "updateTime" : 1453828520462, "originConfigurationPath" : "file:/Users/stevel/.slider/cluster/testagentaaecho/snapshot", "generatedConfigurationPath" : "file:/Users/stevel/.slider/cluster/testagentaaecho/generated", "dataPath" : "file:/Users/stevel/.slider/cluster/testagentaaecho/database", "options" : { "site.global.security_enabled" : "false", "internal.appdef.dir.path" : "file:/Users/stevel/.slider/cluster/testagentaaecho/tmp/appdef", "internal.application.home" : "/", "agent.package.root" : "/Users/stevel/Projects/Hortonworks/Projects/slider/slider-core/./src/test/python", "slider.cluster.directory.permissions" : "0770", "application.name" : "testagentaaecho", "internal.addons.dir.path" : "file:/Users/stevel/.slider/cluster/testagentaaecho/tmp/addons", "internal.tmp.dir" : "file:/Users/stevel/.slider/cluster/testagentaaecho/tmp", "internal.snapshot.conf.path" : "file:/Users/stevel/.slider/cluster/testagentaaecho/snapshot", "env.MALLOC_ARENA_MAX" : "4", "zookeeper.path" : "/services/slider/users/stevel/testagentaaecho", "internal.container.failure.shortlife" : "60000", "internal.application.image.path" : null, "internal.generated.conf.path" : "file:/Users/stevel/.slider/cluster/testagentaaecho/generated", "site.fs.default.name" : "file:///", "agent.version" : "file:/Users/stevel/Projects/Hortonworks/Projects/slider/slider-core/./src/test/python/version", "agent.conf" : "file:/Users/stevel/Projects/Hortonworks/Projects/slider/slider-core/./src/test/python/agent.ini", "zookeeper.hosts" : "localhost", "internal.provider.name" : "agent", 
"internal.data.dir.path" : "file:/Users/stevel/.slider/cluster/testagentaaecho/database", "site.fs.defaultFS" : "file:///", "slider.data.directory.permissions" : "0770", "zookeeper.quorum" : "localhost:63451", "internal.am.tmp.dir" : "file:/Users/stevel/.slider/cluster/testagentaaecho/tmp/appmaster", "internal.container.failure.threshold" : "5", "application.def" : "file:/private/var/folders/57/xyts0qt105z1f1k0twk6rd8m0000gq/T/junit8871531317671442911/testpkg/appdef_1.zip" }, "info" : { "info.am.container.id" : "container_1453828488505_0001_01_000001", "info.am.rpc.port" : "1026", "info.am.attempt.id" : "appattempt_1453828488505_0001_000001", "yarn.memory" : "8192", "info.am.web.port" : "1027", "info.am.web.url" : "http://stevel-2.local:1027/", "info.am.app.id" : "application_1453828488505_0001", "yarn.vcores" : "1", "info.am.hostname" : "stevel-2.local", "status.application.build.info" : "Slider Core-0.90.0-incubating-SNAPSHOT Built against commit# 20198e2228 on Java 1.7.0_75 by stevel", "status.hadoop.build.info" : "2.6.0", "status.hadoop.deployed.info" : "branch-2.6.0 @18e43357c8f927c0695f1e9522859d6a", "live.time" : "26 Jan 2016 17:14:59 GMT", "live.time.millis" : "1453828499575", "create.time" : "26 Jan 2016 17:14:59 GMT", "create.time.millis" : "1453828499575", "containers.at.am-restart" : "0", "status.time" : "26 Jan 2016 17:15:20 GMT", "status.time.millis" : "1453828520462", "info.am.agent.status.url" : "https://stevel-2.local:63496/", "info.am.agent.status.port" : "63496", "info.am.agent.ops.url" : "https://stevel-2.local:63497/", "info.am.agent.ops.port" : "63497" }, "statistics" : { "slider-appmaster" : { "containers.unknown.completed" : 0, "containers.start.started" : 1, "containers.live" : 2, "containers.start.failed" : 0, "containers.failed" : 0, "containers.completed" : 0, "containers.surplus" : 0 }, "echo" : { "containers.failed.node" : 0, "containers.start.started" : 0, "containers.live" : 1, "containers.start.failed" : 0, 
"containers.failed.preempted" : 0, "containers.active.requests" : 0, "containers.failed.recently" : 0, "containers.failed" : 0, "containers.completed" : 0, "containers.anti-affine.pending" : 49, "containers.desired" : 1, "containers.requested" : 1 } }, "instances" : { "slider-appmaster" : [ "container_1453828488505_0001_01_000001" ], "echo" : [ "container_1453828488505_0001_01_000002" ] }, "roles" : { "slider-appmaster" : { "role.failed.recently.instances" : "0", "yarn.memory" : "1024", "role.requested.instances" : "0", "role.failed.starting.instances" : "0", "role.actual.instances" : "1", "yarn.vcores" : "1", "yarn.component.instances" : "1", "role.releasing.instances" : "0", "role.failed.node.instances" : "0", "role.failed.instances" : "0", "role.failed.preempted.instances" : "0" }, "echo" : { "role.failed.recently.instances" : "0", "yarn.component.placement.policy" : "4", "role.requested.instances" : "0", "test.relax.validation" : "true", "role.failed.starting.instances" : "0", "role.failed.node.instances" : "0", "role.failed.preempted.instances" : "0", "app.name" : "Agent", "yarn.role.priority" : "1", "role.actual.instances" : "1", "agent.script" : "echo.py", "yarn.component.instances" : "1", "role.releasing.instances" : "0", "role.failed.instances" : "0", "role.pending.aa.instances" : "49" } }, "clientProperties" : { }, "status" : { "live" : { "slider-appmaster" : { "container_1453828488505_0001_01_000001" : { "name" : "container_1453828488505_0001_01_000001", "role" : "slider-appmaster", "roleId" : 0, "createTime" : 1453828499591, "startTime" : 1453828499591, "released" : false, "host" : "stevel-2.local", "hostUrl" : "http://stevel-2.local:1027", "state" : 3, "exitCode" : 0 } }, "echo" : { "container_1453828488505_0001_01_000002" : { "name" : "container_1453828488505_0001_01_000002", "role" : "echo", "roleId" : 1, "createTime" : 1453828502297, "startTime" : 1453828502350, "released" : false, "host" : "192.168.1.85", "hostUrl" : "http://192.168.1.85:63466", 
"state" : 3, "exitCode" : 0, "command" : "python /Users/stevel/Projects/Hortonworks/Projects/slider/slider-core/./src/test/python/agent/main.py --label container_1453828488505_0001_01_000002___echo --zk-quorum localhost:63451 --zk-reg-path /registry/users/stevel/services/org-apache-slider/testagentaaecho > <LOG_DIR>/slider-agent.out 2>&1 ; ", "environment" : [ "LANGUAGE=\"en_US.UTF-8\"", "AGENT_WORK_ROOT=\"$PWD\"", "HADOOP_USER_NAME=\"stevel\"", "AGENT_LOG_ROOT=\"<LOG_DIR>\"", "PYTHONPATH=\"./infra/agent/slider-agent/\"", "LC_ALL=\"en_US.UTF-8\"", "SLIDER_PASSPHRASE=\"rA3VdXwqjKGvKhr10XhjIj3k1uNDFroQbicQvlQi5d39aEe8UQ\"", "MALLOC_ARENA_MAX=\"4\"", "LANG=\"en_US.UTF-8\"" ] } } } }, "liveness" : { "allRequestsSatisfied" : true, "requestsOutstanding" : 0, "activeRequests" : 0 } } {code} > TestAgentAAEcho failed with #of pending instances == 49 > ------------------------------------------------------- > > Key: SLIDER-1034 > URL: https://issues.apache.org/jira/browse/SLIDER-1034 > Project: Slider > Issue Type: Bug > Components: appmaster, test > Affects Versions: Slider 0.90.2 > Environment: Jenkins > Reporter: Steve Loughran > Assignee: Steve Loughran > Fix For: Slider 0.91 > > Attachments: jenkins.txt > > > A transient Jenkins failure had an assertion failure: > {code} > assert cd.getRoleOptInt(rolename, RoleKeys.ROLE_PENDING_AA_INSTANCES, -1) == 0 > | | | | | > | 49 echo role.pending.aa.instances > false > {code} > And yes, that's what is in the JSON > {code} > "role.pending.aa.instances" : "49" > {code} > This hints at some race condition in the test, reporting, or appstate -- This message was sent by Atlassian JIRA (v6.3.4#6332)