This is an automated email from the ASF dual-hosted git repository.
jhung pushed a change to branch YARN-8200
in repository https://gitbox.apache.org/repos/asf/hadoop.git.
from 14dc25e YARN-7033. Add support for NM Recovery of assigned resources
(e.g. GPUs, NUMA, FPGAs) to container. (Devaraj K and Wangda Tan)
new e9ce716 Partial commit of YARN-7224 to get GpuDevice class and changes
new 1f2e67b YARN-7330. Add support to show GPU in UI including metrics.
Contributed by Wangda Tan.
new e4268da YARN-7345. GPU Isolation: Incorrect minor device numbers
written to devices.deny file. (Jonathan Hung via wangda)
new b69e841 YARN-7573. Gpu Information page could be empty for nodes
without GPU. (Sunil G via wangda)
new c9d0000 YARN-7637. GPU volume creation command fails when work
preserving is disabled at NM. Contributed by Zian Chen.
new c3e4d9f YARN-7594. TestNMWebServices#testGetNMResourceInfo fails on
trunk. Contributed by Gergely Novák.
new 0330369 YARN-9175. Null resources check in ResourceInfo for branch-3.0
new e4ede15 YARN-7143. FileNotFound handling in ResourceUtils is
inconsistent
new f76f2cf YARN-7383. Node resource is not parsed correctly for resource
names containing dot. Contributed by Gergely Novák.
The 9 revisions listed above as "new" are entirely new to this
repository and will be described in separate emails. The revisions
listed as "add" were already present in the repository and have only
been added to this reference.
Summary of changes:
.../hadoop-yarn/dev-support/findbugs-exclude.xml | 8 +
.../apache/hadoop/yarn/api/records/Resource.java | 20 +++
.../hadoop/yarn/util/resource/ResourceUtils.java | 61 +++----
.../yarn/util/resource/TestResourceUtils.java | 5 +-
.../resources/resource-types/node-resources-2.xml | 5 +
.../resources/resource-types/resource-types-4.xml | 7 +-
.../nodemanager/DockerContainerExecutor.java | 2 +-
.../container/ResourceMappings.java | 2 +-
.../linux/resources/gpu/GpuResourceAllocator.java | 119 +++++++------
.../resources/gpu/GpuResourceHandlerImpl.java | 27 +--
.../resourceplugin/ResourcePlugin.java | 11 ++
.../resourceplugin/gpu/AssignedGpuDevice.java | 83 +++++++++
.../resourceplugin/gpu/GpuDevice.java | 82 +++++++++
.../resourceplugin/gpu/GpuDiscoverer.java | 30 ++--
.../gpu/GpuNodeResourceUpdateHandler.java | 10 +-
.../resourceplugin/gpu/GpuResourcePlugin.java | 24 ++-
.../recovery/NMLeveldbStateStoreService.java | 68 ++++----
.../recovery/NMNullStateStoreService.java | 6 +-
.../nodemanager/recovery/NMStateStoreService.java | 17 +-
.../server/nodemanager/webapp/NMWebServices.java | 25 +++
.../nodemanager/webapp/dao/NMResourceInfo.java} | 14 +-
.../webapp/dao/gpu/GpuDeviceInformation.java | 2 +-
.../webapp/dao/gpu/NMGpuResourceInfo.java | 80 +++++++++
.../webapp/dao/gpu/PerGpuDeviceInformation.java | 2 +-
.../webapp/dao/gpu/PerGpuMemoryUsage.java | 2 +-
.../impl/modules/gpu/gpu-module.c | 2 +-
.../test/modules/gpu/test-gpu-module.cc | 13 ++
.../TestDockerContainerExecutorWithMocks.java | 2 +-
.../TestContainerManagerRecovery.java | 15 +-
.../resources/gpu/TestGpuResourceHandler.java | 194 +++++++++++++++------
.../resourceplugin/gpu/TestGpuDiscoverer.java | 34 +++-
.../recovery/NMMemoryStateStoreService.java | 10 +-
.../recovery/TestNMLeveldbStateStoreService.java | 28 ++-
.../nodemanager/webapp/TestNMWebServices.java | 175 +++++++++++++++----
.../dao/gpu/TestGpuDeviceInformationParser.java | 2 +-
.../resourcemanager/webapp/dao/ResourceInfo.java | 5 +-
.../app/adapters/{yarn-node.js => yarn-nm-gpu.js} | 4 +-
.../src/main/webapp/app/components/donut-chart.js | 20 ++-
.../main/webapp/app/components/gpu-donut-chart.js | 66 +++++++
.../src/main/webapp/app/constants.js | 13 ++
.../webapp/app/controllers/yarn-nodes/table.js | 2 +-
.../src/main/webapp/app/models/cluster-metric.js | 69 ++++++++
.../app/models/{yarn-entity.js => yarn-nm-gpu.js} | 9 +-
.../webapp/app/models/yarn-queue/capacity-queue.js | 3 +-
.../src/main/webapp/app/models/yarn-rm-node.js | 37 ++++
.../hadoop-yarn-ui/src/main/webapp/app/router.js | 5 +-
.../src/main/webapp/app/routes/cluster-overview.js | 2 +-
.../src/main/webapp/app/routes/yarn-node.js | 2 +
.../table.js => yarn-node/yarn-nm-gpu.js} | 0
.../{yarn-container-log.js => yarn-nm-gpu.js} | 25 +--
.../app/serializers/yarn-queue/capacity-queue.js | 1 +
.../main/webapp/app/serializers/yarn-rm-node.js | 4 +-
.../main/webapp/app/templates/cluster-overview.hbs | 88 +++++++---
.../app/templates/components/node-menu-panel.hbs | 10 +-
.../app/templates/components/yarn-nm-gpu-info.hbs | 69 ++++++++
.../main/webapp/app/templates/yarn-node-apps.hbs | 2 +-
.../webapp/app/templates/yarn-node-containers.hbs | 2 +-
.../src/main/webapp/app/templates/yarn-node.hbs | 125 -------------
.../main/webapp/app/templates/yarn-node/info.hbs | 154 ++++++++++++++++
.../yarn-nm-gpu.hbs} | 52 +++---
.../src/main/webapp/app/utils/converter.js | 51 ++++++
61 files changed, 1516 insertions(+), 491 deletions(-)
create mode 100644
hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-nodemanager/src/main/java/org/apache/hadoop/yarn/server/nodemanager/containermanager/resourceplugin/gpu/AssignedGpuDevice.java
create mode 100644
hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-nodemanager/src/main/java/org/apache/hadoop/yarn/server/nodemanager/containermanager/resourceplugin/gpu/GpuDevice.java
copy
hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/{hadoop-yarn-server-resourcemanager/src/main/java/org/apache/hadoop/yarn/server/resourcemanager/webapp/dao/ReservationDeleteResponseInfo.java
=>
hadoop-yarn-server-nodemanager/src/main/java/org/apache/hadoop/yarn/server/nodemanager/webapp/dao/NMResourceInfo.java}
(77%)
create mode 100644
hadoop-yarn-project/hadoop-yarn/hadoop-yarn-server/hadoop-yarn-server-nodemanager/src/main/java/org/apache/hadoop/yarn/server/nodemanager/webapp/dao/gpu/NMGpuResourceInfo.java
copy
hadoop-yarn-project/hadoop-yarn/hadoop-yarn-ui/src/main/webapp/app/adapters/{yarn-node.js
=> yarn-nm-gpu.js} (93%)
create mode 100644
hadoop-yarn-project/hadoop-yarn/hadoop-yarn-ui/src/main/webapp/app/components/gpu-donut-chart.js
copy
hadoop-yarn-project/hadoop-yarn/hadoop-yarn-ui/src/main/webapp/app/models/{yarn-entity.js
=> yarn-nm-gpu.js} (88%)
copy
hadoop-yarn-project/hadoop-yarn/hadoop-yarn-ui/src/main/webapp/app/routes/{yarn-nodes/table.js
=> yarn-node/yarn-nm-gpu.js} (100%)
copy
hadoop-yarn-project/hadoop-yarn/hadoop-yarn-ui/src/main/webapp/app/serializers/{yarn-container-log.js
=> yarn-nm-gpu.js} (73%)
create mode 100644
hadoop-yarn-project/hadoop-yarn/hadoop-yarn-ui/src/main/webapp/app/templates/components/yarn-nm-gpu-info.hbs
delete mode 100644
hadoop-yarn-project/hadoop-yarn/hadoop-yarn-ui/src/main/webapp/app/templates/yarn-node.hbs
create mode 100644
hadoop-yarn-project/hadoop-yarn/hadoop-yarn-ui/src/main/webapp/app/templates/yarn-node/info.hbs
copy
hadoop-yarn-project/hadoop-yarn/hadoop-yarn-ui/src/main/webapp/app/templates/{yarn-node-apps.hbs
=> yarn-node/yarn-nm-gpu.hbs} (50%)
---------------------------------------------------------------------
To unsubscribe, e-mail: common-commits-unsubscribe@hadoop.apache.org
For additional commands, e-mail: common-commits-help@hadoop.apache.org