Repository: incubator-systemml Updated Branches: refs/heads/master 2fa6141f3 -> b0fb707d2
[HOTFIX] Fixed the bias_add function for GPU. Metadata was being set incorrectly. Closes #338. Project: http://git-wip-us.apache.org/repos/asf/incubator-systemml/repo Commit: http://git-wip-us.apache.org/repos/asf/incubator-systemml/commit/b0fb707d Tree: http://git-wip-us.apache.org/repos/asf/incubator-systemml/tree/b0fb707d Diff: http://git-wip-us.apache.org/repos/asf/incubator-systemml/diff/b0fb707d Branch: refs/heads/master Commit: b0fb707d2b515da89b9c0577a279b5cd2ae3e47a Parents: 2fa6141 Author: Nakul Jindal <naku...@gmail.com> Authored: Mon Jan 9 17:06:15 2017 -0800 Committer: Niketan Pansare <npan...@us.ibm.com> Committed: Mon Jan 9 17:06:14 2017 -0800 ---------------------------------------------------------------------- .../sysml/runtime/instructions/gpu/ConvolutionGPUInstruction.java | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) ---------------------------------------------------------------------- http://git-wip-us.apache.org/repos/asf/incubator-systemml/blob/b0fb707d/src/main/java/org/apache/sysml/runtime/instructions/gpu/ConvolutionGPUInstruction.java ---------------------------------------------------------------------- diff --git a/src/main/java/org/apache/sysml/runtime/instructions/gpu/ConvolutionGPUInstruction.java b/src/main/java/org/apache/sysml/runtime/instructions/gpu/ConvolutionGPUInstruction.java index 1a5f3de..67efa8b 100644 --- a/src/main/java/org/apache/sysml/runtime/instructions/gpu/ConvolutionGPUInstruction.java +++ b/src/main/java/org/apache/sysml/runtime/instructions/gpu/ConvolutionGPUInstruction.java @@ -146,8 +146,8 @@ public class ConvolutionGPUInstruction extends GPUInstruction MatrixObject input = ec.getMatrixInputForGPUInstruction(_input1.getName()); MatrixObject bias = ec.getMatrixInputForGPUInstruction(_input2.getName()); - MatrixObject out = ec.getDenseMatrixOutputForGPUInstruction(_output.getName()); ec.setMetaData(_output.getName(), input.getNumRows(), input.getNumColumns()); + MatrixObject out = 
ec.getDenseMatrixOutputForGPUInstruction(_output.getName()); LibMatrixCUDA.bias_add(input, bias, out); // release inputs/outputs ec.releaseMatrixInputForGPUInstruction(_input1.getName());