You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@systemml.apache.org by ni...@apache.org on 2018/02/01 05:39:26 UTC
systemml git commit: [SYSTEMML-445] Guard JCudaKernels with sysml.gpu.sync.postProcess flag
Repository: systemml
Updated Branches:
refs/heads/master f69047ea4 -> 5da8132ea
[SYSTEMML-445] Guard JCudaKernels with sysml.gpu.sync.postProcess flag
Project: http://git-wip-us.apache.org/repos/asf/systemml/repo
Commit: http://git-wip-us.apache.org/repos/asf/systemml/commit/5da8132e
Tree: http://git-wip-us.apache.org/repos/asf/systemml/tree/5da8132e
Diff: http://git-wip-us.apache.org/repos/asf/systemml/diff/5da8132e
Branch: refs/heads/master
Commit: 5da8132ea8c165d6d1a65c2c293fc87aaa15a2a3
Parents: f69047e
Author: Niketan Pansare <np...@us.ibm.com>
Authored: Wed Jan 31 21:38:29 2018 -0800
Committer: Niketan Pansare <np...@us.ibm.com>
Committed: Wed Jan 31 21:38:29 2018 -0800
----------------------------------------------------------------------
.../sysml/runtime/instructions/gpu/context/JCudaKernels.java | 4 +++-
1 file changed, 3 insertions(+), 1 deletion(-)
----------------------------------------------------------------------
http://git-wip-us.apache.org/repos/asf/systemml/blob/5da8132e/src/main/java/org/apache/sysml/runtime/instructions/gpu/context/JCudaKernels.java
----------------------------------------------------------------------
diff --git a/src/main/java/org/apache/sysml/runtime/instructions/gpu/context/JCudaKernels.java b/src/main/java/org/apache/sysml/runtime/instructions/gpu/context/JCudaKernels.java
index d22110d..181b08d 100644
--- a/src/main/java/org/apache/sysml/runtime/instructions/gpu/context/JCudaKernels.java
+++ b/src/main/java/org/apache/sysml/runtime/instructions/gpu/context/JCudaKernels.java
@@ -27,6 +27,7 @@ import java.io.IOException;
import java.io.InputStream;
import java.util.HashMap;
+import org.apache.sysml.api.DMLScript;
import org.apache.sysml.runtime.DMLRuntimeException;
import org.apache.sysml.runtime.io.IOUtilFunctions;
import org.apache.sysml.runtime.matrix.data.LibMatrixCUDA;
@@ -110,7 +111,8 @@ public class JCudaKernels {
checkResult(cuLaunchKernel(function, config.gridDimX, config.gridDimY, config.gridDimZ, config.blockDimX,
config.blockDimY, config.blockDimZ, config.sharedMemBytes, config.stream, Pointer.to(kernelParams),
null));
- JCuda.cudaDeviceSynchronize();
+ if(DMLScript.SYNCHRONIZE_GPU)
+ JCuda.cudaDeviceSynchronize();
}
public static void checkResult(int cuResult) throws DMLRuntimeException {