summary refs log tree commit diff stats
diff options
context:
space:
mode:
author Willem Jan Palenstijn <Willem.Jan.Palenstijn@cwi.nl> 2015-12-22 14:00:50 +0100
committer Willem Jan Palenstijn <Willem.Jan.Palenstijn@cwi.nl> 2015-12-22 14:00:50 +0100
commit c66e4b030467ddadac71e5bd4803737cf94c0a07 (patch)
tree 205133660d0cf6a9e4eb0ff509db176a44eaec2d
parent f1c4c523db55ad31f3cfb8f51113099654c62c00 (diff)
download astra-c66e4b030467ddadac71e5bd4803737cf94c0a07.tar.gz
astra-c66e4b030467ddadac71e5bd4803737cf94c0a07.tar.bz2
astra-c66e4b030467ddadac71e5bd4803737cf94c0a07.tar.xz
astra-c66e4b030467ddadac71e5bd4803737cf94c0a07.zip
Reduce FP3D CUDA kernel runtime
This reduces the chance of the Windows display driver watchdog triggering, and doesn't seem to hurt performance.
-rw-r--r-- cuda/3d/cone_fp.cu 2
-rw-r--r-- cuda/3d/par3d_fp.cu 2
2 files changed, 2 insertions, 2 deletions
diff --git a/cuda/3d/cone_fp.cu b/cuda/3d/cone_fp.cu
index b36d2bc..13b184f 100644
--- a/cuda/3d/cone_fp.cu
+++ b/cuda/3d/cone_fp.cu
@@ -49,7 +49,7 @@ namespace astraCUDA3d {
static const unsigned int g_anglesPerBlock = 4;
// thickness of the slices we're splitting the volume up into
-static const unsigned int g_blockSlices = 64;
+static const unsigned int g_blockSlices = 32;
static const unsigned int g_detBlockU = 32;
static const unsigned int g_detBlockV = 32;
diff --git a/cuda/3d/par3d_fp.cu b/cuda/3d/par3d_fp.cu
index b14c494..3ce3d42 100644
--- a/cuda/3d/par3d_fp.cu
+++ b/cuda/3d/par3d_fp.cu
@@ -49,7 +49,7 @@ namespace astraCUDA3d {
static const unsigned int g_anglesPerBlock = 4;
// thickness of the slices we're splitting the volume up into
-static const unsigned int g_blockSlices = 64;
+static const unsigned int g_blockSlices = 32;
static const unsigned int g_detBlockU = 32;
static const unsigned int g_detBlockV = 32;