summaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
authorpsychocrypt <psychocrypt@users.noreply.github.com>2017-12-03 14:55:04 +0100
committerpsychocrypt <psychocrypt@users.noreply.github.com>2017-12-03 14:55:04 +0100
commitcfe64725f063b63eafbeeef7e57cad7448cb3d15 (patch)
treedc5cd5b9f4bd1cb98e51e163b85e78cfad4edc67
parentd10d20f1132a3c5d6dc51ed22a0381e460b579e8 (diff)
downloadxmr-stak-cfe64725f063b63eafbeeef7e57cad7448cb3d15.zip
xmr-stak-cfe64725f063b63eafbeeef7e57cad7448cb3d15.tar.gz
set `strided_index = true` as default
Change the default for strided index. User feedback shows that `strided_index = true` gives a few more hashes per second.
-rw-r--r--doc/tuning.md2
-rw-r--r--xmrstak/backend/amd/autoAdjust.hpp2
-rw-r--r--xmrstak/backend/amd/config.tpl4
3 files changed, 4 insertions, 4 deletions
diff --git a/doc/tuning.md b/doc/tuning.md
index 25c5065..8eeefcb 100644
--- a/doc/tuning.md
+++ b/doc/tuning.md
@@ -86,4 +86,4 @@ export GPU_SINGLE_ALLOC_PERCENT=99
### Scratchpad Indexing
The layout of the hash scratchpad memory can be changed for each GPU with the option `strided_index` in `amd.txt`.
-Try to change the value from the default `false` to `true`.
+Try to change the value from the default `true` to `false`.
diff --git a/xmrstak/backend/amd/autoAdjust.hpp b/xmrstak/backend/amd/autoAdjust.hpp
index 0abf84e..0bc5239 100644
--- a/xmrstak/backend/amd/autoAdjust.hpp
+++ b/xmrstak/backend/amd/autoAdjust.hpp
@@ -123,7 +123,7 @@ private:
// set 8 threads per block (this is a good value for the most gpus)
conf += std::string(" { \"index\" : ") + std::to_string(ctx.deviceIdx) + ",\n" +
" \"intensity\" : " + std::to_string(intensity) + ", \"worksize\" : " + std::to_string(8) + ",\n" +
- " \"affine_to_cpu\" : false, \"strided_index\" : false\n"
+ " \"affine_to_cpu\" : false, \"strided_index\" : true\n"
" },\n";
++i;
}
diff --git a/xmrstak/backend/amd/config.tpl b/xmrstak/backend/amd/config.tpl
index f31a678..af662f8 100644
--- a/xmrstak/backend/amd/config.tpl
+++ b/xmrstak/backend/amd/config.tpl
@@ -6,11 +6,11 @@ R"===(
* worksize - Number of local GPU threads (nothing to do with CPU threads)
* affine_to_cpu - This will affine the thread to a CPU. This can make a GPU miner play along nicer with a CPU miner.
* strided_index - switch memory pattern used for the scratch pad memory
- * false = use a contiguous block of memory per thread
* true = use 16byte contiguous memory per thread, the next memory block has offset of intensity blocks
+ * false = use a contiguous block of memory per thread
* "gpu_threads_conf" :
* [
- * { "index" : 0, "intensity" : 1000, "worksize" : 8, "affine_to_cpu" : false, "strided_index" : false },
+ * { "index" : 0, "intensity" : 1000, "worksize" : 8, "affine_to_cpu" : false, "strided_index" : true },
* ],
*/
OpenPOWER on IntegriCloud