diff --git a/Changelog b/Changelog index cd9fc43..bef2f8e 100644 --- a/Changelog +++ b/Changelog @@ -1,3 +1,5 @@ +1.3.0 +----- * Program binaries are now extracted during tuning and saved in the cache (see #8). This can also make tuning faster on systems that don't cache kernels. * Out-of-place scan is now supported (partially implements #12). * Workaround to avoid depending on OpenCL 1.2 ICD diff --git a/doc/benchmark/1.3.0/480gtx/uint-uint.txt b/doc/benchmark/1.3.0/480gtx/uint-uint.txt new file mode 100644 index 0000000..c8c3126 --- /dev/null +++ b/doc/benchmark/1.3.0/480gtx/uint-uint.txt @@ -0,0 +1,15 @@ +1000 1.94053 +2000 3.86824 +5000 9.60939 +10000 19.2169 +20000 38.1196 +50000 81.3429 +100000 146.165 +200000 238.164 +500000 289.491 +1000000 365.432 +2000000 393.618 +5000000 415.811 +10000000 427.707 +20000000 419.47 +50000000 436.53 diff --git a/doc/benchmark/1.3.0/480gtx/uint-void.txt b/doc/benchmark/1.3.0/480gtx/uint-void.txt new file mode 100644 index 0000000..13bca01 --- /dev/null +++ b/doc/benchmark/1.3.0/480gtx/uint-void.txt @@ -0,0 +1,15 @@ +1000 3.06639 +2000 6.14276 +5000 15.3448 +10000 30.2398 +20000 57.2744 +50000 125.785 +100000 197.697 +200000 295.1 +500000 432.951 +1000000 518.157 +2000000 582.318 +5000000 641.221 +10000000 660.685 +20000000 676.266 +50000000 679.02 diff --git a/doc/benchmark/1.3.0/480gtx/ulong-float4.txt b/doc/benchmark/1.3.0/480gtx/ulong-float4.txt new file mode 100644 index 0000000..e329e2c --- /dev/null +++ b/doc/benchmark/1.3.0/480gtx/ulong-float4.txt @@ -0,0 +1,13 @@ +1000 0.920758 +2000 1.84414 +5000 4.56342 +10000 8.9245 +20000 15.5165 +50000 31.3804 +100000 45.4368 +200000 67.7037 +500000 85.4646 +1000000 99.2464 +2000000 110.984 +5000000 120.795 +10000000 123.159 diff --git a/doc/benchmark/1.3.0/clogs-benchmark.svg b/doc/benchmark/1.3.0/clogs-benchmark.svg new file mode 100644 index 0000000..f25e449 --- /dev/null +++ b/doc/benchmark/1.3.0/clogs-benchmark.svg @@ -0,0 +1,298 @@ + + + + +Gnuplot +Produced by GNUPLOT 4.6 patchlevel 3 + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + 0 + + + + + + + 100 + + + + + + + 200 + + + + + + + 300 + + + + + + + 400 + + + + + + + 500 + + + + + + + 600 + + + + + + + 700 + + + 100 + + + 1000 + + + 10000 + + + 100000 + + + 1e+06 + + + 1e+07 + + + 1e+08 + + + MKeys/s + + + Elements + + + CLOGS sorting rate + + + gnuplot_plot_1 + + + 480 GTX / uint keys / no values + + + + + + + + + + + + + + + + + + + + gnuplot_plot_2 + + + 480 GTX / uint keys / uint values + + + + + + + + + + + + + + + + + + + + gnuplot_plot_3 + + + 480 GTX / ulong keys / float4 values + + + + + + + + + + + + + + + + + + gnuplot_plot_4 + + + R9 270 / uint keys / no values + + + + + + + + + + + + + + + + + + + + gnuplot_plot_5 + + + R9 270 / uint keys / uint values + + + + + + + + + + + + + + + + + + + + gnuplot_plot_6 + + + R9 270 / ulong keys / float4 values + + + + + + + + + + + + + + + + + + + + + + diff --git a/doc/benchmark/1.3.0/r9-270/uint-uint.txt b/doc/benchmark/1.3.0/r9-270/uint-uint.txt new file mode 100644 index 0000000..03069e2 --- /dev/null +++ b/doc/benchmark/1.3.0/r9-270/uint-uint.txt @@ -0,0 +1,15 @@ +1000 1.30802 +2000 3.14244 +5000 8.92085 +10000 16.8956 +20000 32.9922 +50000 56.161 +100000 103.771 +200000 162.871 +500000 248.038 +1000000 282.035 +2000000 318.303 +5000000 344.626 +10000000 351.477 +20000000 357.712 +50000000 361.265 diff --git a/doc/benchmark/1.3.0/r9-270/uint-void.txt b/doc/benchmark/1.3.0/r9-270/uint-void.txt new file mode 100644 index 0000000..8ecb4d8 --- /dev/null +++ b/doc/benchmark/1.3.0/r9-270/uint-void.txt @@ -0,0 +1,15 @@ +1000 1.3886 +2000 2.82567 +5000 7.4481 +10000 13.6512 +20000 28.5861 +50000 63.189 +100000 102.282 +200000 164.106 +500000 326.991 +1000000 447.178 +2000000 517.907 +5000000 595.438 +10000000 634.482 +20000000 649.966 +50000000 658.447 diff --git a/doc/benchmark/1.3.0/r9-270/ulong-float4.txt b/doc/benchmark/1.3.0/r9-270/ulong-float4.txt new file mode 100644 index 0000000..f640c3c --- /dev/null +++ b/doc/benchmark/1.3.0/r9-270/ulong-float4.txt @@ -0,0 +1,13 @@ +1000 1.17397 +2000 2.45197 +5000 6.14184 +10000 11.581 +20000 18.2669 +50000 32.5265 +100000 53.4161 +200000 67.9985 +500000 83.1411 +1000000 88.2147 +2000000 92.7467 +5000000 94.9689 +10000000 96.1383 diff --git a/doc/benchmark/clogs-benchmark-plot.sh b/doc/benchmark/clogs-benchmark-plot.sh index 884dcbf..ff4e1ec 100755 --- a/doc/benchmark/clogs-benchmark-plot.sh +++ b/doc/benchmark/clogs-benchmark-plot.sh @@ -20,4 +20,4 @@ # OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE # SOFTWARE. -gnuplot -e "in='1.2.4/'; out='1.2.4/clogs-benchmark.svg'" clogs-benchmark.plot +gnuplot -e "in='1.3.0/'; out='1.3.0/clogs-benchmark.svg'" clogs-benchmark.plot diff --git a/wscript b/wscript index a6f8fa4..96bf03b 100644 --- a/wscript +++ b/wscript @@ -27,7 +27,7 @@ from waflib.TaskGen import feature, after_method from waflib import Task APPNAME = 'clogs' -VERSION = '1.2.4' +VERSION = '1.3.0' out = 'build' variants = {