arma-thesis

git clone https://git.igankevich.com/arma-thesis.git
Log | Files | Refs | LICENSE

commit fee2baa5c4f6535bb03a738cc2baa1ff9527fe04
parent 511d33ca409b340799fd7e3715daf5f61face8ff
Author: Ivan Gankevich <igankevich@ya.ru>
Date:   Tue, 15 Aug 2017 14:28:50 +0300

Update to the latest benchmark repository revision.

Diffstat:
R/benchmarks.R  | 18 ++++++------------
arma-thesis.org | 11 +++++++++--
2 files changed, 15 insertions(+), 14 deletions(-)

diff --git a/R/benchmarks.R b/R/benchmarks.R
@@ -10,12 +10,9 @@ arma.load_benchmark_data <- function(attempt, framework, models, tags) {
  idx <- 1
  for (t in tags) {
  values <- arma.load(
- file.path("build", "arma-benchmarks", "output"),
- "gpulab1",
- attempt,
- 10000,
- framework,
- m,
+ file.path(
+ "build", "arma-benchmarks", "output",
+ "gpulab1", attempt, 10000, framework, m),
  t,
  ".*\\s+([0-9]+)us.*"
  )
@@ -70,12 +67,9 @@ arma.load_io_benchmark_data <- function(attempt, filesystems, suffix, tags) {
  idx <- 1
  for (t in tags) {
  values <- arma.load(
- file.path("build", "arma-benchmarks", "output"),
- "gpulab1",
- paste(attempt, fs, suffix, sep="-"),
- 10000,
- "openmp",
- "ar",
+ file.path(
+ "build", "arma-benchmarks", "output", "gpulab1",
+ paste(attempt, fs, suffix, sep="-"), 10000, "openmp", "ar"),
  t,
  ".*\\s+([0-9]+)us.*"
  )
diff --git a/arma-thesis.org b/arma-thesis.org
@@ -1205,7 +1205,7 @@ fi
 cd $dir
 git checkout master
 git pull
-git checkout 908739d3a21354b86b5397619deca26c84355fb6
+git checkout 1ed6679387f0b79d8495c8bf55a6b0b304347e48
 #+end_src
 
 #+RESULTS:
@@ -3603,6 +3603,7 @@ model CPU architecture is superior compared to GPU due to better handling of
 complex information dependencies, non-intensive calculations (multiplications
 and additions) and complex memory access patterns.
 
+#+header :results output raw :exports results
 #+name: tab-arma-performance
 #+begin_src R
 source(file.path("R", "benchmarks.R"))
@@ -3673,6 +3674,11 @@ possibility to optimise this routine is to use root finding method with
 quadratic convergence rate to reduce the number of transcendental functions that
 need to be computed.
 
+**** I/O performance.
+:PROPERTIES:
+:header-args:R: :results output raw :exports results
+:END:
+
 Although, in the current benchmarks writing data to files does not consume much
 of the running time, the use of network-mounted file systems may slow down this
 stage. To optimise it wavy surface parts were written to file as soon as full
@@ -3687,6 +3693,7 @@ computation so the total running time is decreased
 system has the same effect, but the total reduction in execution time is small,
 because local file system is more performant.
 
+#+header :results output raw :exports results
 #+name: tab-arma-io-performance
 #+begin_src R
 source(file.path("R", "benchmarks.R"))
@@ -3765,7 +3772,7 @@ wavy surface.
 
 In order to investigate, how GPGPU computations can be used to speed-up velocity
 potential field computation, we benchmarked simplified version of
-eq.\nbsp{}eqref:phi-3d:
+eq.\nbsp{}eqref:eq-phi-3d:
 \begin{align}
 \label{eq:phi-linear}
 \phi(x,y,z,t) &= \InverseFourierY{