about summary refs log tree commit diff
diff options
context:
space:
mode:
author Alon Zakai <alonzakai@gmail.com> 2011-11-04 11:54:27 -0700
committer Alon Zakai <alonzakai@gmail.com> 2011-11-04 11:54:27 -0700
commit d7abb60c3f6a69f182a62be4db52e18547914bd9 (patch)
tree 143cdf7f2b3d51d25c5137d0f8385f57b5f48cdc
parent 81607b331bc1dadd443a7b8799006f68c485b51c (diff)
optimize ta1 memcpy, and use ta1 in raytrace benchmark
-rw-r--r-- src/parseTools.js 31
-rw-r--r-- tests/runner.py 10
2 files changed, 22 insertions, 19 deletions
diff --git a/src/parseTools.js b/src/parseTools.js
index 44577491..96007489 100644
--- a/src/parseTools.js
+++ b/src/parseTools.js
@@ -802,7 +802,7 @@ function makeSetValue(ptr, pos, value, type, noNeedFirst, ignore) {
}
}
-var UNROLL_LOOP_LIMIT = 5;
+var UNROLL_LOOP_LIMIT = 8;
function makeSetValues(ptr, pos, value, type, num) {
function safety(where) {
@@ -854,25 +854,36 @@ function makeCopyValues(dest, src, num, type, modifier) {
from = from || (src + '+' + '$mcpi$');
return (SAFE_HEAP ? 'SAFE_HEAP_COPY_HISTORY(' + to + ', ' + from + ')' : '');
}
- if (USE_TYPED_ARRAYS in set(0, 1)) {
+ if (USE_TYPED_ARRAYS <= 1) {
if (isNumber(num)) {
if (num < UNROLL_LOOP_LIMIT) {
return range(num).map(function(i) {
return type !== 'null' ? makeSetValue(dest, i, makeGetValue(src, i, type) + (modifier || ''), type)
: // Null is special-cased: We copy over all heaps
makeGetSlabs(dest, 'null', true).map(function(slab) {
- return slab + '[' + dest + '+' + i + ']=' + slab + '[' + src + '+' + i + ']';
+ return slab + '[' + getFastValue(dest, '+', i) + ']=' + slab + '[' + getFastValue(src, '+', i) + ']';
}).join('; ') + '; ' + safety(dest + '+' + i, src + '+' + i)
}).join('; ');
}
}
- return 'for (var $mcpi$ = 0; $mcpi$ < ' + num + '; $mcpi$++) {\n' +
- (type !== 'null' ? makeSetValue(dest, '$mcpi$', makeGetValue(src, '$mcpi$', type) + (modifier || ''), type)
- : // Null is special-cased: We copy over all heaps
- makeGetSlabs(dest, 'null', true).map(function(slab) {
- return slab + '[' + dest + '+$mcpi$]=' + slab + '[' + src + '+$mcpi$]'
- }).join('; ') + '; ' + safety()
- ) + '\n' + '}';
+ if (SAFE_HEAP) {
+ return 'for (var $mcpi$ = 0; $mcpi$ < ' + num + '; $mcpi$++) {\n' +
+ (type !== 'null' ? makeSetValue(dest, '$mcpi$', makeGetValue(src, '$mcpi$', type) + (modifier || ''), type)
+ : // Null is special-cased: We copy over all heaps
+ makeGetSlabs(dest, 'null', true).map(function(slab) {
+ return slab + '[' + dest + '+$mcpi$]=' + slab + '[' + src + '+$mcpi$]'
+ }).join('; ') + '; ' + safety()
+ ) + '\n' + '}';
+ }
+ if (USE_TYPED_ARRAYS == 0) {
+ return 'for (var $mcpi_s$=' + src + ',$mcpi_e$=' + src + '+' + num + ',$mcpi_d$=' + dest + '; $mcpi_s$<$mcpi_e$; $mcpi_s$++, $mcpi_d$++) {\n' +
+ ' HEAP[$mcpi_d$] = HEAP[$mcpi_s$];\n' +
+ '}';
+ } else { // USE_TYPED_ARRAYS == 1
+ return 'for (var $mcpi_s$=' + src + ',$mcpi_e$=' + src + '+' + num + ',$mcpi_d$=' + dest + '; $mcpi_s$<$mcpi_e$; $mcpi_s$++, $mcpi_d$++) {\n' +
+ ' IHEAP[$mcpi_d$] = IHEAP[$mcpi_s$]; FHEAP[$mcpi_d$] = FHEAP[$mcpi_s$];\n' +
+ '}';
+ }
} else { // USE_TYPED_ARRAYS == 2
return '' +
'var $src$, $dest$, $stop$, $stop4$, $fast$;\n' +
diff --git a/tests/runner.py b/tests/runner.py
index 35bbe3ac..e31b1455 100644
--- a/tests/runner.py
+++ b/tests/runner.py
@@ -1774,7 +1774,7 @@ if 'benchmark' not in str(sys.argv):
if (i == j) continue;
if (i < j && i+k > j) continue;
if (j < i && j+k > i) continue;
- printf("[%d,%d,%d]\\n", i, j, k);
+ printf("[%d,%d,%d] ", i, j, k);
reset(buffer);
memcpy(buffer+i, buffer+j, k);
dump(buffer);
@@ -4449,17 +4449,9 @@ else:
def test_raytrace(self):
global POST_OPTIMIZATIONS; POST_OPTIMIZATIONS = ['closure']
- old_quantum = Settings.QUANTUM_SIZE
- old_use_typed_arrays = Settings.USE_TYPED_ARRAYS
- Settings.QUANTUM_SIZE = 1
- Settings.USE_TYPED_ARRAYS = 0 # Rounding errors with TA2 are too big in this very rounding-sensitive code. However, TA2 is much faster (2X)
-
src = open(path_from_root('tests', 'raytrace.cpp'), 'r').read().replace('double', 'float') # benchmark with floats
self.do_benchmark(src, ['7', '256'], '256 256', llvm_opts=True, handpicked=False)
- Settings.QUANTUM_SIZE = old_quantum
- Settings.USE_TYPED_ARRAYS = old_use_typed_arrays
-
def test_dlmalloc(self):
global POST_OPTIMIZATIONS; POST_OPTIMIZATIONS = ['eliminator']