diff options
author | Bernard Ogden <bernie.ogden@linaro.org> | 2014-07-09 13:06:08 +0100 |
---|---|---|
committer | Bernard Ogden <bernie.ogden@linaro.org> | 2014-07-09 13:06:08 +0100 |
commit | 3bd24ee79b22bf4f5b97754fdbb936a209ed9114 (patch) | |
tree | 0532b0eabfa5a817c1bcc84bfd543166df2f7494 | |
parent | 537919350e756c7c7dad847a67f1bfabc7516cb0 (diff) |
A second alternative pld arrangement [bench_all_variants]
A bit better for one set of block sizes, a bit worse for another.
-rw-r--r-- | src/arm/memcpy.S | 4 |
1 files changed, 2 insertions, 2 deletions
diff --git a/src/arm/memcpy.S b/src/arm/memcpy.S
index 5ec4d96..45455b3 100644
--- a/src/arm/memcpy.S
+++ b/src/arm/memcpy.S
@@ -415,10 +415,10 @@ def_fn memcpy p2align=6
 	subs	tmp2, tmp2, #prefetch_lines * 64 * 2
 	blt	2f
 1:
-	cpy_line_vfp	d3, 0
 	pld	[src, #320]
-	cpy_line_vfp	d4, 64
 	pld	[src, #384]
+	cpy_line_vfp	d3, 0
+	cpy_line_vfp	d4, 64
 	cpy_line_vfp	d5, 128
 	pld	[src, #448]
 	add	dst, dst, #3 * 64