From d3789eeeed3423bd1ca9dc40030a2f7a21ea5332 Mon Sep 17 00:00:00 2001
From: Janne Grunau
Date: Sat, 5 Apr 2014 11:47:18 +0200
Subject: aarch64: implement videodsp.prefetch

8% faster h264 decoding on Apple A7.
---
 libavcodec/aarch64/videodsp.S | 50 +++++++++++++++++++++++++++++++++++
 1 file changed, 50 insertions(+)
 create mode 100644 libavcodec/aarch64/videodsp.S

(limited to 'libavcodec/aarch64/videodsp.S')

diff --git a/libavcodec/aarch64/videodsp.S b/libavcodec/aarch64/videodsp.S
new file mode 100644
index 0000000000..7ce5a7ddf6
--- /dev/null
+++ b/libavcodec/aarch64/videodsp.S
@@ -0,0 +1,50 @@
+/*
+ * This file is part of Libav.
+ *
+ * Libav is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU Lesser General Public
+ * License as published by the Free Software Foundation; either
+ * version 2.1 of the License, or (at your option) any later version.
+ *
+ * Libav is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ * Lesser General Public License for more details.
+ *
+ * You should have received a copy of the GNU Lesser General Public
+ * License along with Libav; if not, write to the Free Software
+ * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
+ */
+
+#include "libavutil/aarch64/asm.S"
+
+/*
+ * ff_prefetch_aarch64: issue streaming L1 load-prefetch hints (PLDL1STRM),
+ * two addresses per loop iteration.
+ *
+ * In:       x0 = first address to prefetch
+ *           x1 = byte offset from one prefetched address to the next
+ *           w2 = number of addresses to cover (signed 32-bit)
+ * Out:      none
+ * Clobbers: x0, x2, NZCV flags
+ *
+ * NOTE(review): presumably backs the videodsp prefetch(buf, stride, h) hook,
+ * i.e. x0/x1/w2 = buf/stride/h -- confirm against the C prototype.
+ *
+ * The counter is decremented before the hints are issued and only tested
+ * afterwards, so one iteration (two hints) always runs, even when w2 <= 0,
+ * and an odd w2 covers one address more than requested.
+ */
+function ff_prefetch_aarch64, export=1
+        // Loop on a local label rather than X(ff_prefetch_aarch64): a
+        // conditional branch to the exported symbol needs a relocation that
+        // some toolchains reject, and it would also re-execute whatever the
+        // function macro may place at the entry point.
+1:
+        subs            w2,  w2,  #2            // two addresses per pass; flags consumed by b.gt
+        prfm            pldl1strm, [x0]         // hint for the current address
+        prfm            pldl1strm, [x0,  x1]    // hint for the following address
+        add             x0,  x0,  x1,  lsl #1   // x0 += 2 * x1 (does not touch flags)
+        b.gt            1b                      // repeat while the counter is still > 0
+        ret
+endfunc
-- 
cgit v1.2.3