1/*! 2 * \copy 3 * Copyright (c) 2013, Cisco Systems 4 * All rights reserved. 5 * 6 * Redistribution and use in source and binary forms, with or without 7 * modification, are permitted provided that the following conditions 8 * are met: 9 * 10 * * Redistributions of source code must retain the above copyright 11 * notice, this list of conditions and the following disclaimer. 12 * 13 * * Redistributions in binary form must reproduce the above copyright 14 * notice, this list of conditions and the following disclaimer in 15 * the documentation and/or other materials provided with the 16 * distribution. 17 * 18 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS 19 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT 20 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS 21 * FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE 22 * COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, 23 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, 24 * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; 25 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER 26 * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 27 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN 28 * ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE 29 * POSSIBILITY OF SUCH DAMAGE. 30 * 31 */ 32 33 34#ifdef HAVE_NEON 35#include "arm_arch_common_macro.S" 36 37WELS_ASM_FUNC_BEGIN WelsI16x16LumaPredV_neon 38 //Get the top line data to 'q0' 39 sub r3, r1, r2 40 vldm r3, {d0, d1} 41 42 //mov r2, #16 43 mov r3, #4 44 //Set the top line to the each line of MB(16*16) 45loop_0_get_i16x16_luma_pred_v: 46 vst1.8 {d0,d1}, [r0]! 47 vst1.8 {d0,d1}, [r0]! 48 vst1.8 {d0,d1}, [r0]! 49 vst1.8 {d0,d1}, [r0]! 50 subs r3, #1 51 bne loop_0_get_i16x16_luma_pred_v 52WELS_ASM_FUNC_END 53 54 55WELS_ASM_FUNC_BEGIN WelsI16x16LumaPredH_neon 56 //stmdb sp!, {r4, lr} 57 sub r1, r1, #1 58 mov r3, #4 59loop_0_get_i16x16_luma_pred_h: 60 //Get one byte data from left side 61 vld1.8 {d0[],d1[]}, [r1], r2 62 vld1.8 {d2[],d3[]}, [r1], r2 63 vld1.8 {d4[],d5[]}, [r1], r2 64 vld1.8 {d6[],d7[]}, [r1], r2 65 66 //Set the line of MB using the left side byte data 67 vst1.8 {d0,d1}, [r0]! 68 //add r0, #16 69 vst1.8 {d2,d3}, [r0]! 70 //add r0, #16 71 vst1.8 {d4,d5}, [r0]! 72 //add r0, #16 73 vst1.8 {d6,d7}, [r0]! 74 //add r0, #16 75 76 subs r3, #1 77 bne loop_0_get_i16x16_luma_pred_h 78 79WELS_ASM_FUNC_END 80 81 82#endif 83