/*
 * Copyright (c) 2003-2010 Michael Niedermayer <michaelni@gmx.at>
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

/**
 * @file
 * H.264 DSP functions.
 * @author Michael Niedermayer <michaelni@gmx.at>
 */

#ifndef AVCODEC_H264DSP_H
#define AVCODEC_H264DSP_H

#include <stdint.h>
#include <stddef.h>

/**
 * Entry type of H264DSPContext.weight_h264_pixels_tab: receives one pixel
 * block pointer, its stride and height, and the weighting parameters
 * (log2_denom, weight, offset).
 */
typedef void (*h264_weight_func)(uint8_t *block,
                                 ptrdiff_t stride,
                                 int height,
                                 int log2_denom,
                                 int weight,
                                 int offset);

/**
 * Entry type of H264DSPContext.biweight_h264_pixels_tab: receives a dst and
 * a src pointer sharing one stride, plus a separate weight for each
 * (weightd, weights) and a common log2_denom and offset.
 */
typedef void (*h264_biweight_func)(uint8_t *dst,
                                   uint8_t *src,
                                   ptrdiff_t stride,
                                   int height,
                                   int log2_denom,
                                   int weightd,
                                   int weights,
                                   int offset);

/**
 * Table of function pointers holding the H.264 DSP routines.
 *
 * The "align N" remarks on individual members are the alignment notes the
 * file attaches to the corresponding pointer argument.
 */
typedef struct H264DSPContext {
    /* ---- weighted MC ---- */

    h264_weight_func   weight_h264_pixels_tab[4];
    h264_biweight_func biweight_h264_pixels_tab[4];

    /* ---- loop filter ---- */

    /** pix: align 16 */
    void (*h264_v_loop_filter_luma)(uint8_t *pix, ptrdiff_t stride,
                                    int alpha, int beta, int8_t *tc0);
    /** pix: align 4 */
    void (*h264_h_loop_filter_luma)(uint8_t *pix, ptrdiff_t stride,
                                    int alpha, int beta, int8_t *tc0);
    /** pix: align 16 */
    void (*h264_h_loop_filter_luma_mbaff)(uint8_t *pix, ptrdiff_t stride,
                                          int alpha, int beta, int8_t *tc0);

    /** pix: align 16 (applies to both v/h_loop_filter_luma_intra) */
    void (*h264_v_loop_filter_luma_intra)(uint8_t *pix, ptrdiff_t stride,
                                          int alpha, int beta);
    /** pix: align 16 (applies to both v/h_loop_filter_luma_intra) */
    void (*h264_h_loop_filter_luma_intra)(uint8_t *pix, ptrdiff_t stride,
                                          int alpha, int beta);
    /** pix: align 16 */
    void (*h264_h_loop_filter_luma_mbaff_intra)(uint8_t *pix, ptrdiff_t stride,
                                                int alpha, int beta);

    /** pix: align 8 */
    void (*h264_v_loop_filter_chroma)(uint8_t *pix, ptrdiff_t stride,
                                      int alpha, int beta, int8_t *tc0);
    /** pix: align 4 */
    void (*h264_h_loop_filter_chroma)(uint8_t *pix, ptrdiff_t stride,
                                      int alpha, int beta, int8_t *tc0);
    /** pix: align 8 */
    void (*h264_h_loop_filter_chroma_mbaff)(uint8_t *pix, ptrdiff_t stride,
                                            int alpha, int beta, int8_t *tc0);

    /** pix: align 8 */
    void (*h264_v_loop_filter_chroma_intra)(uint8_t *pix, ptrdiff_t stride,
                                            int alpha, int beta);
    /** pix: align 8 */
    void (*h264_h_loop_filter_chroma_intra)(uint8_t *pix, ptrdiff_t stride,
                                            int alpha, int beta);
    /** pix: align 8 */
    void (*h264_h_loop_filter_chroma_mbaff_intra)(uint8_t *pix, ptrdiff_t stride,
                                                  int alpha, int beta);

    /**
     * SIMD only: the C version of h264_loop_filter_strength is inlined in
     * h264_loopfilter.c.
     */
    void (*h264_loop_filter_strength)(int16_t bS[2][4][4],
                                      uint8_t nnz[40],
                                      int8_t ref[2][40],
                                      int16_t mv[2][40][2],
                                      int bidir, int edges, int step,
                                      int mask_mv0, int mask_mv1, int field);

    /* ---- IDCT ---- */

    /** dst: align 4, block: align 16 */
    void (*h264_idct_add)(uint8_t *dst, int16_t *block, int stride);
    /** dst: align 8, block: align 16 */
    void (*h264_idct8_add)(uint8_t *dst, int16_t *block, int stride);
    /** dst: align 4, block: align 16 */
    void (*h264_idct_dc_add)(uint8_t *dst, int16_t *block, int stride);
    /** dst: align 8, block: align 16 */
    void (*h264_idct8_dc_add)(uint8_t *dst, int16_t *block, int stride);

    /** dst: align 16, block: align 16 */
    void (*h264_idct_add16)(uint8_t *dst, const int *blockoffset,
                            int16_t *block, int stride,
                            const uint8_t nnzc[5 * 8]);
    /** dst: align 16, block: align 16 */
    void (*h264_idct8_add4)(uint8_t *dst, const int *blockoffset,
                            int16_t *block, int stride,
                            const uint8_t nnzc[5 * 8]);
    /** dst: align 16, block: align 16 */
    void (*h264_idct_add8)(uint8_t **dst, const int *blockoffset,
                           int16_t *block, int stride,
                           const uint8_t nnzc[15 * 8]);
    /** dst: align 16, block: align 16 */
    void (*h264_idct_add16intra)(uint8_t *dst, const int *blockoffset,
                                 int16_t *block, int stride,
                                 const uint8_t nnzc[5 * 8]);

    /** input: align 16 */
    void (*h264_luma_dc_dequant_idct)(int16_t *output, int16_t *input,
                                      int qmul);
    void (*h264_chroma_dc_dequant_idct)(int16_t *block, int qmul);

    /* ---- bypass-transform ---- */

    void (*h264_add_pixels8_clear)(uint8_t *dst, int16_t *block, int stride);
    void (*h264_add_pixels4_clear)(uint8_t *dst, int16_t *block, int stride);

    /**
     * Scan buf from its beginning over at most size bytes.
     *
     * Ideally an implementation looks ahead and skips any zero bytes that
     * are known not to be followed by one or more further zero bytes and a
     * one byte. Better still, it also skips any bytes that form the
     * trailing_zero_8bits syntax element.
     *
     * @return the index of a zero byte, or a value >= size if none was found
     */
    int (*startcode_find_candidate)(const uint8_t *buf, int size);
} H264DSPContext;

/*
 * Initializers: each takes the context c together with bit_depth and
 * chroma_format_idc. The suffixed variants are named after an architecture.
 * NOTE(review): presumably they are called from ff_h264dsp_init() to install
 * optimized routines -- confirm against the implementation file.
 */
void ff_h264dsp_init(H264DSPContext *c,
                     const int bit_depth,
                     const int chroma_format_idc);
void ff_h264dsp_init_aarch64(H264DSPContext *c,
                             const int bit_depth,
                             const int chroma_format_idc);
void ff_h264dsp_init_arm(H264DSPContext *c,
                         const int bit_depth,
                         const int chroma_format_idc);
void ff_h264dsp_init_ppc(H264DSPContext *c,
                         const int bit_depth,
                         const int chroma_format_idc);
void ff_h264dsp_init_x86(H264DSPContext *c,
                         const int bit_depth,
                         const int chroma_format_idc);
void ff_h264dsp_init_mips(H264DSPContext *c,
                          const int bit_depth,
                          const int chroma_format_idc);
void ff_h264dsp_init_loongarch(H264DSPContext *c,
                               const int bit_depth,
                               const int chroma_format_idc);

#endif /* AVCODEC_H264DSP_H */