mirror of
https://mirror.skon.top/https://github.com/FFmpeg/FFmpeg
synced 2026-04-20 21:00:41 +08:00
Add NEON-optimized implementation for HEVC intra DC prediction at 8-bit
depth, supporting all block sizes (4x4 to 32x32).
DC prediction computes the average of top and left reference samples
using uaddlv, with urshr for rounded division. For luma blocks smaller
than 32x32, edge smoothing is applied: the first row and column are
blended toward the reference using (ref[i] + 3*dc + 2) >> 2 computed
entirely in the NEON domain. Fill stores use pre-computed address
patterns to break dependency chains.
Also adds the aarch64 initialization framework (Makefile, pred.c/pred.h
hooks, hevcpred_init_aarch64.c).
Speedup over C on Apple M4 (checkasm --bench):
4x4: 2.28x, 8x8: 3.14x, 16x16: 3.29x, 32x32: 3.02x
Signed-off-by: Jun Zhao <barryjzhao@tencent.com>
85 lines
2.4 KiB
C
85 lines
2.4 KiB
C
/*
 * HEVC video Decoder
 *
 * Copyright (C) 2012 - 2013 Guillaume Martres
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

#include "hevcdec.h"
#include "pred.h"

/*
 * pred_template.c is included once for each BIT_DEPTH value (8, 9, 10, 12).
 * ff_hevc_pred_init() below refers to functions carrying a matching
 * _8 / _9 / _10 / _12 suffix; presumably each inclusion of the template
 * provides the set for the BIT_DEPTH defined at that point (the template
 * itself is not visible here).
 */
#define BIT_DEPTH 8
#include "pred_template.c"
#undef BIT_DEPTH

#define BIT_DEPTH 9
#include "pred_template.c"
#undef BIT_DEPTH

#define BIT_DEPTH 10
#include "pred_template.c"
#undef BIT_DEPTH

#define BIT_DEPTH 12
#include "pred_template.c"
#undef BIT_DEPTH

/**
 * Fill an HEVCPredContext with the intra prediction functions for one
 * bit depth.
 *
 * Bit depths 9, 10 and 12 select the function set with the matching suffix;
 * any other value selects the 8-bit set. After the assignments, the
 * architecture-specific init hook is called with the same arguments when
 * ARCH_AARCH64 and/or ARCH_MIPS is enabled.
 *
 * @param hpc       context whose function pointers are assigned
 * @param bit_depth sample bit depth used to choose the function set
 */
void ff_hevc_pred_init(HEVCPredContext *hpc, int bit_depth)
{
#undef FUNC
#define FUNC(a, depth) a ## _ ## depth

/* Wrapped in do { } while (0) so that "HEVC_PRED(n);" is exactly one statement. */
#define HEVC_PRED(depth)                                      \
    do {                                                      \
        hpc->intra_pred[0]   = FUNC(intra_pred_2, depth);     \
        hpc->intra_pred[1]   = FUNC(intra_pred_3, depth);     \
        hpc->intra_pred[2]   = FUNC(intra_pred_4, depth);     \
        hpc->intra_pred[3]   = FUNC(intra_pred_5, depth);     \
        hpc->pred_planar[0]  = FUNC(pred_planar_0, depth);    \
        hpc->pred_planar[1]  = FUNC(pred_planar_1, depth);    \
        hpc->pred_planar[2]  = FUNC(pred_planar_2, depth);    \
        hpc->pred_planar[3]  = FUNC(pred_planar_3, depth);    \
        hpc->pred_dc         = FUNC(pred_dc, depth);          \
        hpc->pred_angular[0] = FUNC(pred_angular_0, depth);   \
        hpc->pred_angular[1] = FUNC(pred_angular_1, depth);   \
        hpc->pred_angular[2] = FUNC(pred_angular_2, depth);   \
        hpc->pred_angular[3] = FUNC(pred_angular_3, depth);   \
    } while (0)

    switch (bit_depth) {
    case 9:
        HEVC_PRED(9);
        break;
    case 10:
        HEVC_PRED(10);
        break;
    case 12:
        HEVC_PRED(12);
        break;
    default:
        /* Every bit depth other than 9, 10 and 12 uses the 8-bit set. */
        HEVC_PRED(8);
        break;
    }

    /* Architecture hooks run after the assignments above. */
#if ARCH_AARCH64
    ff_hevc_pred_init_aarch64(hpc, bit_depth);
#endif
#if ARCH_MIPS
    ff_hevc_pred_init_mips(hpc, bit_depth);
#endif
}