mirror of
https://github.com/xenia-project/FFmpeg.git
synced 2024-12-01 15:31:24 +00:00
b7d1488393
This fixes out of global array reads. The alternative solutions of checking the index or modifying the VLC tables to prevent the index going outside are each about 1-2 cpu cyclces slower per coded 4x4 block. The alternative of padding the global tables directly is more ugly and moving them to the context should benefit cache locality. Found-by: Mateusz "j00ru" Jurczyk and Gynvael Coldwind Signed-off-by: Michael Niedermayer <michaelni@gmx.at>
273 lines
11 KiB
C
273 lines
11 KiB
C
/*
|
|
* H26L/H264/AVC/JVT/14496-10/... encoder/decoder
|
|
* Copyright (c) 2003 Michael Niedermayer <michaelni@gmx.at>
|
|
*
|
|
* This file is part of FFmpeg.
|
|
*
|
|
* FFmpeg is free software; you can redistribute it and/or
|
|
* modify it under the terms of the GNU Lesser General Public
|
|
* License as published by the Free Software Foundation; either
|
|
* version 2.1 of the License, or (at your option) any later version.
|
|
*
|
|
* FFmpeg is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
* Lesser General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU Lesser General Public
|
|
* License along with FFmpeg; if not, write to the Free Software
|
|
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
|
|
*/
|
|
|
|
/**
|
|
* @file
|
|
* @brief
|
|
* H264 / AVC / MPEG4 part10 codec data table
|
|
* @author Michael Niedermayer <michaelni@gmx.at>
|
|
*/
|
|
|
|
#ifndef AVCODEC_H264DATA_H
|
|
#define AVCODEC_H264DATA_H
|
|
|
|
#include <stdint.h>
|
|
|
|
#include "libavutil/rational.h"
|
|
#include "mpegvideo.h"
|
|
#include "h264.h"
|
|
|
|
static const uint8_t golomb_to_pict_type[5] = {
|
|
AV_PICTURE_TYPE_P, AV_PICTURE_TYPE_B, AV_PICTURE_TYPE_I,
|
|
AV_PICTURE_TYPE_SP, AV_PICTURE_TYPE_SI
|
|
};
|
|
|
|
static const uint8_t golomb_to_intra4x4_cbp[48] = {
|
|
47, 31, 15, 0, 23, 27, 29, 30, 7, 11, 13, 14, 39, 43, 45, 46,
|
|
16, 3, 5, 10, 12, 19, 21, 26, 28, 35, 37, 42, 44, 1, 2, 4,
|
|
8, 17, 18, 20, 24, 6, 9, 22, 25, 32, 33, 34, 36, 40, 38, 41
|
|
};
|
|
|
|
static const uint8_t golomb_to_inter_cbp[48] = {
|
|
0, 16, 1, 2, 4, 8, 32, 3, 5, 10, 12, 15, 47, 7, 11, 13,
|
|
14, 6, 9, 31, 35, 37, 42, 44, 33, 34, 36, 40, 39, 43, 45, 46,
|
|
17, 18, 20, 24, 19, 21, 26, 28, 23, 27, 29, 30, 22, 25, 38, 41
|
|
};
|
|
|
|
static const uint8_t zigzag_scan[16+1] = {
|
|
0 + 0 * 4, 1 + 0 * 4, 0 + 1 * 4, 0 + 2 * 4,
|
|
1 + 1 * 4, 2 + 0 * 4, 3 + 0 * 4, 2 + 1 * 4,
|
|
1 + 2 * 4, 0 + 3 * 4, 1 + 3 * 4, 2 + 2 * 4,
|
|
3 + 1 * 4, 3 + 2 * 4, 2 + 3 * 4, 3 + 3 * 4,
|
|
};
|
|
|
|
static const uint8_t field_scan[16+1] = {
|
|
0 + 0 * 4, 0 + 1 * 4, 1 + 0 * 4, 0 + 2 * 4,
|
|
0 + 3 * 4, 1 + 1 * 4, 1 + 2 * 4, 1 + 3 * 4,
|
|
2 + 0 * 4, 2 + 1 * 4, 2 + 2 * 4, 2 + 3 * 4,
|
|
3 + 0 * 4, 3 + 1 * 4, 3 + 2 * 4, 3 + 3 * 4,
|
|
};
|
|
|
|
static const uint8_t luma_dc_zigzag_scan[16] = {
|
|
0 * 16 + 0 * 64, 1 * 16 + 0 * 64, 2 * 16 + 0 * 64, 0 * 16 + 2 * 64,
|
|
3 * 16 + 0 * 64, 0 * 16 + 1 * 64, 1 * 16 + 1 * 64, 2 * 16 + 1 * 64,
|
|
1 * 16 + 2 * 64, 2 * 16 + 2 * 64, 3 * 16 + 2 * 64, 0 * 16 + 3 * 64,
|
|
3 * 16 + 1 * 64, 1 * 16 + 3 * 64, 2 * 16 + 3 * 64, 3 * 16 + 3 * 64,
|
|
};
|
|
|
|
static const uint8_t luma_dc_field_scan[16] = {
|
|
0 * 16 + 0 * 64, 2 * 16 + 0 * 64, 1 * 16 + 0 * 64, 0 * 16 + 2 * 64,
|
|
2 * 16 + 2 * 64, 3 * 16 + 0 * 64, 1 * 16 + 2 * 64, 3 * 16 + 2 * 64,
|
|
0 * 16 + 1 * 64, 2 * 16 + 1 * 64, 0 * 16 + 3 * 64, 2 * 16 + 3 * 64,
|
|
1 * 16 + 1 * 64, 3 * 16 + 1 * 64, 1 * 16 + 3 * 64, 3 * 16 + 3 * 64,
|
|
};
|
|
|
|
static const uint8_t chroma_dc_scan[4] = {
|
|
(0 + 0 * 2) * 16, (1 + 0 * 2) * 16,
|
|
(0 + 1 * 2) * 16, (1 + 1 * 2) * 16,
|
|
};
|
|
|
|
static const uint8_t chroma422_dc_scan[8] = {
|
|
(0 + 0 * 2) * 16, (0 + 1 * 2) * 16,
|
|
(1 + 0 * 2) * 16, (0 + 2 * 2) * 16,
|
|
(0 + 3 * 2) * 16, (1 + 1 * 2) * 16,
|
|
(1 + 2 * 2) * 16, (1 + 3 * 2) * 16,
|
|
};
|
|
|
|
// zigzag_scan8x8_cavlc[i] = zigzag_scan8x8[(i/4) + 16*(i%4)]
|
|
static const uint8_t zigzag_scan8x8_cavlc[64+1] = {
|
|
0 + 0 * 8, 1 + 1 * 8, 1 + 2 * 8, 2 + 2 * 8,
|
|
4 + 1 * 8, 0 + 5 * 8, 3 + 3 * 8, 7 + 0 * 8,
|
|
3 + 4 * 8, 1 + 7 * 8, 5 + 3 * 8, 6 + 3 * 8,
|
|
2 + 7 * 8, 6 + 4 * 8, 5 + 6 * 8, 7 + 5 * 8,
|
|
1 + 0 * 8, 2 + 0 * 8, 0 + 3 * 8, 3 + 1 * 8,
|
|
3 + 2 * 8, 0 + 6 * 8, 4 + 2 * 8, 6 + 1 * 8,
|
|
2 + 5 * 8, 2 + 6 * 8, 6 + 2 * 8, 5 + 4 * 8,
|
|
3 + 7 * 8, 7 + 3 * 8, 4 + 7 * 8, 7 + 6 * 8,
|
|
0 + 1 * 8, 3 + 0 * 8, 0 + 4 * 8, 4 + 0 * 8,
|
|
2 + 3 * 8, 1 + 5 * 8, 5 + 1 * 8, 5 + 2 * 8,
|
|
1 + 6 * 8, 3 + 5 * 8, 7 + 1 * 8, 4 + 5 * 8,
|
|
4 + 6 * 8, 7 + 4 * 8, 5 + 7 * 8, 6 + 7 * 8,
|
|
0 + 2 * 8, 2 + 1 * 8, 1 + 3 * 8, 5 + 0 * 8,
|
|
1 + 4 * 8, 2 + 4 * 8, 6 + 0 * 8, 4 + 3 * 8,
|
|
0 + 7 * 8, 4 + 4 * 8, 7 + 2 * 8, 3 + 6 * 8,
|
|
5 + 5 * 8, 6 + 5 * 8, 6 + 6 * 8, 7 + 7 * 8,
|
|
};
|
|
|
|
static const uint8_t field_scan8x8[64+1] = {
|
|
0 + 0 * 8, 0 + 1 * 8, 0 + 2 * 8, 1 + 0 * 8,
|
|
1 + 1 * 8, 0 + 3 * 8, 0 + 4 * 8, 1 + 2 * 8,
|
|
2 + 0 * 8, 1 + 3 * 8, 0 + 5 * 8, 0 + 6 * 8,
|
|
0 + 7 * 8, 1 + 4 * 8, 2 + 1 * 8, 3 + 0 * 8,
|
|
2 + 2 * 8, 1 + 5 * 8, 1 + 6 * 8, 1 + 7 * 8,
|
|
2 + 3 * 8, 3 + 1 * 8, 4 + 0 * 8, 3 + 2 * 8,
|
|
2 + 4 * 8, 2 + 5 * 8, 2 + 6 * 8, 2 + 7 * 8,
|
|
3 + 3 * 8, 4 + 1 * 8, 5 + 0 * 8, 4 + 2 * 8,
|
|
3 + 4 * 8, 3 + 5 * 8, 3 + 6 * 8, 3 + 7 * 8,
|
|
4 + 3 * 8, 5 + 1 * 8, 6 + 0 * 8, 5 + 2 * 8,
|
|
4 + 4 * 8, 4 + 5 * 8, 4 + 6 * 8, 4 + 7 * 8,
|
|
5 + 3 * 8, 6 + 1 * 8, 6 + 2 * 8, 5 + 4 * 8,
|
|
5 + 5 * 8, 5 + 6 * 8, 5 + 7 * 8, 6 + 3 * 8,
|
|
7 + 0 * 8, 7 + 1 * 8, 6 + 4 * 8, 6 + 5 * 8,
|
|
6 + 6 * 8, 6 + 7 * 8, 7 + 2 * 8, 7 + 3 * 8,
|
|
7 + 4 * 8, 7 + 5 * 8, 7 + 6 * 8, 7 + 7 * 8,
|
|
};
|
|
|
|
static const uint8_t field_scan8x8_cavlc[64+1] = {
|
|
0 + 0 * 8, 1 + 1 * 8, 2 + 0 * 8, 0 + 7 * 8,
|
|
2 + 2 * 8, 2 + 3 * 8, 2 + 4 * 8, 3 + 3 * 8,
|
|
3 + 4 * 8, 4 + 3 * 8, 4 + 4 * 8, 5 + 3 * 8,
|
|
5 + 5 * 8, 7 + 0 * 8, 6 + 6 * 8, 7 + 4 * 8,
|
|
0 + 1 * 8, 0 + 3 * 8, 1 + 3 * 8, 1 + 4 * 8,
|
|
1 + 5 * 8, 3 + 1 * 8, 2 + 5 * 8, 4 + 1 * 8,
|
|
3 + 5 * 8, 5 + 1 * 8, 4 + 5 * 8, 6 + 1 * 8,
|
|
5 + 6 * 8, 7 + 1 * 8, 6 + 7 * 8, 7 + 5 * 8,
|
|
0 + 2 * 8, 0 + 4 * 8, 0 + 5 * 8, 2 + 1 * 8,
|
|
1 + 6 * 8, 4 + 0 * 8, 2 + 6 * 8, 5 + 0 * 8,
|
|
3 + 6 * 8, 6 + 0 * 8, 4 + 6 * 8, 6 + 2 * 8,
|
|
5 + 7 * 8, 6 + 4 * 8, 7 + 2 * 8, 7 + 6 * 8,
|
|
1 + 0 * 8, 1 + 2 * 8, 0 + 6 * 8, 3 + 0 * 8,
|
|
1 + 7 * 8, 3 + 2 * 8, 2 + 7 * 8, 4 + 2 * 8,
|
|
3 + 7 * 8, 5 + 2 * 8, 4 + 7 * 8, 5 + 4 * 8,
|
|
6 + 3 * 8, 6 + 5 * 8, 7 + 3 * 8, 7 + 7 * 8,
|
|
};
|
|
|
|
typedef struct IMbInfo {
|
|
uint16_t type;
|
|
uint8_t pred_mode;
|
|
uint8_t cbp;
|
|
} IMbInfo;
|
|
|
|
static const IMbInfo i_mb_type_info[26] = {
|
|
{ MB_TYPE_INTRA4x4, -1, -1 },
|
|
{ MB_TYPE_INTRA16x16, 2, 0 },
|
|
{ MB_TYPE_INTRA16x16, 1, 0 },
|
|
{ MB_TYPE_INTRA16x16, 0, 0 },
|
|
{ MB_TYPE_INTRA16x16, 3, 0 },
|
|
{ MB_TYPE_INTRA16x16, 2, 16 },
|
|
{ MB_TYPE_INTRA16x16, 1, 16 },
|
|
{ MB_TYPE_INTRA16x16, 0, 16 },
|
|
{ MB_TYPE_INTRA16x16, 3, 16 },
|
|
{ MB_TYPE_INTRA16x16, 2, 32 },
|
|
{ MB_TYPE_INTRA16x16, 1, 32 },
|
|
{ MB_TYPE_INTRA16x16, 0, 32 },
|
|
{ MB_TYPE_INTRA16x16, 3, 32 },
|
|
{ MB_TYPE_INTRA16x16, 2, 15 + 0 },
|
|
{ MB_TYPE_INTRA16x16, 1, 15 + 0 },
|
|
{ MB_TYPE_INTRA16x16, 0, 15 + 0 },
|
|
{ MB_TYPE_INTRA16x16, 3, 15 + 0 },
|
|
{ MB_TYPE_INTRA16x16, 2, 15 + 16 },
|
|
{ MB_TYPE_INTRA16x16, 1, 15 + 16 },
|
|
{ MB_TYPE_INTRA16x16, 0, 15 + 16 },
|
|
{ MB_TYPE_INTRA16x16, 3, 15 + 16 },
|
|
{ MB_TYPE_INTRA16x16, 2, 15 + 32 },
|
|
{ MB_TYPE_INTRA16x16, 1, 15 + 32 },
|
|
{ MB_TYPE_INTRA16x16, 0, 15 + 32 },
|
|
{ MB_TYPE_INTRA16x16, 3, 15 + 32 },
|
|
{ MB_TYPE_INTRA_PCM, -1, -1 },
|
|
};
|
|
|
|
typedef struct PMbInfo {
|
|
uint16_t type;
|
|
uint8_t partition_count;
|
|
} PMbInfo;
|
|
|
|
static const PMbInfo p_mb_type_info[5] = {
|
|
{ MB_TYPE_16x16 | MB_TYPE_P0L0, 1 },
|
|
{ MB_TYPE_16x8 | MB_TYPE_P0L0 | MB_TYPE_P1L0, 2 },
|
|
{ MB_TYPE_8x16 | MB_TYPE_P0L0 | MB_TYPE_P1L0, 2 },
|
|
{ MB_TYPE_8x8 | MB_TYPE_P0L0 | MB_TYPE_P1L0, 4 },
|
|
{ MB_TYPE_8x8 | MB_TYPE_P0L0 | MB_TYPE_P1L0 | MB_TYPE_REF0, 4 },
|
|
};
|
|
|
|
static const PMbInfo p_sub_mb_type_info[4] = {
|
|
{ MB_TYPE_16x16 | MB_TYPE_P0L0, 1 },
|
|
{ MB_TYPE_16x8 | MB_TYPE_P0L0, 2 },
|
|
{ MB_TYPE_8x16 | MB_TYPE_P0L0, 2 },
|
|
{ MB_TYPE_8x8 | MB_TYPE_P0L0, 4 },
|
|
};
|
|
|
|
static const PMbInfo b_mb_type_info[23] = {
|
|
{ MB_TYPE_DIRECT2 | MB_TYPE_L0L1, 1, },
|
|
{ MB_TYPE_16x16 | MB_TYPE_P0L0, 1, },
|
|
{ MB_TYPE_16x16 | MB_TYPE_P0L1, 1, },
|
|
{ MB_TYPE_16x16 | MB_TYPE_P0L0 | MB_TYPE_P0L1, 1, },
|
|
{ MB_TYPE_16x8 | MB_TYPE_P0L0 | MB_TYPE_P1L0, 2, },
|
|
{ MB_TYPE_8x16 | MB_TYPE_P0L0 | MB_TYPE_P1L0, 2, },
|
|
{ MB_TYPE_16x8 | MB_TYPE_P0L1 | MB_TYPE_P1L1, 2, },
|
|
{ MB_TYPE_8x16 | MB_TYPE_P0L1 | MB_TYPE_P1L1, 2, },
|
|
{ MB_TYPE_16x8 | MB_TYPE_P0L0 | MB_TYPE_P1L1, 2, },
|
|
{ MB_TYPE_8x16 | MB_TYPE_P0L0 | MB_TYPE_P1L1, 2, },
|
|
{ MB_TYPE_16x8 | MB_TYPE_P0L1 | MB_TYPE_P1L0, 2, },
|
|
{ MB_TYPE_8x16 | MB_TYPE_P0L1 | MB_TYPE_P1L0, 2, },
|
|
{ MB_TYPE_16x8 | MB_TYPE_P0L0 | MB_TYPE_P1L0 | MB_TYPE_P1L1, 2, },
|
|
{ MB_TYPE_8x16 | MB_TYPE_P0L0 | MB_TYPE_P1L0 | MB_TYPE_P1L1, 2, },
|
|
{ MB_TYPE_16x8 | MB_TYPE_P0L1 | MB_TYPE_P1L0 | MB_TYPE_P1L1, 2, },
|
|
{ MB_TYPE_8x16 | MB_TYPE_P0L1 | MB_TYPE_P1L0 | MB_TYPE_P1L1, 2, },
|
|
{ MB_TYPE_16x8 | MB_TYPE_P0L0 | MB_TYPE_P0L1 | MB_TYPE_P1L0, 2, },
|
|
{ MB_TYPE_8x16 | MB_TYPE_P0L0 | MB_TYPE_P0L1 | MB_TYPE_P1L0, 2, },
|
|
{ MB_TYPE_16x8 | MB_TYPE_P0L0 | MB_TYPE_P0L1 | MB_TYPE_P1L1, 2, },
|
|
{ MB_TYPE_8x16 | MB_TYPE_P0L0 | MB_TYPE_P0L1 | MB_TYPE_P1L1, 2, },
|
|
{ MB_TYPE_16x8 | MB_TYPE_P0L0 | MB_TYPE_P0L1 | MB_TYPE_P1L0 | MB_TYPE_P1L1, 2, },
|
|
{ MB_TYPE_8x16 | MB_TYPE_P0L0 | MB_TYPE_P0L1 | MB_TYPE_P1L0 | MB_TYPE_P1L1, 2, },
|
|
{ MB_TYPE_8x8 | MB_TYPE_P0L0 | MB_TYPE_P0L1 | MB_TYPE_P1L0 | MB_TYPE_P1L1, 4, },
|
|
};
|
|
|
|
static const PMbInfo b_sub_mb_type_info[13] = {
|
|
{ MB_TYPE_DIRECT2, 1, },
|
|
{ MB_TYPE_16x16 | MB_TYPE_P0L0, 1, },
|
|
{ MB_TYPE_16x16 | MB_TYPE_P0L1, 1, },
|
|
{ MB_TYPE_16x16 | MB_TYPE_P0L0 | MB_TYPE_P0L1, 1, },
|
|
{ MB_TYPE_16x8 | MB_TYPE_P0L0 | MB_TYPE_P1L0, 2, },
|
|
{ MB_TYPE_8x16 | MB_TYPE_P0L0 | MB_TYPE_P1L0, 2, },
|
|
{ MB_TYPE_16x8 | MB_TYPE_P0L1 | MB_TYPE_P1L1, 2, },
|
|
{ MB_TYPE_8x16 | MB_TYPE_P0L1 | MB_TYPE_P1L1, 2, },
|
|
{ MB_TYPE_16x8 | MB_TYPE_P0L0 | MB_TYPE_P0L1 | MB_TYPE_P1L0 | MB_TYPE_P1L1, 2, },
|
|
{ MB_TYPE_8x16 | MB_TYPE_P0L0 | MB_TYPE_P0L1 | MB_TYPE_P1L0 | MB_TYPE_P1L1, 2, },
|
|
{ MB_TYPE_8x8 | MB_TYPE_P0L0 | MB_TYPE_P1L0, 4, },
|
|
{ MB_TYPE_8x8 | MB_TYPE_P0L1 | MB_TYPE_P1L1, 4, },
|
|
{ MB_TYPE_8x8 | MB_TYPE_P0L0 | MB_TYPE_P0L1 | MB_TYPE_P1L0 | MB_TYPE_P1L1, 4, },
|
|
};
|
|
|
|
static const uint8_t dequant4_coeff_init[6][3] = {
|
|
{ 10, 13, 16 },
|
|
{ 11, 14, 18 },
|
|
{ 13, 16, 20 },
|
|
{ 14, 18, 23 },
|
|
{ 16, 20, 25 },
|
|
{ 18, 23, 29 },
|
|
};
|
|
|
|
static const uint8_t dequant8_coeff_init_scan[16] = {
|
|
0, 3, 4, 3, 3, 1, 5, 1, 4, 5, 2, 5, 3, 1, 5, 1
|
|
};
|
|
|
|
static const uint8_t dequant8_coeff_init[6][6] = {
|
|
{ 20, 18, 32, 19, 25, 24 },
|
|
{ 22, 19, 35, 21, 28, 26 },
|
|
{ 26, 23, 42, 24, 33, 31 },
|
|
{ 28, 25, 45, 26, 35, 33 },
|
|
{ 32, 28, 51, 30, 40, 38 },
|
|
{ 36, 32, 58, 34, 46, 43 },
|
|
};
|
|
|
|
#endif /* AVCODEC_H264DATA_H */
|