ZLMediaKit/src/Codec/H264Encoder.cpp

348 lines
13 KiB
C++
Raw Normal View History

2017-10-09 22:11:01 +08:00
/*
2020-04-04 20:30:09 +08:00
* Copyright (c) 2016 The ZLMediaKit project authors. All Rights Reserved.
2017-09-27 16:20:30 +08:00
*
* This file is part of ZLMediaKit(https://github.com/xia-chu/ZLMediaKit).
2017-09-27 16:20:30 +08:00
*
2020-04-04 20:30:09 +08:00
* Use of this source code is governed by MIT license that can be found in the
* LICENSE file in the root of the source tree. All contributing project authors
* may be found in the AUTHORS file in the root of the source tree.
2017-04-01 16:35:56 +08:00
*/
2017-09-27 16:20:30 +08:00
2017-04-01 16:35:56 +08:00
#ifdef ENABLE_X264
2022-05-25 15:11:26 +08:00
#include "H264Encoder.h"
2017-04-01 16:35:56 +08:00
#include "Util/TimeTicker.h"
2018-10-24 17:17:55 +08:00
using namespace toolkit;
namespace mediakit {
2017-04-01 16:35:56 +08:00
2022-05-25 15:11:26 +08:00
H264Encoder::H264Encoder() {}
2017-04-01 16:35:56 +08:00
H264Encoder::~H264Encoder() {
2020-03-20 11:51:24 +08:00
//* 清除图像区域
if (_pPicIn) {
delete _pPicIn;
_pPicIn = nullptr;
}
if (_pPicOut) {
delete _pPicOut;
_pPicOut = nullptr;
}
//* 关闭编码器句柄
if (_pX264Handle) {
x264_encoder_close(_pX264Handle);
_pX264Handle = nullptr;
}
2017-04-01 16:35:56 +08:00
}
/*typedef struct x264_param_t
{
CPU
unsigned int cpu;
int i_threads;
int b_deterministic; 线
int i_sync_lookahead; 线
int i_width;
int i_height;
int i_csp; CSP,i420
int i_level_idc; level值的设置
int i_frame_total; , 0
Vui参数集视频可用性信息视频标准化选项
struct
{
they will be reduced to be 0 < x <= 65535 and prime
int i_sar_height;
int i_sar_width;
2017-08-09 18:39:30 +08:00
int i_overscan; 0=undef, 1=no overscan, 2=overscan 线"undef"():show()/crop()
2017-04-01 16:35:56 +08:00
h264附件E
Int i_vidformat; "undef"component/pal/ntsc/secam/mac/undef
2017-08-09 18:39:30 +08:00
int b_fullrange; Specify full range samples setting"off":off/on
int i_colorprim; "undef":undef/bt709/bt470m/bt470bgsmpte170m/smpte240m/film
int i_transfer; "undef":undef/bt709/bt470m/bt470bg/linear,log100/log316/smpte170m/smpte240m
2017-04-01 16:35:56 +08:00
int i_colmatrix; "undef",undef/bt709/fcc/bt470bg,smpte170m/smpte240m/GBR/YCgCo
int i_chroma_loc; both top & bottom色度样本指定0~50
} vui;
int i_fps_num;
int i_fps_den;
2017-08-09 18:39:30 +08:00
fps帧率确定的:
2017-04-01 16:35:56 +08:00
{ float fps;
if( sscanf( value, "%d/%d", &p->i_fps_num, &p->i_fps_den ) == 2 )
;
else if( sscanf( value, "%f", &fps ) )
{
p->i_fps_num = (int)(fps * 1000 + .5);
p->i_fps_den = 1000;
}
else
b_error = 1;
}
Value的值就是fps
int i_frame_reference;
int i_keyint_max; IDR关键帧
int i_keyint_min; I, IDR.
int i_scenecut_threshold; I帧
int i_bframe; P帧的数目
int i_bframe_adaptive; B帧判定
int i_bframe_bias; B帧判定-100~+100B帧0
int b_bframe_pyramid; B为参考帧
int b_deblocking_filter;
int i_deblocking_filter_alphac0; [-6, 6] -6 light filter, 6 strong
int i_deblocking_filter_beta; [-6, 6] idem
int b_cabac;
int i_cabac_init_idc;
int b_interlaced;
int i_cqm_preset; (CQM),flat
char *psz_cqm_file; JM format读取JM格式的外部量化矩阵文件cqm
uint8_t cqm_4iy[16]; used only if i_cqm_preset == X264_CQM_CUSTOM
uint8_t cqm_4ic[16];
uint8_t cqm_4py[16];
uint8_t cqm_4pc[16];
uint8_t cqm_8iy[64];
uint8_t cqm_8py[64];
void (*pf_log)( void *, int i_level, const char *psz, va_list );
void *p_log_private;
int i_log_level;
int b_visualize;
char *psz_dump_yuv;
struct
{
unsigned int intra;
unsigned int inter;
int b_transform_8x8;
int b_weighted_bipred; b帧隐式加权
int i_direct_mv_pred;
int i_chroma_qp_offset;
int i_me_method; (X264_ME_*)
int i_me_range; (from predicted mv)
int i_mv_range; (in pixels). -1 = auto, based on level
int i_mv_range_thread; 线. -1 = auto, based on number of threads.
int i_subpel_refine;
int b_chroma_me; P帧的模式选择
int b_mixed_references; P帧有它自己的参考号
2017-08-09 18:39:30 +08:00
int i_trellis; Trellis量化8x8的块寻找合适的量化值CABAC0 0:1:使2:使
2017-04-01 16:35:56 +08:00
int b_fast_pskip; P帧跳过检测
int b_dct_decimate; P-frames转换参数域
int i_noise_reduction;
float f_psy_rd; Psy RD strength
float f_psy_trellis; Psy trellis strength
int b_psy; Toggle all psy optimizations
使
int i_luma_deadzone[2]; {, }
int b_psnr; PSNR信息
int b_ssim; SSIM信息
} analyse;
struct
{
int i_rc_method; X264_RC_*
int i_qp_constant; 0-51
int i_qp_min;
int i_qp_max;
int i_qp_step;
int i_bitrate;
float f_rf_constant; 1pass VBR, nominal QP
float f_rate_tolerance;
int i_vbv_max_bitrate; 0(-B设置相同)
int i_vbv_buffer_size; kbit0
float f_vbv_buffer_init; <=1: fraction of buffer_size. >1: kbit码率控制缓冲区数据保留的最大数据量与缓冲区大小之比0~1.00.9
float f_ip_factor;
float f_pb_factor;
int i_aq_mode; psy adaptive QP. (X264_AQ_*)
float f_aq_strength;
int b_mb_tree; Macroblock-tree ratecontrol.
int i_lookahead;
2pass
int b_stat_write; Enable stat writing in psz_stat_out
char *psz_stat_out;
int b_stat_read; Read stat from psz_stat_in and use it
char *psz_stat_in;
2pass params (same as ffmpeg ones)
float f_qcompress; 0.0 => cbr, 1.0 => constant qp
float f_qblur;
float f_complexity_blur;
x264_zone_t *zones;
int i_zones; number of zone_t's
char *psz_zones;
} rc;
Muxing parameters
int b_aud; 访
int b_repeat_headers; SPS/PPS
int i_sps_id; SPS PPS id
int i_slice_max_size; NAL开销.
int i_slice_max_mbs; i_slice_count
int i_slice_count; : .
Optional callback for freeing this x264_param_t when it is done being used.
* Only used when the x264_param_t sits in memory for an indefinite period of time,
* i.e. when an x264_param_t is passed to x264_t in an x264_picture_t or in zones.
* Not used when x264_encoder_reconfig is called directly.
void (*param_free)( void* );
} x264_param_t;*/
2022-05-25 15:11:26 +08:00
bool H264Encoder::init(int iWidth, int iHeight, int iFps, int iBitRate) {
2020-03-20 11:51:24 +08:00
if (_pX264Handle) {
return true;
}
x264_param_t X264Param, *pX264Param = &X264Param;
//* 配置参数
//* 使用默认参数
x264_param_default_preset(pX264Param, "ultrafast", "zerolatency");
//* cpuFlags
2022-05-25 15:11:26 +08:00
pX264Param->i_threads = X264_SYNC_LOOKAHEAD_AUTO; //* 取空缓冲区继续使用不死锁的保证.
2020-03-20 11:51:24 +08:00
//* video Properties
pX264Param->i_width = iWidth; //* 宽度.
pX264Param->i_height = iHeight; //* 高度
pX264Param->i_frame_total = 0; //* 编码总帧数.不知道用0.
pX264Param->i_keyint_max = iFps * 3; //ffmpeg:gop_size 关键帧最大间隔
pX264Param->i_keyint_min = iFps * 1; //ffmpeg:keyint_min 关键帧最小间隔
//* Rate control Parameters
2022-05-25 15:11:26 +08:00
pX264Param->rc.i_bitrate = iBitRate / 1000; //* 码率(比特率,单位Kbps)
pX264Param->rc.i_qp_step = 1; //最大的在帧与帧之间进行切变的量化因子的变化量。ffmpeg:max_qdiff
pX264Param->rc.i_qp_min = 10; //ffmpeg:qmin;最小的量化因子。取值范围1-51。建议在10-30之间。
pX264Param->rc.i_qp_max = 41; //ffmpeg:qmax;最大的量化因子。取值范围1-51。建议在10-30之间。
2020-03-20 11:51:24 +08:00
pX264Param->rc.f_qcompress = 0.6;//ffmpeg:qcompress 量化器压缩比率0-1.越小则比特率越区域固定,但是越高越使量化器参数越固定
2022-05-25 15:11:26 +08:00
pX264Param->analyse.i_me_range = 16; //ffmpeg:me_range 运动侦测的半径
pX264Param->i_frame_reference = 3; //ffmpeg:refsB和P帧向前预测参考的帧数。取值范围1-16。
//该值不影响解码的速度,但是越大解码
//所需的内存越大。这个值在一般情况下
//越大效果越好但是超过6以后效果就
//不明显了。
pX264Param->analyse.i_trellis = 1; //ffmpeg:trellis
2020-03-20 11:51:24 +08:00
//pX264Param->analyse.i_me_method=X264_ME_DIA;//ffmpeg:me_method ME_ZERO 运动侦测的方式
2022-05-25 15:11:26 +08:00
pX264Param->rc.f_qblur = 0.5; //ffmpeg:qblur
2020-03-20 11:51:24 +08:00
//* bitstream parameters
/*open-GOP
B帧的时候才会出现open-GOP
GOP里面的某一帧在解码时要依赖于前一个GOP的某些帧
GOP就称为open-GOP
open-GOP码流
x264里面open-GOP是默认关闭的
:I0 B0 B1 P0 B2 B3...open-GOP码流I帧后面紧跟B帧
B0 B1的解码需要用到I0前面一个GOP的数据B0 B1的dts是小于I0的
: I0 P0 B0 B1 P1 B2 B3...close-GOP码流
I0后面所有帧的解码不依赖于I0前面的帧I0后面所有帧的dts都比I0的大
IDR0 B0 B1 P0 B2 B3...GOP是close-GOPB0,B1虽然dst比IDR0小
B0,B1参考不到前向GOP帧
: ...P0 B1 B2 P3 B4 B5 I6这就会输出open-Gop码流 P0 P3 B1 B2 I6 B4 B5...
B4 B5的解码依赖P3
...P0 B1 B2 P3 B4 P5 I6这样就不会输出open-GOP码流P0 P3 B1 B2 P5 B4 I6...
I6前面的第5帧是设置为B帧还是P帧
GOP的最后一帧5B帧
open-GOP,P帧就是close-GOP
B帧压缩性能好于P帧open-GOP在编码性能上稍微优于close-GOP
opne-GOP关闭的好*/
pX264Param->b_open_gop = 0;
2022-05-25 15:11:26 +08:00
pX264Param->i_bframe = 0; //最大B帧数.
2020-03-20 11:51:24 +08:00
pX264Param->i_bframe_pyramid = 0;
pX264Param->i_bframe_adaptive = X264_B_ADAPT_TRELLIS;
//* Log
pX264Param->i_log_level = X264_LOG_ERROR;
//* muxing parameters
pX264Param->i_fps_den = 1; //* 帧率分母
pX264Param->i_fps_num = iFps; //* 帧率分子
pX264Param->i_timebase_den = pX264Param->i_fps_num;
pX264Param->i_timebase_num = pX264Param->i_fps_den;
pX264Param->analyse.i_subpel_refine = 1; //这个参数控制在运动估算过程中质量和速度的权衡。Subq=5可以压缩>10%于subq=1。1-7
pX264Param->analyse.b_fast_pskip = 1; //在P帧内执行早期快速跳跃探测。这个经常在没有任何损失的前提下提高了速度。
pX264Param->b_annexb = 1; //1前面为0x00000001,0为nal长度
pX264Param->b_repeat_headers = 1; //关键帧前面是否放sps跟pps帧0 否 1
//* 设置Profile.使用baseline
x264_param_apply_profile(pX264Param, "high");
//* 打开编码器句柄,通过x264_encoder_parameters得到设置给X264
//* 的参数.通过x264_encoder_reconfig更新X264的参数
_pX264Handle = x264_encoder_open(pX264Param);
if (!_pX264Handle) {
return false;
}
_pPicIn = new x264_picture_t;
_pPicOut = new x264_picture_t;
x264_picture_init(_pPicIn);
x264_picture_init(_pPicOut);
_pPicIn->img.i_csp = X264_CSP_I420;
_pPicIn->img.i_plane = 3;
return true;
2017-04-01 16:35:56 +08:00
}
2022-05-25 15:11:26 +08:00
int H264Encoder::inputData(char *yuv[3], int linesize[3], int64_t cts, H264Frame **out_frame) {
2020-03-20 11:51:24 +08:00
//TimeTicker1(5);
2022-05-25 15:11:26 +08:00
_pPicIn->img.i_stride[0] = linesize[0];
_pPicIn->img.i_stride[1] = linesize[1];
_pPicIn->img.i_stride[2] = linesize[2];
_pPicIn->img.plane[0] = (uint8_t *) yuv[0];
_pPicIn->img.plane[1] = (uint8_t *) yuv[1];
_pPicIn->img.plane[2] = (uint8_t *) yuv[2];
_pPicIn->i_pts = cts;
2020-03-20 11:51:24 +08:00
int iNal;
2022-05-25 15:11:26 +08:00
x264_nal_t *pNals;
2020-03-20 11:51:24 +08:00
2022-05-25 15:11:26 +08:00
int iResult = x264_encoder_encode(_pX264Handle, &pNals, &iNal, _pPicIn, _pPicOut);
2020-03-20 11:51:24 +08:00
if (iResult <= 0) {
return 0;
}
for (int i = 0; i < iNal; i++) {
x264_nal_t pNal = pNals[i];
_aFrames[i].iType = pNal.i_type;
_aFrames[i].iLength = pNal.i_payload;
_aFrames[i].pucData = pNal.p_payload;
}
2022-05-25 15:11:26 +08:00
*out_frame = _aFrames;
2020-03-20 11:51:24 +08:00
return iNal;
2017-04-01 16:35:56 +08:00
}
2018-10-24 17:17:55 +08:00
} /* namespace mediakit */
2017-04-01 16:35:56 +08:00
#endif //ENABLE_X264