音视频从入门到精通——FFmpeg之av_seek_frame函数分析



    /**
     * Seek to the keyframe at timestamp.
     * 'timestamp' in 'stream_index'.
     *
     * @param s media file handle
     * @param stream_index If stream_index is (-1), a default
     * stream is selected, and timestamp is automatically converted
     * from AV_TIME_BASE units to the stream specific time_base.
     * @param timestamp Timestamp in AVStream.time_base units
     *        or, if no stream is specified, in AV_TIME_BASE units.
     * @param flags flags which select direction and seeking mode
     * @return >= 0 on success
     */
    int av_seek_frame(AVFormatContext *s, int stream_index, int64_t timestamp,
                      int flags);
    s: AVFormatContext类型的多媒体文件句柄

    stream_index : int类型表示要进行操作的流索引

    timestamp: int64_t类型的时间戳,表示要跳转到的时间位置

    flags : 跳转方法,主要有以下几种

    #define AVSEEK_FLAG_BACKWARD 1 
    ///< seek backward seek到timestamp之前的最近关键帧
    #define AVSEEK_FLAG_BYTE 2 
    ///< seeking based on position in bytes 基于字节位置的跳转
    #define AVSEEK_FLAG_ANY 4 
    ///< seek to any frame, even non-keyframes 跳转到任意帧,不一定是关键帧
    #define AVSEEK_FLAG_FRAME 8 
    ///< seeking based on frame number 基于帧数量的跳转
    flags 的值为1,2,4,8。表示为二进制也就是

    0000 0001
    0000 0010
    0000 0100
    0000 1000
    每个取值只占用一个二进制位,所以 flags 可以通过按位或运算(|)组合起来使用,例如 AVSEEK_FLAG_BACKWARD | AVSEEK_FLAG_ANY。


    #include <chrono>
    #include <iostream>
    #include <thread>
    extern "C" {
    	#include "libavformat/avformat.h"
    	#include "libavcodec/avcodec.h"
    	#include "libswscale/swscale.h"
    	#include "libswresample/swresample.h"
    }
    using namespace std;
    #pragma comment(lib,"avformat.lib")
    #pragma comment(lib,"avutil.lib")
    #pragma comment(lib,"avcodec.lib")
    #pragma comment(lib,"swscale.lib")
    #pragma comment(lib,"swresample.lib")
    /**
     * Converts an AVRational (num / den) to a double.
     *
     * @param r rational value, e.g. a stream time_base or frame rate
     * @return r.num / r.den, or 0 when the denominator is 0
     */
    static double r2d(AVRational r)
    {
    	// Guard the division: a zero denominator yields 0 instead of inf/NaN.
    	return r.den == 0 ? 0 : (double)r.num / (double)r.den;
    }
    /**
     * Blocks the calling thread for at least the given number of milliseconds.
     *
     * @param ms sleep duration in milliseconds; values <= 0 return immediately
     */
    void XSleep(int ms)
    {
    	// C++11 portable sleep; names are fully qualified so the function does
    	// not depend on a using-directive being in effect.
    	std::chrono::milliseconds du(ms);
    	std::this_thread::sleep_for(du);
    }
    int main(int argc, char* argv[])
    	cout << "Test Demux FFmpeg.club" << endl;
    	const char* path = "D:\\javaCode\\androidmaniu2022\\FFmpeg\\input.mp4";
    	//初始化封装库---declared deprecated
    	//初始化网络库 (可以打开rtsp rtmp http 协议的流媒体视频)
    	//注册解码器---declared deprecated
    	AVDictionary* opts = NULL;
    	av_dict_set(&opts, "rtsp_transport", "tcp", 0);
    	av_dict_set(&opts, "max_delay", "500", 0);
    	AVFormatContext* ic = NULL;
    	int re = avformat_open_input(
    		0,  // 0表示自动选择解封器
    		&opts //参数设置,比如rtsp的延时时间
    	if (re != 0)
    		char buf[1024] = { 0 };
    		av_strerror(re, buf, sizeof(buf) - 1);
    		cout << "open " << path << " failed! :" << buf << endl;
    		return -1;
    	cout << "open " << path << " success! " << endl;
    	re = avformat_find_stream_info(ic, 0);
    	//总时长 毫秒
    	int totalMs = ic->duration / (AV_TIME_BASE / 1000);
    	cout << "totalMs = " << totalMs << endl;
    	av_dump_format(ic, 0, path, 0);
    	int videoStream = 0;
    	int audioStream = 1;
    	//获取音视频流信息 (遍历,函数获取)
    	for (int i = 0; i < ic->nb_streams; i++)
    		AVStream* as = ic->streams[i];
    		cout << "codec_id = " << as->codecpar->codec_id << endl;
    		cout << "format = " << as->codecpar->format << endl;
    		if (as->codecpar->codec_type == AVMEDIA_TYPE_AUDIO)
    			audioStream = i;
    			cout << i << "音频信息" << endl;
    			cout << "sample_rate = " << as->codecpar->sample_rate << endl;
    			cout << "channels = " << as->codecpar->channels << endl;
    			//一帧数据?? 单通道样本数 
    			cout << "frame_size = " << as->codecpar->frame_size << endl;
    			//1024 * 2 * 2 = 4096  fps = sample_rate/frame_size
    		else if (as->codecpar->codec_type == AVMEDIA_TYPE_VIDEO)
    			videoStream = i;
    			cout << i << "视频信息" << endl;
    			cout << "width=" << as->codecpar->width << endl;
    			cout << "height=" << as->codecpar->height << endl;
    			//帧率 fps 分数转换
    			cout << "video fps = " << r2d(as->avg_frame_rate) << endl;
    	videoStream = av_find_best_stream(ic, AVMEDIA_TYPE_VIDEO, -1, -1, NULL, 0);
    	AVCodec* vcodec = avcodec_find_decoder(ic->streams[videoStream]->codecpar->codec_id);
    	if (!vcodec)
    		cout << "can't find the codec id " << ic->streams[videoStream]->codecpar->codec_id;
    		return -1;
    	cout << "find the AVCodec " << ic->streams[videoStream]->codecpar->codec_id << endl;
    	AVCodecContext* vc = avcodec_alloc_context3(vcodec);
    	avcodec_parameters_to_context(vc, ic->streams[videoStream]->codecpar);
    	vc->thread_count = 8;
    	re = avcodec_open2(vc, 0, 0);
    	if (re != 0)
    		char buf[1024] = { 0 };
    		av_strerror(re, buf, sizeof(buf) - 1);
    		cout << "avcodec_open2  failed! :" << buf << endl;
    		return -1;
    	cout << "video avcodec_open2 success!" << endl;
    	AVCodec* acodec = avcodec_find_decoder(ic->streams[audioStream]->codecpar->codec_id);
    	if (!acodec)
    		cout << "can't find the codec id " << ic->streams[audioStream]->codecpar->codec_id;
    		return -1;
    	cout << "find the AVCodec " << ic->streams[audioStream]->codecpar->codec_id << endl;
    	AVCodecContext* ac = avcodec_alloc_context3(acodec);
    	avcodec_parameters_to_context(ac, ic->streams[audioStream]->codecpar);
    	ac->thread_count = 8;
    	re = avcodec_open2(ac, 0, 0);
    	if (re != 0)
    		char buf[1024] = { 0 };
    		av_strerror(re, buf, sizeof(buf) - 1);
    		cout << "avcodec_open2  failed! :" << buf << endl;
    		return -1;
    	cout << "audio avcodec_open2 success!" << endl;
    	//malloc AVPacket并初始化
    	AVPacket* pkt = av_packet_alloc();
    	AVFrame* frame = av_frame_alloc();
    	SwsContext* vctx = NULL;
    	unsigned char* rgb = NULL;
    	//音频重采样 上下文初始化
    	SwrContext* actx = swr_alloc();
    	actx = swr_alloc_set_opts(actx,
    		av_get_default_channel_layout(2),	//输出格式
    		AV_SAMPLE_FMT_S16,					//输出样本格式
    		ac->sample_rate,					//输出采样率
    		0, 0
    	re = swr_init(actx);
    	if (re != 0)
    		char buf[1024] = { 0 };
    		av_strerror(re, buf, sizeof(buf) - 1);
    		cout << "swr_init  failed! :" << buf << endl;
    		return -1;
    	unsigned char* pcm = NULL;
    	for (;;)
    		int re = av_read_frame(ic, pkt);
    		if (re != 0)
    			cout << "==============================end==============================" << endl;
    			int ms = 3000; //三秒位置 根据时间基数(分数)转换
    			long long pos = (double)ms / (double)1000 * r2d(ic->streams[pkt->stream_index]->time_base);
    			av_seek_frame(ic, videoStream, pos, AVSEEK_FLAG_BACKWARD | AVSEEK_FLAG_FRAME);
    		cout << "pkt->size = " << pkt->size << endl;
    		cout << "pkt->pts = " << pkt->pts << "(单位:秒)" << endl;
    		cout << "pkt->pts ms = " << pkt->pts * (r2d(ic->streams[pkt->stream_index]->time_base) * 1000) << "(单位:毫秒)" << endl;
    		cout << "pkt->dts = " << pkt->dts << endl;
    		AVCodecContext* cc = 0;
    		if (pkt->stream_index == videoStream)
    			cout << "图像" << endl;
    			cc = vc;
    		if (pkt->stream_index == audioStream)
    			cout << "音频" << endl;
    			cc = ac;
    		//发送packet到解码线程  send传NULL后调用多次receive取出所有缓冲帧
    		re = avcodec_send_packet(cc, pkt);
    		//释放,引用计数-1 为0释放空间
    		if (re != 0)
    			char buf[1024] = { 0 };
    			av_strerror(re, buf, sizeof(buf) - 1);
    			cout << "avcodec_send_packet  failed! :" << buf << endl;
    		for (;;)
    			re = avcodec_receive_frame(cc, frame);
    			if (re != 0) break;
    			if (cc == vc) {//视频
    				cout << "recv frame format      = " << frame->format << endl;
    				cout << "recv frame linesize[0] = " << frame->linesize[0] << endl;
    				cout << "recv frame linesize[1] = " << frame->linesize[1] << endl;
    				cout << "recv frame linesize[2] = " << frame->linesize[2] << endl;
    				//cout << endl;
    			}else {//音频
    				cout << "recv frame format      = " << frame->format << endl;
    				cout << "recv frame linesize[0] = " << frame->linesize[0] << endl;
    				cout << "recv frame nb_samples  = " << frame->nb_samples << endl;
    			if (cc == vc)
    				vctx = sws_getCachedContext(
    					vctx,	//传NULL会新创建
    					frame->width, frame->height,	//输入的宽高
    					(AVPixelFormat)frame->format,	//输入格式 YUV420p
    					frame->width, frame->height,	//输出的宽高
    					AV_PIX_FMT_RGBA,				//输出格式RGBA
    					SWS_BILINEAR,					//尺寸变化的算法
    					0, 0, 0);
    					//cout << "像素格式尺寸转换上下文创建或者获取成功!" << endl;
    				//	cout << "像素格式尺寸转换上下文创建或者获取失败!" << endl;
    				if (vctx)
    					if (!rgb) rgb = new unsigned char[frame->width * frame->height * 4];
    					uint8_t* data[2] = { 0 };
    					data[0] = rgb;
    					int lines[2] = { 0 };
    					lines[0] = frame->width * 4;
    					re = sws_scale(vctx,
    						frame->data,		//输入数据
    						frame->linesize,	//输入行大小
    						frame->height,		//输入高度
    						data,				//输出数据和大小
    					cout << "sws_scale = " << re << endl;
    			else //音频
    				uint8_t* data[2] = { 0 };
    				if (!pcm) pcm = new uint8_t[frame->nb_samples * 2 * 2];
    				data[0] = pcm;
    				re = swr_convert(actx,
    					data, frame->nb_samples,		//输出
    					(const uint8_t**)frame->data, frame->nb_samples	//输入
    				cout << "swr_convert = " << re << endl;
    	if (ic)
    	return 0;
    FFMPEG av_seek_frame

