FFMPEG 实现 YUV，RGB各种图像原始数据之间的转换（swscale）

最新推荐文章于 2024-09-04 14:18:42 发布

最新推荐文章于 2024-09-04 14:18:42 发布 · 874 阅读

文章标签：

本文介绍如何使用FFMPEG库进行视频解码并将解码后的数据转换为YUV420、YUV422、RGB24等不同格式的原始数据文件。关键步骤包括设置转换格式、初始化转换上下文以及根据目标格式保存数据。通过理解FFMPEG中的planar和packed数据布局，可以正确地写入和保存不同格式的图像数据。

摘要生成于 C知道，由 DeepSeek-R1 满血版支持，前往体验 >

FFMPEG中的swscale提供了视频原始数据（YUV420，YUV422，YUV444，RGB24...）之间的转换，分辨率变换等操作，使用起来十分方便，在这里记录一下它的用法。
swscale主要用于在2个AVFrame之间进行转换。

下面来看一个视频解码的简单例子，并将解码后的数据保存为原始数据文件（例如YUV420，YUV422，RGB24等等）。

/**
*  使用FFmpeg解析出H264、YUV数据
*/

#include <stdio.h>

extern "C"
{
#include "libavcodec/avcodec.h"
#include "libavformat/avformat.h"
#include "libswscale/swscale.h"
#include "libavutil/imgutils.h"
};

#pragma comment(lib, "avcodec.lib")
#pragma comment(lib, "avformat.lib")
#pragma comment(lib, "swscale.lib")
#pragma comment(lib, "avutil.lib")

int main(int argc, char* argv[])
{
	AVFormatContext		*pFormatCtx = NULL;
	AVCodecContext		*pCodecCtx = NULL;
	AVCodec				*pCodec = NULL;
	AVFrame				*pFrame = NULL, *pFrameYUV = NULL;
	unsigned char		*out_buffer = NULL;
	AVPacket			packet;
	struct SwsContext	*img_convert_ctx = NULL;
	int					got_picture;
	int					videoIndex;
	int					frame_cnt = 1;

	char filepath[] = "Titanic.ts";
	//char filepath[] = "Forrest_Gump_IMAX.mp4";

	FILE *fp_yuv = fopen("film.yuv", "wb+");
	FILE *fp_h264 = fopen("film.h264", "wb+");
	if (fp_yuv == NULL || fp_h264 == NULL)
	{
		printf("FILE open error");
		return -1;
	}

	av_register_all();

	if (avformat_open_input(&pFormatCtx, filepath, NULL, NULL) != 0){
		printf("Couldn't open an input stream.\n");
		return -1;
	}
	if (avformat_find_stream_info(pFormatCtx, NULL) < 0){
		printf("Couldn't find stream information.\n");
		return -1;
	}
	videoIndex = -1;
	for (int i = 0; i < pFormatCtx->nb_streams; i++)
		if (pFormatCtx->streams[i]->codec->codec_type == AVMEDIA_TYPE_VIDEO){
			videoIndex = i;
			break;
		}

	if (videoIndex == -1){
		printf("Couldn't find a video stream.\n");
		return -1;
	}

	pCodecCtx = pFormatCtx->streams[videoIndex]->codec;
	pCodec = avcodec_find_decoder(pCodecCtx->codec_id);
	if (pCodec == NULL){
		printf("Codec not found.\n");
		return -1;
	}
	if (avcodec_open2(pCodecCtx, pCodec, NULL) < 0){
		printf("Could not open codec.\n");
		return -1;
	}



	pFrame = av_frame_alloc();
	pFrameYUV = av_frame_alloc();
	if (pFrame == NULL || pFrameYUV == NULL)
	{
		printf("memory allocation error\n");
		return -1;
	}

	/**
	*  RGB--------->AV_PIX_FMT_RGB24
	*  YUV420P----->AV_PIX_FMT_YUV420P
	*  UYVY422----->AV_PIX_FMT_UYVY422
	*  YUV422P----->AV_PIX_FMT_YUV422P
	*/
	out_buffer = (unsigned char *)av_malloc(av_image_get_buffer_size(AV_PIX_FMT_YUV420P, pCodecCtx->width, pCodecCtx->height, 1));
	av_image_fill_arrays(pFrameYUV->data, pFrameYUV->linesize, out_buffer,
		AV_PIX_FMT_YUV420P, pCodecCtx->width, pCodecCtx->height, 1);
	img_convert_ctx = sws_getContext(pCodecCtx->width, pCodecCtx->height, pCodecCtx->pix_fmt,
		pCodecCtx->width, pCodecCtx->height, AV_PIX_FMT_YUV420P, SWS_BICUBIC, NULL, NULL, NULL);




	/*
	//针对H.264码流
	unsigned char *dummy = NULL;   //输入的指针  
	int dummy_len;
	const char nal_start[] = { 0, 0, 0, 1 };
	AVBitStreamFilterContext* bsfc = av_bitstream_filter_init("h264_mp4toannexb");
	av_bitstream_filter_filter(bsfc, pCodecCtx, NULL, &dummy, &dummy_len, NULL, 0, 0);
	fwrite(pCodecCtx->extradata, pCodecCtx->extradata_size, 1, fp_h264);
	av_bitstream_filter_close(bsfc);
	free(dummy);
	*/
	while (av_read_frame(pFormatCtx, &packet) >= 0)
	{
		if (packet.stream_index == videoIndex)
		{
			//输出出h.264数据
			fwrite(packet.data, 1, packet.size, fp_h264);
			
			//针对H.264码流
			//fwrite(nal_start, 4, 1, fp_h264);
			//fwrite(packet.data + 4, packet.size - 4, 1, fp_h264);

			if (avcodec_decode_video2(pCodecCtx, pFrame, &got_picture, &packet) < 0)
			{
				printf("Decode Error.\n");
				return -1;
			}
			if (got_picture)
			{
				sws_scale(img_convert_ctx, (const unsigned char* const*)pFrame->data, pFrame->linesize, 0, pCodecCtx->height,
					pFrameYUV->data, pFrameYUV->linesize);

				//输出出YUV数据
				int y_size = pCodecCtx->width * pCodecCtx->height;
				fwrite(pFrameYUV->data[0], 1, y_size, fp_yuv);		//Y 
				fwrite(pFrameYUV->data[1], 1, y_size / 4, fp_yuv);	//U
				fwrite(pFrameYUV->data[2], 1, y_size / 4, fp_yuv);	//V

				/**
				*  输出RGB数据
				*  fwrite(pFrameYUV->data[0], (pCodecCtx->width) * (pCodecCtx->height) * 3, 1, fp);
				*  输出UYVY数据
				*  fwrite(pFrameYUV->data[0], (pCodecCtx->width) * (pCodecCtx->height), 2, fp);
				*/
				
				printf("Succeed to decode %d frame!\n", frame_cnt);
				frame_cnt++;
			}
		}
		av_free_packet(&packet);
	}

	//flush decoder
	//FIX: Flush Frames remained in Codec
	while (true)
	{
		if (avcodec_decode_video2(pCodecCtx, pFrame, &got_picture, &packet) < 0)
		{
			break;
		}
		if (!got_picture)
		{
			break; 
		}
			
		sws_scale(img_convert_ctx, (const unsigned char* const*)pFrame->data, pFrame->linesize, 0, pCodecCtx->height,
			pFrameYUV->data, pFrameYUV->linesize);

		int y_size = pCodecCtx->width * pCodecCtx->height;
		fwrite(pFrameYUV->data[0], 1, y_size, fp_yuv);		//Y 
		fwrite(pFrameYUV->data[1], 1, y_size / 4, fp_yuv);	//U
		fwrite(pFrameYUV->data[2], 1, y_size / 4, fp_yuv);	//V

		printf("Flush Decoder: Succeed to decode %d frame!\n", frame_cnt);
		frame_cnt++;
	}


	fclose(fp_yuv);
	fclose(fp_h264);
	sws_freeContext(img_convert_ctx);
	av_free(out_buffer);
	av_frame_free(&pFrameYUV);
	av_frame_free(&pFrame);
	avcodec_close(pCodecCtx);
	avformat_close_input(&pFormatCtx);

	return 0;
}

从代码中可以看出，解码后的视频帧数据保存在pFrame变量中，然后经过swscale函数转换后，将视频帧数据保存在pFrameYUV变量中。最后将pFrameYUV中的数据写入成文件。

在上面的代码中，将数据保存成了YUV420P的格式。如果想保存成其他格式，比如RGB24，YUV422等，需要做2个步骤：

1.初始化pFrameYUV的时候，设定想要转换的格式：

[cpp]view plaincopy 
   
 AVFrame*pFrame,*pFrameYUV; 
 pFrame=avcodec_alloc_frame(); 
 pFrameYUV=avcodec_alloc_frame(); 
 uint8_t*out_buffer; 
  
 out_buffer=new uint8_t[avpicture_get_size(PIX_FMT_RGB24,pCodecCtx->width,pCodecCtx->height)]; 
 avpicture_fill((AVPicture*)pFrameYUV,out_buffer,PIX_FMT_RGB24,pCodecCtx->width,pCodecCtx->height);