1. Support one-to-many mode; so far only tested with one student.

2. Add a macro to support FFmpeg libavcodec major version 58, which needs PCM in AV_SAMPLE_FMT_FLTP format when encoding AAC.

1. Support one-to-many mode; so far only tested with one student.
2. Add a macro to support FFmpeg libavcodec major version 58, which needs PCM in AV_SAMPLE_FMT_FLTP format when encoding AAC.
胡斌
Commit b564d2b313f32cd870d3a4e7bfdd47118cef49da b564d2b3 1 parent fc96f84b
pip/AVTranscoder.cpp
pip/AVTranscoder.h
pip/AudioDecoder.cpp
pip/media_info.h
pip/merge_pip.cpp
--- a/pip/AVTranscoder.cpp
查看文件 @b564d2b
+++ b/pip/AVTranscoder.cpp
查看文件 @b564d2b
@@ -11,24 +11,36 @@ extern "C" {
 #define SRC_W 320
 #define SRC_H 240
-CAVTranscoder::CAVTranscoder():
+CAVTranscoder::CAVTranscoder(bool bOne2One):
 _start_time(INT64_MAX),
 _all_processed(true),
-_one2one(true),
 _nOutputWidth(320),
 _cur_out_v_ts(0),
 _cur_out_a_ts(0),
 _max_audio(1),
-_swsCtx(NULL)
+_swsCtx(NULL),
+_scaledFrame(NULL)
 {
+	_one2one = bOne2One;
 	if (_one2one) {
 		_nOutputHeight = 480;
 	}
 	else {
 		_nOutputHeight = 240;
-		_swsCtx = sws_getContext(SRC_W, SRC_H, PIX_FMT_YUV420P,
-			SCALED_W, SCALED_H, PIX_FMT_YUV420P, SWS_BILINEAR,
+		_swsCtx = sws_getContext(SRC_W, SRC_H, AV_PIX_FMT_YUV420P,
+			SCALED_W, SCALED_H, AV_PIX_FMT_YUV420P, SWS_BILINEAR,
 			NULL, NULL, NULL);
+		_scaledFrame = av_frame_alloc();
+		_scaledFrame->format = AV_PIX_FMT_YUV420P;
+		_scaledFrame->width = SCALED_W;
+		_scaledFrame->height = SCALED_H;
+		_scaledFrame->pts = 0;
+
+		int ret = av_frame_get_buffer(_scaledFrame, 32);
+		if (ret != 0)
+		{
+			printf("Error alloc frame buffer for scaling video frame");
+		}
 	}
 }
@@ -113,6 +125,10 @@ int CAVTranscoder::close()
 		sws_freeContext(_swsCtx);
 		_swsCtx = NULL;
 	}
+	if (_scaledFrame) {
+		av_frame_unref(_scaledFrame);
+		av_frame_free(&_scaledFrame);
+	}
 	flush_encoder(0);
 	flush_encoder(1);
 	av_write_trailer(_ofmt_ctx);
@@ -214,7 +230,7 @@ int CAVTranscoder::open_output_file(const char *filename)
 				enc_ctx->channel_layout = AV_CH_LAYOUT_MONO;
 				enc_ctx->channels = av_get_channel_layout_nb_channels(AV_CH_LAYOUT_MONO);
 				/* take first format from list of supported formats */
-				enc_ctx->sample_fmt = AV_SAMPLE_FMT_S16; //AV_SAMPLE_FMT_FLTP;
+				enc_ctx->sample_fmt = PCM_FORMAT_FOR_AAC_ENCODE; //AV_SAMPLE_FMT_FLTP;
 				enc_ctx->time_base.num = 1;
 				enc_ctx->time_base.den = enc_ctx->sample_rate;
 				enc_ctx->bit_rate = 64000;
@@ -264,7 +280,7 @@ int CAVTranscoder::open_output_file(const char *filename)
 		pDstFrame->nb_samples = 1024;
 		pDstFrame->channel_layout = AV_CH_LAYOUT_MONO;
 		pDstFrame->channels = av_get_channel_layout_nb_channels(AV_CH_LAYOUT_MONO);
-		pDstFrame->format = AV_SAMPLE_FMT_S16;
+		pDstFrame->format = PCM_FORMAT_FOR_AAC_ENCODE;
 		pDstFrame->sample_rate = 48000;
 		av_frame_get_buffer(pDstFrame, 0);
@@ -273,8 +289,13 @@ int CAVTranscoder::open_output_file(const char *filename)
 		for (; it != decoders_got_frame.end(); it++) {
 			AVFrame * pFrame = (*it)->_cur_a_frame;
 			if (pFrame) {
+#if LIBAVCODEC_VERSION_MAJOR < 58
 				int16_t * psrc = (int16_t *)pFrame->extended_data[0];
 				int16_t * pdst = (int16_t *)pDstFrame->extended_data[0];
+#else
+				float * psrc = (float *)pFrame->extended_data[0];
+				float * pdst = (float *)pDstFrame->extended_data[0];
+#endif
 				for (int i = 0; i < 1024; i++,pdst++,psrc++) {
 					*pdst += (*psrc/_max_audio);
 				}
@@ -310,41 +331,43 @@ int CAVTranscoder::open_output_file(const char *filename)
 		uint8_t *dstbuf = new uint8_t[nDstSize];
 		avpicture_fill((AVPicture*)pDstFrame, dstbuf, AV_PIX_FMT_YUV420P, _nOutputWidth, _nOutputHeight);
+		bool fill_pure_color = true;
 		if (idxTeacher != -1) {
 			//copy teacher frame to dest frame
 			CAVDecoder * pDecoder = decoders_got_frame[idxTeacher];
 			AVFrame * pFrame = pDecoder->_cur_v_frame;
 			if (pFrame) {
 				fillDestFrame(pDstFrame, pFrame, 0, 0);
+				fill_pure_color = false;
+				pDecoder->free_cur_v_frame();
 			}
-			else {//fill with pure color
+		}
+		if(fill_pure_color){//fill with pure color
 				memset(pDstFrame->data[0], 0, _nOutputWidth * _nOutputHeight);
 				memset(pDstFrame->data[1], 0x80, _nOutputWidth *_nOutputHeight / 4);
 				memset(pDstFrame->data[2], 0x80, _nOutputWidth * _nOutputHeight / 4);
-			}
-
-			for (int i = 0; i < decoders_got_frame.size(); i++){
-				if (i != idxTeacher) {
-					//scale eacher frame
-
-					//copy each frame to the dest frame
-
-				}
-			}
 		}
-		else {
-			memset(pDstFrame->data[0], 0, _nOutputWidth * _nOutputHeight);
-			memset(pDstFrame->data[1], 0x80, _nOutputWidth *_nOutputHeight / 4);
-			memset(pDstFrame->data[2], 0x80, _nOutputWidth * _nOutputHeight / 4);
-				for (int i = 0; i < decoders_got_frame.size(); i++){
-					if (i != idxTeacher) {
-						//scale eacher frame
-
-						//copy each frame to the dest frame
-
-					}
+		int imageIdx = 0;
+		for (int i = 0; i < decoders_got_frame.size(); i++){
+			if (i != idxTeacher) {
+				//scale eacher frame
+				CAVDecoder * pDecoder = decoders_got_frame[i];
+				AVFrame * pFrame = pDecoder->_cur_v_frame;
+				if (!pFrame) {
+					continue;
 				}
+				int h = sws_scale(_swsCtx, pFrame->data, pFrame->linesize, 0, pFrame->height,
+					_scaledFrame->data, _scaledFrame->linesize);
+				if (h <= 0){
+					printf("scale output 0?");
+				}
+				
+				//copy each frame to the dest frame
+				fillDestFrame(pDstFrame, _scaledFrame, SRC_W - SCALED_H - ((imageIdx % 4) * SCALED_H), SRC_H - SCALED_H - (SCALED_H + 8)*imageIdx / 4, (SCALED_W - SCALED_H) / 2, 0, SCALED_H, SCALED_H);
+				pDecoder->free_cur_v_frame();
+				imageIdx++;
+			}
 		}
 		//fill the timestamp of dest frame
@@ -381,6 +404,19 @@ int CAVTranscoder::open_output_file(const char *filename)
 		return 0;
 	}
+	/**
+	 * Copy a w x h rectangle from a source frame into a destination frame,
+	 * plane by plane. The chroma planes are addressed at half the luma
+	 * coordinates in both directions (4:2:0 layout, one byte per sample).
+	 *
+	 * @param pDstFrame  frame written to through data[0..2] / linesize[0..2]
+	 * @param pSrcFrame  frame read from through data[0..2] / linesize[0..2]
+	 * @param x          left edge of the rectangle in the destination, in luma pixels
+	 * @param y          top edge of the rectangle in the destination, in luma pixels
+	 * @param srcx       left edge of the rectangle in the source, in luma pixels
+	 * @param srcy       top edge of the rectangle in the source, in luma pixels
+	 * @param w          rectangle width in luma pixels
+	 * @param h          rectangle height in luma pixels
+	 * @return always 0
+	 *
+	 * No bounds checking is performed here; the caller must make sure the
+	 * rectangle lies inside both frames.
+	 */
+	int CAVTranscoder::fillDestFrame(AVFrame * pDstFrame, AVFrame * pSrcFrame, int x, int y, int srcx, int srcy, int w, int h)
+	{
+		// Luma plane: copy w bytes per row. The row length is w regardless of
+		// the sign of linesize (a negative stride only reverses the row order).
+		for (int i = 0; i < h; i++)	{
+			memcpy(pDstFrame->data[0] + (y + i)*pDstFrame->linesize[0] + x,
+				pSrcFrame->data[0] + (i + srcy) * pSrcFrame->linesize[0] + srcx,
+				w);
+		}

+		// Chroma planes: half resolution, so every coordinate is halved. The
+		// horizontal source offset (srcx / 2) must be applied here as well,
+		// otherwise the colour is taken from a different column than the luma.
+		for (int i = 0; i < h / 2; i++){
+			memcpy(pDstFrame->data[1] + (y / 2 + i)*pDstFrame->linesize[1] + x / 2,
+				pSrcFrame->data[1] + (i + srcy / 2) * pSrcFrame->linesize[1] + srcx / 2,
+				w / 2);
+			memcpy(pDstFrame->data[2] + (y / 2 + i)*pDstFrame->linesize[2] + x / 2,
+				pSrcFrame->data[2] + (i + srcy / 2) * pSrcFrame->linesize[2] + srcx / 2,
+				w / 2);
+		}
+		return 0;
+	}
+
 	int CAVTranscoder::mix_and_output_one2one_vframe(vector<CAVDecoder *> & decoders_got_frame)
 	{
 		//prepare one2one base frame
--- a/pip/AVTranscoder.h
查看文件 @b564d2b
+++ b/pip/AVTranscoder.h
查看文件 @b564d2b
@@ -5,7 +5,7 @@
 class CAVTranscoder
 {
 public:
-	CAVTranscoder();
+	CAVTranscoder(bool bOne2One);
 	virtual ~CAVTranscoder();
 	int add(media_info & info);
@@ -35,12 +35,14 @@ private:
 	int mix_and_output_one2many_vframe(vector<CAVDecoder *> & decoders_got_frame);
 	int fillDestFrame(AVFrame * pDstFrame, AVFrame * pSrcFrame, int x, int y);
+	int fillDestFrame(AVFrame * pDstFrame, AVFrame * pSrcFrame, int destx, int desty, int srcx,int srcy,int w,int h);
 	int encode_write_frame(AVFrame *filt_frame, unsigned int stream_index, int *got_frame);
 	int flush_encoder(unsigned int stream_index);
 	void * _a_frame_pool;
 	int _max_audio;
 	struct SwsContext * _swsCtx;
+	AVFrame * _scaledFrame;
 public:
 	void set_max_audio(int max_audio);
 };
--- a/pip/AudioDecoder.cpp
查看文件 @b564d2b
+++ b/pip/AudioDecoder.cpp
查看文件 @b564d2b
@@ -123,7 +123,7 @@ int CAudioDecoder::init_filter(FilteringContext* fctx, AVCodecContext *dec_ctx,
 			av_log(NULL, AV_LOG_ERROR, "Cannot create audio buffer sink\n");
 			goto end;
 		}
-		enum AVSampleFormat sample_fmt = AV_SAMPLE_FMT_S16;
+		enum AVSampleFormat sample_fmt = PCM_FORMAT_FOR_AAC_ENCODE;
 		ret = av_opt_set_bin(buffersink_ctx, "sample_fmts",
 			(uint8_t*)&sample_fmt, sizeof(sample_fmt),
 			AV_OPT_SEARCH_CHILDREN);
--- a/pip/media_info.h
查看文件 @b564d2b
+++ b/pip/media_info.h
查看文件 @b564d2b
 #pragma  once
-
+#define  __STDC_LIMIT_MACROS
 #include <string>
 #include <vector>
 #include <stdint.h>
@@ -78,4 +78,10 @@ typedef struct FilteringContext {
 #define AFRAME_DURATION_MS 21.333333
-#define VFRAME_DURATION_MS 50
+#define VFRAME_DURATION_MS 50
+
+#if LIBAVCODEC_VERSION_MAJOR < 58
+#define PCM_FORMAT_FOR_AAC_ENCODE  AV_SAMPLE_FMT_S16
+#else
+#define PCM_FORMAT_FOR_AAC_ENCODE  AV_SAMPLE_FMT_FLTP
+#endif
--- a/pip/merge_pip.cpp
查看文件 @b564d2b
+++ b/pip/merge_pip.cpp
查看文件 @b564d2b
@@ -954,7 +954,7 @@ int process_av_files()
 	av_register_all();
 	avfilter_register_all();
-	CAVTranscoder videoTranscoder;
+	CAVTranscoder videoTranscoder(max_audio==2);
 	videoTranscoder.set_max_audio(max_audio);
 	int64_t cur_time = 0;