-
Notifications
You must be signed in to change notification settings - Fork 2
Expand file tree
/
Copy pathVideoStreamEncoder.cpp
More file actions
156 lines (129 loc) · 4.46 KB
/
VideoStreamEncoder.cpp
File metadata and controls
156 lines (129 loc) · 4.46 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
#include "VideoStreamEncoder.h"

#include <new>

#include <QTime>

#include "Params.h"
// Construct the encoder wrapper and bring up the FFmpeg pipeline.
//
// bufSize      - size of the output bitstream buffer; values <= 1 abort setup.
// videoWidth/videoHeight - frame dimensions fed to the codec context.
// fps          - frames per second (becomes the stream time base denominator).
// pixelFormat  - pixel format of the incoming OpenCV images.
//
// On any failure `initialized` stays false and encodeVideoFrame() refuses to run.
VideoStreamEncoder::VideoStreamEncoder(size_t bufSize, int videoWidth, int videoHeight, int fps, PixelFormat pixelFormat){
    this->bufSize = bufSize;
    this->videoWidth = videoWidth;
    this->videoHeight = videoHeight;
    this->fps = fps;
    this->openCVPixelFormat = pixelFormat;
    initialized = false;
    // BUG FIX: buffer must be NULL before any early return, otherwise the
    // destructor deletes an uninitialized pointer (undefined behavior).
    buffer = NULL;
    if (bufSize <= 1) {
        return;
    }
    buffer = new unsigned char[bufSize];
    if (initEncoder())
        initialized = true;
}
// Release the output bitstream buffer.
// BUG FIX: `buffer` is allocated with new[], so it must be released with
// delete[] (plain delete on an array is undefined behavior). delete[] on a
// NULL pointer is a no-op, so no explicit NULL check is needed.
// NOTE(review): the AVFrames/format context allocated in initEncoder() are
// never freed here — pre-existing leak, left as-is to avoid double-free risk.
VideoStreamEncoder::~VideoStreamEncoder() {
    delete[] buffer;
}
// Look up the encoder for the stream's codec id and open the codec context.
// Returns true on success, false if the codec is missing or fails to open.
bool VideoStreamEncoder::openCodec(AVStream *stream) {
    AVCodecContext *codecContext = stream->codec;
    AVCodec *codec = avcodec_find_encoder(codecContext->codec_id);
    if (!codec) {
        fprintf(stderr, "Codec not found\n");
        // BUG FIX: previously fell through and passed a NULL codec to
        // avcodec_open, which crashes. Fail cleanly instead.
        return false;
    }
    if (avcodec_open(codecContext, codec) < 0) {
        fprintf(stderr, "Could not open codec\n");
        return false;
    }
    return true;
}
// Allocate an AVFrame plus a pixel buffer large enough for one
// videoWidth x videoHeight picture in `pixel_format`, and wire the buffer
// into the frame's data/linesize pointers. Returns NULL on any failure.
// NOTE(review): the pixel buffer intentionally lives as long as the frame and
// is never freed by this class (pre-existing design).
AVFrame *VideoStreamEncoder::createAVFrame(PixelFormat pixel_format) {
    AVFrame *frame = avcodec_alloc_frame();
    if (!frame)
        return NULL;
    int picSize = avpicture_get_size(pixel_format, videoWidth, videoHeight);
    // BUG FIX: avpicture_get_size can return a negative error code; sizing an
    // array with it would be disastrous.
    if (picSize < 0) {
        av_free(frame);
        return NULL;
    }
    // BUG FIX: plain new[] throws on failure, so the original NULL check was
    // dead code and the frame leaked on OOM. nothrow makes the check real.
    unsigned char *picBuffer = new (std::nothrow) unsigned char[picSize];
    if (!picBuffer) {
        av_free(frame);
        return NULL;
    }
    avpicture_fill((AVPicture *)frame, picBuffer, pixel_format, videoWidth, videoHeight);
    return frame;
}
// Create a video stream on the muxer context and fill in its codec context
// from the encoder settings (constants come from Params.h).
// Returns the new stream, or NULL if allocation fails.
AVStream *VideoStreamEncoder::createVideoStream(AVFormatContext *fmtContext) {
    AVStream *st = av_new_stream(fmtContext, 0);
    if (st == NULL) {
        fprintf(stderr, "Could not alloc stream\n");
        return NULL;
    }
    AVCodecContext *cc = st->codec;
    cc->codec_type = AVMEDIA_TYPE_VIDEO;
    cc->codec_id = (CodecID) (ENCODING_CODEC);
    cc->width = videoWidth;
    cc->height = videoHeight;
    cc->bit_rate = STREAM_BIT_RATE;
    cc->gop_size = GROUP_OF_PICTURES;
    cc->pix_fmt = RAW_STREAM_FORMAT;
    // Time base is the reciprocal of the frame rate: one tick per frame.
    cc->time_base.num = 1;
    cc->time_base.den = fps;
    if (ENCODING_CODEC == CODEC_ID_H264) {
        // Constrained baseline at a low level keeps the stream playable on
        // simple decoders.
        cc->profile = FF_PROFILE_H264_CONSTRAINED_BASELINE;
        cc->level = 1;
    }
    return st;
}
// Bring up the whole FFmpeg encode pipeline: register codecs, pick the output
// format, build the format context and video stream, open the codec, and
// allocate the two working frames (one in the codec's pixel format, one in the
// OpenCV input format). Returns false on any failure.
bool VideoStreamEncoder::initEncoder() {
    av_register_all();
    outputFormat = av_guess_format(ENCODING_STRING, NULL, NULL);
    if (!outputFormat) {
        fprintf(stderr, "Could not find suitable output format for %s\n", ENCODING_STRING);
        return false;
    }
    // NOTE(review): this mutates the (shared) format description returned by
    // av_guess_format — kept as-is since the rest of the file relies on it.
    outputFormat->video_codec = ENCODING_CODEC;
    fmtContext = avformat_alloc_context();
    if (!fmtContext) {
        fprintf(stderr, "Can not alloc format context\n");
        return false;
    }
    fmtContext->oformat = outputFormat;
    videoStream = createVideoStream(fmtContext);
    if (!videoStream)
        return false;
    // must be done even if no parameters are needed
    if(av_set_parameters(fmtContext, NULL) < 0) {
        fprintf(stderr, "Invalid output format parameters\n");
        return false;
    }
    if (!openCodec(videoStream))
        return false;
    readyToEncodeFrame = createAVFrame(videoStream->codec->pix_fmt);
    openCVFrame = createAVFrame(openCVPixelFormat);
    // BUG FIX: createAVFrame can return NULL; previously this reported success
    // anyway and encodeVideoFrame() would dereference NULL frames later.
    if (!readyToEncodeFrame || !openCVFrame) {
        fprintf(stderr, "Could not allocate video frames\n");
        return false;
    }
    return true;
}
// Convert one OpenCV image to the codec pixel format and encode it.
//
// image   - input frame; must match the width/height/format configured at
//           construction (only the byte size is validated here).
// outSize - out param: number of encoded bytes written to the internal buffer.
//
// Returns a pointer to the internal bitstream buffer (valid until the next
// call), or NULL on any failure. Not thread-safe (static pts counter,
// shared buffer).
const unsigned char *VideoStreamEncoder::encodeVideoFrame(IplImage *image, int *outSize) {
    if (image == NULL)
        return NULL;
    if (!initialized) {
        fprintf(stderr, "Initial class failed\n");
        return NULL;
    }
    // BUG FIX: imageSize is a signed int while bufSize is size_t; compare in
    // a signed-safe way so a (corrupt) negative size can never pass.
    if (image->imageSize < 0 || (size_t)image->imageSize > bufSize) {
        fprintf(stderr, "image size too large.\n");
        return NULL;
    }
    AVCodecContext *codecContext = videoStream->codec;
    // Borrow OpenCV's pixel buffer directly instead of memcpy'ing it into
    // openCVFrame — avoids a full-frame copy per call.
    openCVFrame->data[0] = (uint8_t *)image->imageData;
    int width = codecContext->width;
    int height = codecContext->height;
    struct SwsContext *imgConvertCtx = sws_getContext(width, height, openCVPixelFormat, width, height, codecContext->pix_fmt, SWS_FAST_BILINEAR, NULL, NULL, NULL);
    if (imgConvertCtx == NULL) {
        fprintf(stderr, "Could not create scaler context\n");
        return NULL;
    }
    sws_scale(imgConvertCtx, openCVFrame->data, openCVFrame->linesize, 0, height, readyToEncodeFrame->data, readyToEncodeFrame->linesize);
    // BUG FIX: the scaler context was leaked on every frame.
    sws_freeContext(imgConvertCtx);
    // H264 requires strictly monotonically increasing pts, so set it manually.
    if (ENCODING_CODEC == CODEC_ID_H264) {
        static long frameNum = 0;
        readyToEncodeFrame->pts = 90 * frameNum;
        frameNum += 40;
    }
    // (Removed dead QTime timing code whose measured duration was never used.)
    int encodedSize = avcodec_encode_video(codecContext, buffer, bufSize, readyToEncodeFrame);
    // BUG FIX: a negative return is an encode error; previously it was handed
    // to the caller through *outSize as if it were a valid payload size.
    if (encodedSize < 0) {
        fprintf(stderr, "Frame encoding failed\n");
        return NULL;
    }
    *outSize = encodedSize;
    return buffer;
}