20#include <freerdp/config.h>
28#include <freerdp/channels/log.h>
29#include <freerdp/client/tsmf.h>
31#include <libavcodec/avcodec.h>
32#include <libavutil/common.h>
33#include <libavutil/cpu.h>
34#include <libavutil/imgutils.h>
36#include "tsmf_constants.h"
37#include "tsmf_decoder.h"
38#include "tsmf_audio.h"
/*
 * Compatibility shims for older FFmpeg/libav releases. Each version guard
 * below supplies names this file uses that the older release lacks or spells
 * differently.
 * NOTE(review): the #else / #endif lines closing these guards are not visible
 * in this extract.
 */
41#if LIBAVUTIL_VERSION_MAJOR < 50
42#define AVMEDIA_TYPE_VIDEO 0
43#define AVMEDIA_TYPE_AUDIO 1
/* MAX_AUDIO_FRAME_SIZE: byte count used to size and grow the decoded audio buffer. */
46#if LIBAVCODEC_VERSION_MAJOR < 54
47#define MAX_AUDIO_FRAME_SIZE AVCODEC_MAX_AUDIO_FRAME_SIZE
49#define MAX_AUDIO_FRAME_SIZE 192000
/* libavcodec < 55 spells the codec identifiers CODEC_ID_* instead of AV_CODEC_ID_*. */
52#if LIBAVCODEC_VERSION_MAJOR < 55
53#define AV_CODEC_ID_VC1 CODEC_ID_VC1
54#define AV_CODEC_ID_WMAV2 CODEC_ID_WMAV2
55#define AV_CODEC_ID_WMAPRO CODEC_ID_WMAPRO
56#define AV_CODEC_ID_MP3 CODEC_ID_MP3
57#define AV_CODEC_ID_MP2 CODEC_ID_MP2
58#define AV_CODEC_ID_MPEG2VIDEO CODEC_ID_MPEG2VIDEO
59#define AV_CODEC_ID_WMV3 CODEC_ID_WMV3
60#define AV_CODEC_ID_AAC CODEC_ID_AAC
61#define AV_CODEC_ID_H264 CODEC_ID_H264
62#define AV_CODEC_ID_AC3 CODEC_ID_AC3
/* Before libavcodec 56.34.2 the "truncated" capability/flag lack the AV_ prefix. */
65#if LIBAVCODEC_VERSION_INT < AV_VERSION_INT(56, 34, 2)
66#define AV_CODEC_CAP_TRUNCATED CODEC_CAP_TRUNCATED
67#define AV_CODEC_FLAG_TRUNCATED CODEC_FLAG_TRUNCATED
/* libavutil < 52 spells the pixel format PIX_FMT_YUV420P. */
70#if LIBAVUTIL_VERSION_MAJOR < 52
71#define AV_PIX_FMT_YUV420P PIX_FMT_YUV420P
/*
 * Visible members of the decoder state structure (cast target
 * TSMFFFmpegDecoder in the functions below).
 * NOTE(review): the struct header, several members and the closing line are
 * not visible in this extract.
 */
/* Codec identifier passed to avcodec_find_decoder(); the enum's type name depends on the libavcodec major version. */
79#if LIBAVCODEC_VERSION_MAJOR < 55
80 enum CodecID codec_id;
82 enum AVCodecID codec_id;
/* Codec context allocated with avcodec_alloc_context3() in tsmf_ffmpeg_init_context(). */
84 AVCodecContext* codec_context;
/* Current capacity, in bytes, of the decoded-data buffer used by the audio decode path. */
91 UINT32 decoded_size_max;
/**
 * Allocate the FFmpeg codec context for this decoder instance.
 *
 * The context is obtained from avcodec_alloc_context3(NULL) and stored in
 * mdecoder->codec_context. An error is logged when the allocation fails.
 *
 * @param decoder decoder interface pointer; cast to TSMFFFmpegDecoder*
 *
 * NOTE(review): the return statements are not visible in this extract;
 * presumably FALSE after the error log and TRUE otherwise - confirm.
 */
94static BOOL tsmf_ffmpeg_init_context(ITSMFDecoder* decoder)
96 TSMFFFmpegDecoder* mdecoder = (TSMFFFmpegDecoder*)decoder;
97 mdecoder->codec_context = avcodec_alloc_context3(NULL);
99 if (!mdecoder->codec_context)
101 WLog_ERR(TAG,
"avcodec_alloc_context failed.");
/**
 * Copy the video parameters of a media type into the codec context and
 * allocate the frame that receives decoded pictures.
 *
 * @param decoder    decoder interface pointer; cast to TSMFFFmpegDecoder*
 * @param media_type source of Width, Height, BitRate and SamplesPerSecond
 *
 * NOTE(review): the return statement(s) are not visible in this extract, and
 * no check of the frame allocation result is visible either.
 */
108static BOOL tsmf_ffmpeg_init_video_stream(ITSMFDecoder* decoder,
const TS_AM_MEDIA_TYPE* media_type)
110 TSMFFFmpegDecoder* mdecoder = (TSMFFFmpegDecoder*)decoder;
/* Each value is narrowed to int through WINPR_ASSERTING_INT_CAST. */
111 mdecoder->codec_context->width = WINPR_ASSERTING_INT_CAST(
int, media_type->Width);
112 mdecoder->codec_context->height = WINPR_ASSERTING_INT_CAST(
int, media_type->Height);
113 mdecoder->codec_context->bit_rate = WINPR_ASSERTING_INT_CAST(
int, media_type->BitRate);
/* time_base gets SamplesPerSecond inverted: its numerator becomes .den and its denominator becomes .num. */
114 mdecoder->codec_context->time_base.den =
115 WINPR_ASSERTING_INT_CAST(
int, media_type->SamplesPerSecond.Numerator);
116 mdecoder->codec_context->time_base.num =
117 WINPR_ASSERTING_INT_CAST(
int, media_type->SamplesPerSecond.Denominator);
/* The frame allocator was renamed in libavcodec 55. */
118#if LIBAVCODEC_VERSION_MAJOR < 55
119 mdecoder->frame = avcodec_alloc_frame();
121 mdecoder->frame = av_frame_alloc();
/**
 * Copy the audio parameters of a media type into the codec context and
 * select the CPU feature flags FFmpeg should use.
 *
 * @param decoder    decoder interface pointer; cast to TSMFFFmpegDecoder*
 * @param media_type source of SamplesPerSecond, BitRate, Channels, BlockAlign
 *
 * NOTE(review): the #else/#endif lines and the return statement are not
 * visible in this extract, so the exact nesting of the version guards below
 * cannot be confirmed from here.
 */
126static BOOL tsmf_ffmpeg_init_audio_stream(ITSMFDecoder* decoder,
const TS_AM_MEDIA_TYPE* media_type)
128 TSMFFFmpegDecoder* mdecoder = (TSMFFFmpegDecoder*)decoder;
/* Only the numerator of SamplesPerSecond is used as the sample rate. */
129 mdecoder->codec_context->sample_rate =
130 WINPR_ASSERTING_INT_CAST(
int, media_type->SamplesPerSecond.Numerator);
131 mdecoder->codec_context->bit_rate = WINPR_ASSERTING_INT_CAST(
int, media_type->BitRate);
/* From libavutil 57.28.100 the channel count is stored in ch_layout.nb_channels; older versions use the channels field. */
132#if LIBAVUTIL_VERSION_INT >= AV_VERSION_INT(57, 28, 100)
133 mdecoder->codec_context->ch_layout.nb_channels =
134 WINPR_ASSERTING_INT_CAST(
int, media_type->Channels);
136 mdecoder->codec_context->channels = WINPR_ASSERTING_INT_CAST(
int, media_type->Channels);
138 mdecoder->codec_context->block_align = WINPR_ASSERTING_INT_CAST(
int, media_type->BlockAlign);
/*
 * CPU flag selection: an SSE2 | MMX2/MMXEXT mask is applied either through
 * the context's dsp_mask field (libavcodec < 55) or through
 * av_set_cpu_flags_mask() / av_force_cpu_flags(), depending on version.
 */
139#if LIBAVCODEC_VERSION_MAJOR < 55
140#ifdef AV_CPU_FLAG_SSE2
141 mdecoder->codec_context->dsp_mask = AV_CPU_FLAG_SSE2 | AV_CPU_FLAG_MMX2;
143#if LIBAVCODEC_VERSION_MAJOR < 53
144 mdecoder->codec_context->dsp_mask = FF_MM_SSE2 | FF_MM_MMXEXT;
146 mdecoder->codec_context->dsp_mask = FF_MM_SSE2 | FF_MM_MMX2;
150#ifdef AV_CPU_FLAG_SSE2
151#if LIBAVUTIL_VERSION_INT < AV_VERSION_INT(57, 17, 100)
152 av_set_cpu_flags_mask(AV_CPU_FLAG_SSE2 | AV_CPU_FLAG_MMXEXT);
154 av_force_cpu_flags(AV_CPU_FLAG_SSE2 | AV_CPU_FLAG_MMXEXT);
157 av_set_cpu_flags_mask(FF_MM_SSE2 | FF_MM_MMX2);
/**
 * Look up the FFmpeg decoder for mdecoder->codec_id, configure the codec
 * context for the stream (video or audio) and install the codec extradata.
 *
 * Extradata handling:
 *  - the destination buffer is allocated with ExtraDataSize + 8 bytes;
 *  - for SubType AVC1 with FormatType MPEG2VIDEOINFO the extradata is
 *    repacked field by field from media_type->ExtraData;
 *  - otherwise ExtraData is copied verbatim and the trailing 8 bytes are
 *    zeroed.
 *
 * @param decoder    decoder interface pointer; cast to TSMFFFmpegDecoder*
 * @param media_type negotiated media type, including optional ExtraData
 *
 * NOTE(review): braces, else branches, several declarations (p, size,
 * required), the constant header-byte writes and all return statements are
 * not visible in this extract.
 */
163static BOOL tsmf_ffmpeg_init_stream(ITSMFDecoder* decoder,
const TS_AM_MEDIA_TYPE* media_type)
167 const BYTE* s = NULL;
168 TSMFFFmpegDecoder* mdecoder = (TSMFFFmpegDecoder*)decoder;
/* The lookup is wrapped in a diagnostic push/pop that ignores qualifier warnings. */
170 WINPR_PRAGMA_DIAG_PUSH
171 WINPR_PRAGMA_DIAG_IGNORED_QUALIFIERS
172 mdecoder->codec = avcodec_find_decoder(mdecoder->codec_id);
173 WINPR_PRAGMA_DIAG_POP
175 if (!mdecoder->codec)
177 WLog_ERR(TAG,
"avcodec_find_decoder failed.");
181 mdecoder->codec_context->codec_id = mdecoder->codec_id;
182 mdecoder->codec_context->codec_type = mdecoder->media_type;
/* Per-media-type parameter setup; any other media_type value is logged as unknown. */
184 switch (mdecoder->media_type)
186 case AVMEDIA_TYPE_VIDEO:
187 if (!tsmf_ffmpeg_init_video_stream(decoder, media_type))
192 case AVMEDIA_TYPE_AUDIO:
193 if (!tsmf_ffmpeg_init_audio_stream(decoder, media_type))
199 WLog_ERR(TAG,
"unknown media_type %d", mdecoder->media_type);
203 if (media_type->ExtraData)
/* Destination is sized 8 bytes larger than the source extradata. */
206 mdecoder->codec_context->extradata_size =
207 WINPR_ASSERTING_INT_CAST(
int, media_type->ExtraDataSize + 8);
/* NOTE(review): the action taken when the computed size is 0 is not visible here. */
208 if (mdecoder->codec_context->extradata_size == 0)
210 mdecoder->codec_context->extradata = calloc(1, mdecoder->codec_context->extradata_size);
212 if (!mdecoder->codec_context->extradata)
215 if (media_type->SubType == TSMF_SUB_TYPE_AVC1 &&
216 media_type->FormatType == TSMF_FORMAT_TYPE_MPEG2VIDEOINFO)
/*
 * Repacking path. `required` tracks how many destination bytes are needed so
 * far and is compared against extradata_size before each write.
 * NOTE(review): the visible checks bound the destination only; no visible
 * check confirms that ExtraDataSize covers source offsets 8, 12 and 20
 * onwards - confirm against the full source.
 */
221 p = mdecoder->codec_context->extradata;
222 if ((mdecoder->codec_context->extradata_size < 0) ||
223 ((
size_t)mdecoder->codec_context->extradata_size < required))
226 *p++ = media_type->ExtraData[8];
228 *p++ = media_type->ExtraData[12];
/* First block starts at source offset 20: a 2-byte big-endian length followed by that many bytes; length prefix and payload are copied together. */
231 s = media_type->ExtraData + 20;
232 size = ((UINT32)(*s)) * 256 + ((UINT32)(*(s + 1)));
233 required += size + 2;
234 if ((mdecoder->codec_context->extradata_size < 0) ||
235 ((size_t)mdecoder->codec_context->extradata_size < required))
237 memcpy(p, s, size + 2);
241 if ((mdecoder->codec_context->extradata_size < 0) ||
242 ((
size_t)mdecoder->codec_context->extradata_size < required))
/* Second length-prefixed block, same layout. NOTE(review): the statements advancing s and p between the two blocks are not visible here. */
245 size = ((UINT32)(*s)) * 256 + ((UINT32)(*(s + 1)));
246 required += size + 2;
247 if ((mdecoder->codec_context->extradata_size < 0) ||
248 ((size_t)mdecoder->codec_context->extradata_size < required))
250 memcpy(p, s, size + 2);
/*
 * Generic path: verbatim copy, then zero the 8 padding bytes.
 * NOTE(review): the size check comes after the memcpy; the buffer was sized
 * ExtraDataSize + 8 above so the copy fits, but check-before-copy would be
 * the conventional order.
 */
254 memcpy(mdecoder->codec_context->extradata, media_type->ExtraData,
255 media_type->ExtraDataSize);
256 if ((mdecoder->codec_context->extradata_size < 0) ||
257 ((
size_t)mdecoder->codec_context->extradata_size <
258 media_type->ExtraDataSize + 8ull))
260 memset(mdecoder->codec_context->extradata + media_type->ExtraDataSize, 0, 8);
/* Only for libavcodec < 59.18.100: enable the truncated flag when the codec advertises that capability. */
264#if LIBAVCODEC_VERSION_INT < AV_VERSION_INT(59, 18, 100)
265 if (mdecoder->codec->capabilities & AV_CODEC_CAP_TRUNCATED)
266 mdecoder->codec_context->flags |= AV_CODEC_FLAG_TRUNCATED;
/**
 * Open the codec selected in mdecoder->codec on mdecoder->codec_context.
 *
 * Logs an error when avcodec_open2() reports failure (negative result);
 * sets mdecoder->prepared to 1 on the path that follows.
 *
 * @param decoder decoder interface pointer; cast to TSMFFFmpegDecoder*
 *
 * NOTE(review): the return statements are not visible in this extract.
 */
272static BOOL tsmf_ffmpeg_prepare(ITSMFDecoder* decoder)
274 TSMFFFmpegDecoder* mdecoder = (TSMFFFmpegDecoder*)decoder;
276 if (avcodec_open2(mdecoder->codec_context, mdecoder->codec, NULL) < 0)
278 WLog_ERR(TAG,
"avcodec_open2 failed.");
/* tsmf_ffmpeg_free() consults this flag on the older-libavcodec teardown path. */
282 mdecoder->prepared = 1;
/**
 * Configure the decoder for a negotiated media type.
 *
 * Maps media_type->MajorType to an FFmpeg media type and media_type->SubType
 * to an FFmpeg codec id, then runs tsmf_ffmpeg_init_context(),
 * tsmf_ffmpeg_init_stream() and tsmf_ffmpeg_prepare() in that order.
 *
 * @param decoder    decoder interface pointer; cast to TSMFFFmpegDecoder*
 * @param media_type media type to apply. Not const: ExtraData and
 *                   ExtraDataSize may be adjusted in place (see below).
 *
 * NOTE(review): break/default/return lines are not visible in this extract,
 * so the handling of unsupported major/sub types cannot be described here.
 */
286static BOOL tsmf_ffmpeg_set_format(ITSMFDecoder* decoder,
TS_AM_MEDIA_TYPE* media_type)
288 TSMFFFmpegDecoder* mdecoder = (TSMFFFmpegDecoder*)decoder;
290 WINPR_ASSERT(mdecoder);
291 WINPR_ASSERT(media_type);
/* Major type selects video vs. audio handling. */
293 switch (media_type->MajorType)
295 case TSMF_MAJOR_TYPE_VIDEO:
296 mdecoder->media_type = AVMEDIA_TYPE_VIDEO;
299 case TSMF_MAJOR_TYPE_AUDIO:
300 mdecoder->media_type = AVMEDIA_TYPE_AUDIO;
/* Sub type selects the FFmpeg codec. */
307 switch (media_type->SubType)
309 case TSMF_SUB_TYPE_WVC1:
310 mdecoder->codec_id = AV_CODEC_ID_VC1;
313 case TSMF_SUB_TYPE_WMA2:
314 mdecoder->codec_id = AV_CODEC_ID_WMAV2;
317 case TSMF_SUB_TYPE_WMA9:
318 mdecoder->codec_id = AV_CODEC_ID_WMAPRO;
321 case TSMF_SUB_TYPE_MP3:
322 mdecoder->codec_id = AV_CODEC_ID_MP3;
325 case TSMF_SUB_TYPE_MP2A:
326 mdecoder->codec_id = AV_CODEC_ID_MP2;
329 case TSMF_SUB_TYPE_MP2V:
330 mdecoder->codec_id = AV_CODEC_ID_MPEG2VIDEO;
333 case TSMF_SUB_TYPE_WMV3:
334 mdecoder->codec_id = AV_CODEC_ID_WMV3;
337 case TSMF_SUB_TYPE_AAC:
338 mdecoder->codec_id = AV_CODEC_ID_AAC;
/*
 * The first 12 bytes of ExtraData are skipped by advancing the caller's
 * pointer and shrinking the caller's size. This appears to belong to the AAC
 * case above - confirm. NOTE(review): the action for ExtraDataSize < 12 is
 * not visible here.
 */
343 if (media_type->ExtraData)
345 if (media_type->ExtraDataSize < 12)
348 media_type->ExtraData += 12;
349 media_type->ExtraDataSize -= 12;
354 case TSMF_SUB_TYPE_H264:
355 case TSMF_SUB_TYPE_AVC1:
356 mdecoder->codec_id = AV_CODEC_ID_H264;
359 case TSMF_SUB_TYPE_AC3:
360 mdecoder->codec_id = AV_CODEC_ID_AC3;
/* Three-step bring-up: allocate context, configure stream, open codec. */
367 if (!tsmf_ffmpeg_init_context(decoder))
370 if (!tsmf_ffmpeg_init_stream(decoder, media_type))
373 if (!tsmf_ffmpeg_prepare(decoder))
/**
 * Decode one video sample and store the resulting picture, tightly packed,
 * in mdecoder->decoded_data / mdecoder->decoded_size.
 *
 * @param decoder   decoder interface pointer; cast to TSMFFFmpegDecoder*
 * @param data      encoded sample bytes
 * @param data_size number of bytes in data
 *
 * NOTE(review): the last parameter line (the body reads `extensions`), the
 * declarations of len/decoded, braces, else branches and return statements
 * are not visible in this extract.
 */
379static BOOL tsmf_ffmpeg_decode_video(ITSMFDecoder* decoder,
const BYTE* data, UINT32 data_size,
382 TSMFFFmpegDecoder* mdecoder = (TSMFFFmpegDecoder*)decoder;
385 AVFrame* frame = NULL;
/* Decode API selection by libavcodec version: avcodec_decode_video (<= 52.20), avcodec_decode_video2, or send_packet/receive_frame. */
387#if LIBAVCODEC_VERSION_MAJOR < 52 || \
388 (LIBAVCODEC_VERSION_MAJOR == 52 && LIBAVCODEC_VERSION_MINOR <= 20)
389 len = avcodec_decode_video(mdecoder->codec_context, mdecoder->frame, &decoded, data, data_size);
392 AVPacket pkt = { 0 };
393#if LIBAVCODEC_VERSION_INT < AV_VERSION_INT(58, 133, 100)
394 av_init_packet(&pkt);
/* The packet borrows the caller's buffer; const is cast away because AVPacket.data is non-const. */
396 pkt.data = WINPR_CAST_CONST_PTR_AWAY(data, BYTE*);
397 pkt.size = WINPR_ASSERTING_INT_CAST(
int, data_size);
/* Samples flagged as clean points are marked as key frames for FFmpeg. */
399 if (extensions & TSMM_SAMPLE_EXT_CLEANPOINT)
400 pkt.flags |= AV_PKT_FLAG_KEY;
402#if LIBAVCODEC_VERSION_INT < AV_VERSION_INT(57, 48, 101)
403 len = avcodec_decode_video2(mdecoder->codec_context, mdecoder->frame, &decoded, &pkt);
405 len = avcodec_send_packet(mdecoder->codec_context, &pkt);
408 len = avcodec_receive_frame(mdecoder->codec_context, mdecoder->frame);
/* NOTE(review): the handling of EAGAIN from avcodec_receive_frame is not visible here. */
409 if (len == AVERROR(EAGAIN))
418 WLog_ERR(TAG,
"data_size %" PRIu32
", avcodec_decode_video failed (%d)", data_size, len);
423 WLog_ERR(TAG,
"data_size %" PRIu32
", no frame is decoded.", data_size);
428 DEBUG_TSMF(
"linesize[0] %d linesize[1] %d linesize[2] %d linesize[3] %d "
429 "pix_fmt %d width %d height %d",
430 mdecoder->frame->linesize[0], mdecoder->frame->linesize[1],
431 mdecoder->frame->linesize[2], mdecoder->frame->linesize[3],
432 mdecoder->codec_context->pix_fmt, mdecoder->codec_context->width,
433 mdecoder->codec_context->height);
/*
 * Output buffer size for the picture with alignment 1 (no row padding).
 * NOTE(review): av_image_get_buffer_size() returns a negative value on
 * error; no check of the result is visible before it is used as the
 * allocation size - confirm.
 */
434 mdecoder->decoded_size = av_image_get_buffer_size(mdecoder->codec_context->pix_fmt,
435 mdecoder->codec_context->width,
436 mdecoder->codec_context->height, 1);
437 mdecoder->decoded_data = calloc(1, mdecoder->decoded_size);
439 if (!mdecoder->decoded_data)
/*
 * A scratch AVFrame is used only to carry plane pointers/linesizes that
 * describe decoded_data.
 * NOTE(review): no check of the allocation result and no release of this
 * frame are visible in this extract - confirm.
 */
442#if LIBAVCODEC_VERSION_MAJOR < 55
443 frame = avcodec_alloc_frame();
445 frame = av_frame_alloc();
447 av_image_fill_arrays(frame->data, frame->linesize, mdecoder->decoded_data,
448 mdecoder->codec_context->pix_fmt, mdecoder->codec_context->width,
449 mdecoder->codec_context->height, 1);
/* av_image_copy() takes const source pointers, so the decoded frame's plane pointers are copied into a const array first. */
451 const uint8_t* ptr[AV_NUM_DATA_POINTERS] = { 0 };
452 for (
size_t x = 0; x < AV_NUM_DATA_POINTERS; x++)
453 ptr[x] = mdecoder->frame->data[x];
/* Copy the decoded planes into the packed output buffer. */
455 av_image_copy(frame->data, frame->linesize, ptr, mdecoder->frame->linesize,
456 mdecoder->codec_context->pix_fmt, mdecoder->codec_context->width,
457 mdecoder->codec_context->height);
/**
 * Decode an audio sample and accumulate the decoded bytes in
 * mdecoder->decoded_data / mdecoder->decoded_size.
 *
 * Decoded bytes are written at a 16-byte aligned position inside the buffer
 * and moved to the start of the buffer once decoding is finished.
 *
 * @param decoder   decoder interface pointer; cast to TSMFFFmpegDecoder*
 * @param data      encoded sample bytes
 * @param data_size number of bytes in data
 *
 * NOTE(review): the last parameter line, the declarations of len /
 * frame_size / got_frame, the loop header, braces, else branches, the
 * consumption of src/src_size and the return statements are not visible in
 * this extract.
 */
464static BOOL tsmf_ffmpeg_decode_audio(ITSMFDecoder* decoder,
const BYTE* data, UINT32 data_size,
467 TSMFFFmpegDecoder* mdecoder = (TSMFFFmpegDecoder*)decoder;
/* First use: start with one maximum-size audio frame plus 16 bytes of alignment slack. */
471 if (mdecoder->decoded_size_max == 0)
472 mdecoder->decoded_size_max = MAX_AUDIO_FRAME_SIZE + 16;
474 mdecoder->decoded_data = calloc(1, mdecoder->decoded_size_max);
476 if (!mdecoder->decoded_data)
/* dst is decoded_data rounded up to the next 16-byte boundary; dst_offset records how far that is from the buffer start. */
480 BYTE* dst = (BYTE*)(((uintptr_t)mdecoder->decoded_data + 15) & ~0x0F);
481 size_t dst_offset = (size_t)(dst - mdecoder->decoded_data);
482 const BYTE* src = data;
483 UINT32 src_size = data_size;
/* Grow the buffer (2x + 16) whenever less than one maximum-size frame of room remains. */
488 if (mdecoder->decoded_size_max - mdecoder->decoded_size < MAX_AUDIO_FRAME_SIZE)
490 BYTE* tmp_data = NULL;
491 tmp_data = realloc(mdecoder->decoded_data, mdecoder->decoded_size_max * 2 + 16);
496 mdecoder->decoded_size_max = mdecoder->decoded_size_max * 2 + 16;
497 mdecoder->decoded_data = tmp_data;
/* Recompute the aligned write base for the reallocated buffer. */
498 dst = (BYTE*)(((uintptr_t)mdecoder->decoded_data + 15) & ~0x0F);
/* If the alignment offset differs from the old one, move the already decoded bytes to the new aligned position. */
500 const size_t diff = (size_t)(dst - mdecoder->decoded_data);
501 if (diff != dst_offset)
504 memmove(dst, mdecoder->decoded_data + dst_offset, mdecoder->decoded_size);
/* Continue writing after the bytes decoded so far. */
508 dst += mdecoder->decoded_size;
/* Decode API selection by libavcodec version: avcodec_decode_audio2 (<= 52.20), avcodec_decode_audio4, or send_packet/receive_frame. */
511#if LIBAVCODEC_VERSION_MAJOR < 52 || \
512 (LIBAVCODEC_VERSION_MAJOR == 52 && LIBAVCODEC_VERSION_MINOR <= 20)
513 frame_size = mdecoder->decoded_size_max - mdecoder->decoded_size;
514 len = avcodec_decode_audio2(mdecoder->codec_context, (int16_t*)dst, &frame_size, src,
518#if LIBAVCODEC_VERSION_MAJOR < 55
519 AVFrame* decoded_frame = avcodec_alloc_frame();
521 AVFrame* decoded_frame = av_frame_alloc();
524 AVPacket pkt = { 0 };
525#if LIBAVCODEC_VERSION_INT < AV_VERSION_INT(58, 133, 100)
526 av_init_packet(&pkt);
/* The packet borrows the remaining input; const is cast away because AVPacket.data is non-const. */
529 pkt.data = WINPR_CAST_CONST_PTR_AWAY(src, BYTE*);
530 pkt.size = WINPR_ASSERTING_INT_CAST(
int, src_size);
531#if LIBAVCODEC_VERSION_INT < AV_VERSION_INT(57, 48, 101)
532 len = avcodec_decode_audio4(mdecoder->codec_context, decoded_frame, &got_frame, &pkt);
534 len = avcodec_send_packet(mdecoder->codec_context, &pkt);
537 len = avcodec_receive_frame(mdecoder->codec_context, decoded_frame);
/* NOTE(review): the handling of EAGAIN from avcodec_receive_frame is not visible here. */
538 if (len == AVERROR(EAGAIN))
543 if (len >= 0 && got_frame)
545#if LIBAVUTIL_VERSION_INT >= AV_VERSION_INT(57, 28, 100)
546 const int channels = mdecoder->codec_context->ch_layout.nb_channels;
548 const int channels = mdecoder->codec_context->channels;
/*
 * Byte size of the decoded samples (alignment 1), then copy from data[0].
 * NOTE(review): only data[0] is copied; for planar sample formats that
 * plane presumably holds a single channel - confirm. No check of a negative
 * av_samples_get_buffer_size() result is visible before the memcpy.
 */
550 frame_size = av_samples_get_buffer_size(NULL, channels, decoded_frame->nb_samples,
551 mdecoder->codec_context->sample_fmt, 1);
552 memcpy(dst, decoded_frame->data[0], frame_size);
/*
 * NOTE(review): FFmpeg documents av_frame_free() as the release function
 * for frames obtained from av_frame_alloc(); av_free() releases only the
 * struct itself - confirm whether buffers referenced by the frame leak.
 */
559 av_free(decoded_frame);
571 mdecoder->decoded_size += frame_size;
/* Nothing decoded: drop the buffer so no empty allocation is handed out. */
576 if (mdecoder->decoded_size == 0)
578 free(mdecoder->decoded_data);
579 mdecoder->decoded_data = NULL;
/* Otherwise move the decoded bytes from the aligned position to the start of the buffer. */
584 memmove(mdecoder->decoded_data, mdecoder->decoded_data + dst_offset,
585 mdecoder->decoded_size);
588 DEBUG_TSMF(
"data_size %" PRIu32
" decoded_size %" PRIu32
"", data_size, mdecoder->decoded_size);
/**
 * Decode one sample, dispatching on the configured media type.
 *
 * Any decoded data left over from a previous call is freed and the decoded
 * size is reset to 0 before decoding. Video samples go to
 * tsmf_ffmpeg_decode_video(), audio samples to tsmf_ffmpeg_decode_audio();
 * any other media type is logged as unknown.
 *
 * @param decoder   decoder interface pointer; cast to TSMFFFmpegDecoder*
 * @param data      encoded sample bytes
 * @param data_size number of bytes in data
 *
 * NOTE(review): the last parameter line (the body forwards `extensions`)
 * and the return after the error log are not visible in this extract.
 */
592static BOOL tsmf_ffmpeg_decode(ITSMFDecoder* decoder,
const BYTE* data, UINT32 data_size,
595 TSMFFFmpegDecoder* mdecoder = (TSMFFFmpegDecoder*)decoder;
/* Discard output that was never fetched through GetDecodedData. */
597 if (mdecoder->decoded_data)
599 free(mdecoder->decoded_data);
600 mdecoder->decoded_data = NULL;
603 mdecoder->decoded_size = 0;
605 switch (mdecoder->media_type)
607 case AVMEDIA_TYPE_VIDEO:
608 return tsmf_ffmpeg_decode_video(decoder, data, data_size, extensions);
610 case AVMEDIA_TYPE_AUDIO:
611 return tsmf_ffmpeg_decode_audio(decoder, data, data_size, extensions);
614 WLog_ERR(TAG,
"unknown media type.");
/**
 * Hand out the buffer produced by the last decode call.
 *
 * Writes the decoded byte count to *size, takes the buffer pointer and then
 * clears the decoder's pointer and size, so the decoder no longer references
 * the buffer afterwards.
 *
 * @param decoder decoder interface pointer; cast to TSMFFFmpegDecoder*
 * @param size    receives the decoded size in bytes; dereferenced without a
 *                NULL check
 *
 * NOTE(review): the declaration of buf and the return statement are not
 * visible in this extract; presumably buf is returned and the caller becomes
 * responsible for freeing it - confirm.
 */
619static BYTE* tsmf_ffmpeg_get_decoded_data(ITSMFDecoder* decoder, UINT32* size)
622 TSMFFFmpegDecoder* mdecoder = (TSMFFFmpegDecoder*)decoder;
623 *size = mdecoder->decoded_size;
624 buf = mdecoder->decoded_data;
625 mdecoder->decoded_data = NULL;
626 mdecoder->decoded_size = 0;
/**
 * Report the pixel format of decoded video in RDP terms.
 *
 * AV_PIX_FMT_YUV420P maps to RDP_PIXFMT_I420; any other pixel format of the
 * codec context is logged as unsupported.
 *
 * @param decoder decoder interface pointer; cast to TSMFFFmpegDecoder*
 *
 * NOTE(review): the value returned for unsupported formats is not visible in
 * this extract.
 */
630static UINT32 tsmf_ffmpeg_get_decoded_format(ITSMFDecoder* decoder)
632 TSMFFFmpegDecoder* mdecoder = (TSMFFFmpegDecoder*)decoder;
634 switch (mdecoder->codec_context->pix_fmt)
636 case AV_PIX_FMT_YUV420P:
637 return RDP_PIXFMT_I420;
640 WLog_ERR(TAG,
"unsupported pixel format %d", mdecoder->codec_context->pix_fmt);
/**
 * Report the picture dimensions currently held by the codec context.
 *
 * *width and *height are written only when both context values are
 * strictly positive.
 *
 * @param decoder decoder interface pointer; cast to TSMFFFmpegDecoder*
 * @param width   receives codec_context->width
 * @param height  receives codec_context->height
 *
 * NOTE(review): the return statements are not visible in this extract;
 * presumably TRUE when the dimensions were written and FALSE otherwise -
 * confirm.
 */
645static BOOL tsmf_ffmpeg_get_decoded_dimension(ITSMFDecoder* decoder, UINT32* width, UINT32* height)
647 TSMFFFmpegDecoder* mdecoder = (TSMFFFmpegDecoder*)decoder;
649 if (mdecoder->codec_context->width > 0 && mdecoder->codec_context->height > 0)
651 *width = mdecoder->codec_context->width;
652 *height = mdecoder->codec_context->height;
/**
 * Release the resources held by a decoder instance: the decode frame, any
 * pending decoded data and the codec context with its extradata.
 *
 * @param decoder decoder interface pointer; cast to TSMFFFmpegDecoder*
 *
 * NOTE(review): braces, the #else/#endif lines and the tail of the function
 * are not visible in this extract.
 */
661static void tsmf_ffmpeg_free(ITSMFDecoder* decoder)
663 TSMFFFmpegDecoder* mdecoder = (TSMFFFmpegDecoder*)decoder;
/*
 * NOTE(review): on newer libavcodec the frame comes from av_frame_alloc(),
 * for which FFmpeg documents av_frame_free() as the release function -
 * confirm whether av_free() leaves frame-owned buffers behind.
 */
666 av_free(mdecoder->frame);
668 free(mdecoder->decoded_data);
670 if (mdecoder->codec_context)
/* extradata was allocated with calloc() in tsmf_ffmpeg_init_stream(), so it is released with free() and cleared before the context itself is torn down. */
672 free(mdecoder->codec_context->extradata);
673 mdecoder->codec_context->extradata = NULL;
/* From libavcodec 55.69.100 avcodec_free_context() is used; the other path closes the codec only if it was opened (prepared) and then frees the context. */
675#if LIBAVCODEC_VERSION_INT >= AV_VERSION_INT(55, 69, 100)
676 avcodec_free_context(&mdecoder->codec_context);
678 if (mdecoder->prepared)
679 avcodec_close(mdecoder->codec_context);
681 av_free(mdecoder->codec_context);
/* One-time initialisation state consumed by InitOnceExecuteOnce() in the subsystem entry point. */
688static INIT_ONCE g_Initialized = INIT_ONCE_STATIC_INIT;
/**
 * InitOnce callback performing global libavcodec setup.
 *
 * avcodec_register_all() is called only when building against libavcodec
 * older than 58.10.100.
 *
 * NOTE(review): the return statement is not visible in this extract. None of
 * the three parameters is used in the visible lines.
 */
689static BOOL CALLBACK InitializeAvCodecs(
PINIT_ONCE once, PVOID param, PVOID* context)
691#if LIBAVCODEC_VERSION_INT < AV_VERSION_INT(58, 10, 100)
692 avcodec_register_all();
/**
 * Subsystem entry point: create an FFmpeg-backed TSMF decoder and publish
 * its interface.
 *
 * Runs the one-time codec initialisation, allocates a zeroed
 * TSMFFFmpegDecoder, fills in the ITSMFDecoder function pointers and stores
 * the interface address through ptr.
 *
 * @param ptr treated as ITSMFDecoder**; receives &decoder->iface
 * @return CHANNEL_RC_OK after the interface has been stored;
 *         ERROR_OUTOFMEMORY on an earlier path
 *
 * NOTE(review): the condition guarding the ERROR_OUTOFMEMORY return is not
 * visible in this extract (presumably a failed calloc), nor are any lines
 * between the sptr declaration and the decoder declaration.
 */
697FREERDP_ENTRY_POINT(UINT VCAPITYPE ffmpeg_freerdp_tsmf_client_decoder_subsystem_entry(
void* ptr))
699 ITSMFDecoder** sptr = (ITSMFDecoder**)ptr;
703 TSMFFFmpegDecoder* decoder = NULL;
/* The result of InitOnceExecuteOnce() is not checked in the visible code. */
704 InitOnceExecuteOnce(&g_Initialized, InitializeAvCodecs, NULL, NULL);
705 WLog_DBG(TAG,
"TSMFDecoderEntry FFMPEG");
706 decoder = (TSMFFFmpegDecoder*)calloc(1,
sizeof(TSMFFFmpegDecoder));
709 return ERROR_OUTOFMEMORY;
/* Wire the generic decoder interface to the FFmpeg implementations in this file. */
711 decoder->iface.SetFormat = tsmf_ffmpeg_set_format;
712 decoder->iface.Decode = tsmf_ffmpeg_decode;
713 decoder->iface.GetDecodedData = tsmf_ffmpeg_get_decoded_data;
714 decoder->iface.GetDecodedFormat = tsmf_ffmpeg_get_decoded_format;
715 decoder->iface.GetDecodedDimension = tsmf_ffmpeg_get_decoded_dimension;
716 decoder->iface.Free = tsmf_ffmpeg_free;
717 *sptr = &decoder->iface;
718 return CHANNEL_RC_OK;