2 * Copyright 2012 Michael Chen <omxcodec@gmail.com>
3 * Copyright 2015 The CyanogenMod Project
5 * Licensed under the Apache License, Version 2.0 (the "License");
6 * you may not use this file except in compliance with the License.
7 * You may obtain a copy of the License at
9 * http://www.apache.org/licenses/LICENSE-2.0
11 * Unless required by applicable law or agreed to in writing, software
12 * distributed under the License is distributed on an "AS IS" BASIS,
13 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14 * See the License for the specific language governing permissions and
15 * limitations under the License.
18 //#define LOG_NDEBUG 0
19 #define LOG_TAG "FFmpegExtractor"
20 #include <utils/Log.h>
23 #include <limits.h> /* INT_MAX */
25 #include <sys/prctl.h>
27 #include <utils/misc.h>
28 #include <utils/String8.h>
29 #include <cutils/properties.h>
30 #include <media/stagefright/foundation/ABitReader.h>
31 #include <media/stagefright/foundation/ABuffer.h>
32 #include <media/stagefright/foundation/ADebug.h>
33 #include <media/stagefright/foundation/AMessage.h>
34 #include <media/stagefright/foundation/hexdump.h>
35 #include <media/stagefright/DataSource.h>
36 #include <media/stagefright/MediaBuffer.h>
37 #include <media/stagefright/foundation/ADebug.h>
38 #include <media/stagefright/MediaDefs.h>
39 #include <media/stagefright/MediaErrors.h>
40 #include <media/stagefright/MediaSource.h>
41 #include <media/stagefright/MetaData.h>
42 #include <media/stagefright/Utils.h>
43 #include "include/avc_utils.h"
45 #include "utils/codec_utils.h"
46 #include "utils/ffmpeg_cmdutils.h"
48 #include "FFmpegExtractor.h"
// Limit compared against mAudioQ.size + mVideoQ.size in readerEntry(); above it the
// reader stops pulling packets and backs off.
50 #define MAX_QUEUE_SIZE (15 * 1024 * 1024)
// Audio queue size above which readerEntry() treats the audio queue as filled.
51 #define MIN_AUDIOQ_SIZE (20 * 16 * 1024)
// Bound on mProbePkts while the constructor waits for deferred tracks to be created.
53 #define EXTRACTOR_MAX_PROBE_PACKETS 200
// Upper bound applied in readerEntry() to the extradata size reported by parser_split().
54 #define FF_MAX_EXTRADATA_SIZE ((1 << 28) - FF_INPUT_BUFFER_PADDING_SIZE)
// Compile-time switch tested with #if inside FFmpegSource::read().
56 #define WAIT_KEY_PACKET_AFTER_SEEK 1
// NOTE(review): identifier is spelled "SUPPOURT"; presumably enables the
// "give unknown codecs a chance" paths — confirm against its use sites.
57 #define SUPPOURT_UNKNOWN_FORMAT 1
// Debug switches (0 = off). DEBUG_READ_ENTRY guards the verbose queue-full log in
// readerEntry(); DEBUG_DISABLE_VIDEO / DEBUG_DISABLE_AUDIO are tested in
// setFFmpegDefaultOpts().
60 #define DEBUG_READ_ENTRY 0
61 #define DEBUG_DISABLE_VIDEO 0
62 #define DEBUG_DISABLE_AUDIO 0
// NOTE(review): no use of DEBUG_FORMATS is visible nearby — confirm it is still needed.
64 #define DEBUG_FORMATS 0
// MediaSource implementation for a single track of an FFmpegExtractor. The track is
// selected by an index into the extractor's mTracks vector.
73 struct FFmpegSource : public MediaSource {
// `index` selects the entry of extractor->mTracks that this source reads from.
74 FFmpegSource(const sp<FFmpegExtractor> &extractor, size_t index);
76 virtual status_t start(MetaData *params);
77 virtual status_t stop();
// Returns the MetaData stored for this track in the extractor.
78 virtual sp<MetaData> getFormat();
// Fetches the next packet of this track from its packet queue and wraps it in a MediaBuffer;
// a seek request in `options` is forwarded to the extractor's stream_seek().
80 virtual status_t read(
81 MediaBuffer **buffer, const ReadOptions *options);
84 virtual ~FFmpegSource();
// The extractor is granted access to this struct's non-public members.
87 friend struct FFmpegExtractor;
// Strong reference to the extractor whose track this source reads.
89 sp<FFmpegExtractor> mExtractor;
// Media type of the underlying stream (taken from mStream->codec->codec_type).
92 enum AVMediaType mMediaType;
// For AVC streams: number of bytes used to encode a NAL unit length (from the avcC data).
97 size_t mNALLengthSize;
// Timestamp of the first key packet seen; AV_NOPTS_VALUE until one is recorded.
103 int64_t mFirstKeyPktTimestamp;
107 DISALLOW_EVIL_CONSTRUCTORS(FFmpegSource);
110 ////////////////////////////////////////////////////////////////////////////////
// Builds an extractor over `source`. The sniffed URL and MIME type are pulled out of
// `meta` (fetchStuffsFromSniffedMeta) and the streams are then set up via initStreams().
// While a video or audio track is still deferred, the loop below keeps running until
// mProbePkts exceeds EXTRACTOR_MAX_PROBE_PACKETS, mEOF is set, or the I/O context
// reports an error.
112 FFmpegExtractor::FFmpegExtractor(const sp<DataSource> &source, const sp<AMessage> &meta)
113 : mDataSource(source),
116 mFFmpegInited(false),
118 mReaderThreadStarted(false) {
119 ALOGV("FFmpegExtractor::FFmpegExtractor");
121 fetchStuffsFromSniffedMeta(meta);
123 int err = initStreams();
// Logged on the initStreams() failure path.
125 ALOGE("failed to init ffmpeg");
129 // start reader here, as we want to extract extradata from bitstream if no extradata
// Probe loop: runs only while at least one track is deferred, the probe-packet
// budget is not exhausted, EOF has not been reached and the AVIOContext (if any) has no error.
132 while(mProbePkts <= EXTRACTOR_MAX_PROBE_PACKETS && !mEOF &&
133 (mFormatCtx->pb ? !mFormatCtx->pb->error : 1) &&
134 (mDefersToCreateVideoTrack || mDefersToCreateAudioTrack)) {
135 ALOGV("mProbePkts=%d", mProbePkts);
// Summary of the state that ended the probe loop.
139 ALOGV("mProbePkts: %d, mEOF: %d, pb->error(if has): %d, mDefersToCreateVideoTrack: %d, mDefersToCreateAudioTrack: %d",
140 mProbePkts, mEOF, mFormatCtx->pb ? mFormatCtx->pb->error : 0, mDefersToCreateVideoTrack, mDefersToCreateAudioTrack);
// Destructor: takes mLock for the duration of the teardown.
145 FFmpegExtractor::~FFmpegExtractor() {
146 ALOGV("FFmpegExtractor::~FFmpegExtractor");
147 Mutex::Autolock autoLock(mLock);
148 // stop reader here if no track!
// Returns the number of tracks created so far, or 0 when initialization did not succeed.
154 size_t FFmpegExtractor::countTracks() {
155 return mInitCheck == OK ? mTracks.size() : 0;
// Creates a new FFmpegSource for track `index`. The init state and the index range
// are checked before the source is constructed.
158 sp<MediaSource> FFmpegExtractor::getTrack(size_t index) {
// NOTE(review): `index` is a size_t but is formatted with %d; %zu would match the type.
159 ALOGV("FFmpegExtractor::getTrack[%d]", index);
161 if (mInitCheck != OK) {
165 if (index >= mTracks.size()) {
169 return new FFmpegSource(this, index);
// Returns the MetaData of track `index`. For the video track, kKeyThumbnailTime is
// (re)written on every call to one quarter of the stream duration, rescaled from the
// stream time base to AV_TIME_BASE_Q. `flags` is unused.
172 sp<MetaData> FFmpegExtractor::getTrackMetaData(size_t index, uint32_t flags __unused) {
// NOTE(review): `index` is a size_t but is formatted with %d; %zu would match the type.
173 ALOGV("FFmpegExtractor::getTrackMetaData[%d]", index);
175 if (mInitCheck != OK) {
179 if (index >= mTracks.size()) {
183 /* Quick and dirty, just get a frame 1/4 in */
184 if (mTracks.itemAt(index).mIndex == mVideoStreamIdx) {
// NOTE(review): no AV_NOPTS_VALUE check on the stream duration is visible here
// (setDurationMetaData() does check it) — confirm a missing duration cannot reach this division.
185 int64_t thumb_ts = av_rescale_q((mFormatCtx->streams[mVideoStreamIdx]->duration / 4),
186 mFormatCtx->streams[mVideoStreamIdx]->time_base, AV_TIME_BASE_Q);
187 mTracks.itemAt(index).mMeta->setInt64(kKeyThumbnailTime, thumb_ts);
190 return mTracks.itemAt(index).mMeta;
// Returns container-level metadata; the init state is checked first.
193 sp<MetaData> FFmpegExtractor::getMetaData() {
194 ALOGV("FFmpegExtractor::getMetaData");
196 if (mInitCheck != OK) {
// Reports the extractor capabilities: CAN_PAUSE as the base, plus the three seek
// flags when the container duration is known.
203 uint32_t FFmpegExtractor::flags() const {
204 ALOGV("FFmpegExtractor::flags");
206 if (mInitCheck != OK) {
210 uint32_t flags = CAN_PAUSE;
// Seeking is only advertised when libavformat reported a duration.
212 if (mFormatCtx->duration != AV_NOPTS_VALUE) {
213 flags |= CAN_SEEK_BACKWARD | CAN_SEEK_FORWARD | CAN_SEEK;
// Inspects the extradata of `avctx` and decides whether track creation has to be
// deferred until extradata can be taken from the bitstream.
//  - Only H264, MPEG4, MPEG1VIDEO, MPEG2VIDEO and AAC are examined further.
//  - Non-AAC codecs: when is_extradata_compatible_with_android() reports an
//    incompatibility, the matching mDefersToCreate*Track flag is set and *bsfc is cleared.
//  - AAC: when extradata_size <= 0 the defer flag is set and the "aac_adtstoasc"
//    bitstream filter is opened if none is open yet; if that fails the flag is cleared again.
// Returns an int status that stream_component_open() stores in `ret`.
219 int FFmpegExtractor::check_extradata(AVCodecContext *avctx)
221 enum AVCodecID codec_id = AV_CODEC_ID_NONE;
222 const char *name = NULL;
// NOTE(review): both pointers start as NULL and are dereferenced further down; confirm
// they are always assigned for every media type that can reach those dereferences.
223 bool *defersToCreateTrack = NULL;
224 AVBitStreamFilterContext **bsfc = NULL;
// Select the per-media-type state this call operates on.
227 if (avctx->codec_type == AVMEDIA_TYPE_VIDEO) {
229 defersToCreateTrack = &mDefersToCreateVideoTrack;
230 } else if (avctx->codec_type == AVMEDIA_TYPE_AUDIO){
232 defersToCreateTrack = &mDefersToCreateAudioTrack;
235 codec_id = avctx->codec_id;
// Codecs outside this list are not examined for extradata.
238 if (codec_id != AV_CODEC_ID_H264
239 && codec_id != AV_CODEC_ID_MPEG4
240 && codec_id != AV_CODEC_ID_MPEG1VIDEO
241 && codec_id != AV_CODEC_ID_MPEG2VIDEO
242 && codec_id != AV_CODEC_ID_AAC) {
246 // is extradata compatible with android?
247 if (codec_id != AV_CODEC_ID_AAC) {
248 int is_compatible = is_extradata_compatible_with_android(avctx);
249 if (!is_compatible) {
250 ALOGI("%s extradata is not compatible with android, should to extract it from bitstream",
251 av_get_media_type_string(avctx->codec_type));
252 *defersToCreateTrack = true;
253 *bsfc = NULL; // H264 don't need bsfc, only AAC?
// AAC is the only codec here that gets a bitstream filter name.
259 if (codec_id == AV_CODEC_ID_AAC) {
260 name = "aac_adtstoasc";
263 if (avctx->extradata_size <= 0) {
264 ALOGI("No %s extradata found, should to extract it from bitstream",
265 av_get_media_type_string(avctx->codec_type));
266 *defersToCreateTrack = true;
267 //CHECK(name != NULL);
// Open the filter only once, and only when a filter name was chosen above.
268 if (!*bsfc && name) {
269 *bsfc = av_bitstream_filter_init(name);
// Without the filter the track is no longer deferred.
271 ALOGE("Cannot open the %s BSF!", name);
272 *defersToCreateTrack = false;
275 ALOGV("open the %s bsf", name);
// Logs `time` (expressed in AV_TIME_BASE units) as hours:minutes:seconds.hundredths.
// AV_NOPTS_VALUE is tested for first.
285 void FFmpegExtractor::printTime(int64_t time)
287 int hours, mins, secs, us;
289 if (time == AV_NOPTS_VALUE)
// Split into whole seconds and the sub-second remainder.
292 secs = time / AV_TIME_BASE;
293 us = time % AV_TIME_BASE;
// The remainder is scaled to hundredths of a second for display.
298 ALOGI("the time is %02d:%02d:%02d.%02d",
299 hours, mins, secs, (100 * us) / AV_TIME_BASE);
// Tells whether `codec_id` is one of the codecs this extractor handles explicitly.
// The case labels below enumerate those codecs; other ids reach the "give it a chance" log.
302 bool FFmpegExtractor::is_codec_supported(enum AVCodecID codec_id)
304 bool supported = false;
307 case AV_CODEC_ID_H264:
308 case AV_CODEC_ID_MPEG4:
309 case AV_CODEC_ID_H263:
310 case AV_CODEC_ID_H263P:
311 case AV_CODEC_ID_H263I:
312 case AV_CODEC_ID_AAC:
313 case AV_CODEC_ID_AC3:
314 case AV_CODEC_ID_MP2:
315 case AV_CODEC_ID_MP3:
316 case AV_CODEC_ID_MPEG1VIDEO:
317 case AV_CODEC_ID_MPEG2VIDEO:
318 case AV_CODEC_ID_WMV1:
319 case AV_CODEC_ID_WMV2:
320 case AV_CODEC_ID_WMV3:
321 case AV_CODEC_ID_VC1:
322 case AV_CODEC_ID_WMAV1:
323 case AV_CODEC_ID_WMAV2:
324 case AV_CODEC_ID_WMAPRO:
325 case AV_CODEC_ID_WMALOSSLESS:
326 case AV_CODEC_ID_RV20:
327 case AV_CODEC_ID_RV30:
328 case AV_CODEC_ID_RV40:
329 case AV_CODEC_ID_COOK:
330 case AV_CODEC_ID_APE:
331 case AV_CODEC_ID_DTS:
332 case AV_CODEC_ID_FLAC:
333 case AV_CODEC_ID_FLV1:
334 case AV_CODEC_ID_VORBIS:
335 case AV_CODEC_ID_HEVC:
// NOTE(review): VP8/VP9 have dedicated cases in setVideoFormat() but are not listed
// above — confirm whether they are meant to go through this fallback.
340 ALOGD("unsuppoted codec(%s), but give it a chance",
341 avcodec_get_name(codec_id));
342 //Won't promise that the following codec id can be supported.
343 //Just give these codecs a chance.
// Builds the MetaData describing a video stream. A codec-specific helper produces the
// base metadata; codecs without a dedicated helper get the generic FFmpeg video MIME type,
// the codec id and (when present) the raw extradata. Width, height, bit rate (when > 0)
// and duration are then added.
351 sp<MetaData> FFmpegExtractor::setVideoFormat(AVStream *stream)
353 AVCodecContext *avctx = NULL;
354 sp<MetaData> meta = NULL;
356 avctx = stream->codec;
357 CHECK_EQ(avctx->codec_type, AVMEDIA_TYPE_VIDEO);
359 switch(avctx->codec_id) {
360 case AV_CODEC_ID_H264:
// A first extradata byte of 1 selects the AVC helper, anything else the H264 helper.
// NOTE(review): extradata[0] is read with no visible check that extradata is non-NULL and
// extradata_size > 0 (the FFmpegSource constructor does check the size) — confirm.
361 if (avctx->extradata[0] == 1) {
362 meta = setAVCFormat(avctx);
364 meta = setH264Format(avctx);
367 case AV_CODEC_ID_MPEG4:
368 meta = setMPEG4Format(avctx);
370 case AV_CODEC_ID_H263:
371 case AV_CODEC_ID_H263P:
372 case AV_CODEC_ID_H263I:
373 meta = setH263Format(avctx);
375 case AV_CODEC_ID_MPEG1VIDEO:
376 case AV_CODEC_ID_MPEG2VIDEO:
377 meta = setMPEG2VIDEOFormat(avctx);
379 case AV_CODEC_ID_VC1:
380 meta = setVC1Format(avctx);
382 case AV_CODEC_ID_WMV1:
383 meta = setWMV1Format(avctx);
385 case AV_CODEC_ID_WMV2:
386 meta = setWMV2Format(avctx);
388 case AV_CODEC_ID_WMV3:
389 meta = setWMV3Format(avctx);
391 case AV_CODEC_ID_RV20:
392 meta = setRV20Format(avctx);
394 case AV_CODEC_ID_RV30:
395 meta = setRV30Format(avctx);
397 case AV_CODEC_ID_RV40:
398 meta = setRV40Format(avctx);
400 case AV_CODEC_ID_FLV1:
401 meta = setFLV1Format(avctx);
403 case AV_CODEC_ID_HEVC:
404 meta = setHEVCFormat(avctx);
406 case AV_CODEC_ID_VP8:
407 meta = setVP8Format(avctx);
409 case AV_CODEC_ID_VP9:
410 meta = setVP9Format(avctx);
// Generic fallback: tag the track with the FFmpeg video MIME type and pass the codec id
// plus raw extradata through.
413 ALOGD("unsuppoted video codec(id:%d, name:%s), but give it a chance",
414 avctx->codec_id, avcodec_get_name(avctx->codec_id));
416 meta->setInt32(kKeyCodecId, avctx->codec_id);
417 meta->setCString(kKeyMIMEType, MEDIA_MIMETYPE_VIDEO_FFMPEG);
418 if (avctx->extradata_size > 0) {
419 meta->setData(kKeyRawCodecSpecificData, 0, avctx->extradata, avctx->extradata_size);
421 //CHECK(!"Should not be here. Unsupported codec.");
// Properties common to every video codec.
426 ALOGI("width: %d, height: %d, bit_rate: %d",
427 avctx->width, avctx->height, avctx->bit_rate);
429 meta->setInt32(kKeyWidth, avctx->width);
430 meta->setInt32(kKeyHeight, avctx->height);
// The bit rate is only published when the codec context carries a positive value.
431 if (avctx->bit_rate > 0) {
432 meta->setInt32(kKeyBitRate, avctx->bit_rate);
434 setDurationMetaData(stream, meta);
// Builds the MetaData describing an audio stream. A codec-specific helper produces the
// base metadata; codecs without a dedicated helper get the generic FFmpeg audio MIME type,
// the codec id, the coded sample bits and (when present) the raw extradata. Channel count,
// bit rate, bits per sample, sample rate, block align, sample format and duration are then added.
440 sp<MetaData> FFmpegExtractor::setAudioFormat(AVStream *stream)
442 AVCodecContext *avctx = NULL;
443 sp<MetaData> meta = NULL;
445 avctx = stream->codec;
446 CHECK_EQ(avctx->codec_type, AVMEDIA_TYPE_AUDIO);
448 switch(avctx->codec_id) {
449 case AV_CODEC_ID_MP2:
450 meta = setMP2Format(avctx);
452 case AV_CODEC_ID_MP3:
453 meta = setMP3Format(avctx);
455 case AV_CODEC_ID_VORBIS:
456 meta = setVORBISFormat(avctx);
458 case AV_CODEC_ID_AC3:
459 meta = setAC3Format(avctx);
461 case AV_CODEC_ID_AAC:
462 meta = setAACFormat(avctx);
464 case AV_CODEC_ID_WMAV1:
465 meta = setWMAV1Format(avctx);
467 case AV_CODEC_ID_WMAV2:
468 meta = setWMAV2Format(avctx);
470 case AV_CODEC_ID_WMAPRO:
471 meta = setWMAProFormat(avctx);
473 case AV_CODEC_ID_WMALOSSLESS:
474 meta = setWMALossLessFormat(avctx);
476 case AV_CODEC_ID_COOK:
477 meta = setRAFormat(avctx);
479 case AV_CODEC_ID_APE:
480 meta = setAPEFormat(avctx);
482 case AV_CODEC_ID_DTS:
483 meta = setDTSFormat(avctx);
485 case AV_CODEC_ID_FLAC:
486 meta = setFLACFormat(avctx);
// Generic fallback: tag the track with the FFmpeg audio MIME type and pass the codec id,
// coded sample bits and raw extradata through.
489 ALOGD("unsuppoted audio codec(id:%d, name:%s), but give it a chance",
490 avctx->codec_id, avcodec_get_name(avctx->codec_id));
492 meta->setInt32(kKeyCodecId, avctx->codec_id);
493 meta->setInt32(kKeyCodedSampleBits, avctx->bits_per_coded_sample);
494 meta->setCString(kKeyMIMEType, MEDIA_MIMETYPE_AUDIO_FFMPEG);
495 if (avctx->extradata_size > 0) {
496 meta->setData(kKeyRawCodecSpecificData, 0, avctx->extradata, avctx->extradata_size);
498 //CHECK(!"Should not be here. Unsupported codec.");
// Properties common to every audio codec.
503 ALOGD("bit_rate: %d, sample_rate: %d, channels: %d, "
504 "bits_per_coded_sample: %d, block_align: %d "
505 "bits_per_raw_sample: %d, sample_format: %d",
506 avctx->bit_rate, avctx->sample_rate, avctx->channels,
507 avctx->bits_per_coded_sample, avctx->block_align,
508 avctx->bits_per_raw_sample, avctx->sample_fmt);
510 meta->setInt32(kKeyChannelCount, avctx->channels);
511 meta->setInt32(kKeyBitRate, avctx->bit_rate);
// Sample formats wider than 2 bytes are reported as 24 bits, everything else as 16 bits.
512 meta->setInt32(kKeyBitsPerSample, av_get_bytes_per_sample(avctx->sample_fmt) > 2 ? 24 : 16);
513 meta->setInt32(kKeySampleRate, avctx->sample_rate);
514 meta->setInt32(kKeyBlockAlign, avctx->block_align);
515 meta->setInt32(kKeySampleFormat, avctx->sample_fmt);
516 setDurationMetaData(stream, meta);
// Writes kKeyDuration into `meta`. When the stream has its own duration it is rescaled
// from the stream time base to AV_TIME_BASE_Q; otherwise the container duration
// (mFormatCtx->duration) is used as is.
522 void FFmpegExtractor::setDurationMetaData(AVStream *stream, sp<MetaData> &meta)
524 AVCodecContext *avctx = stream->codec;
526 if (stream->duration != AV_NOPTS_VALUE) {
527 int64_t duration = av_rescale_q(stream->duration, stream->time_base, AV_TIME_BASE_Q);
// The media type string is only used for the start-time log lines.
529 const char *s = av_get_media_type_string(avctx->codec_type);
530 if (stream->start_time != AV_NOPTS_VALUE) {
531 ALOGV("%s startTime:%lld", s, stream->start_time);
533 ALOGV("%s startTime:N/A", s);
535 meta->setInt64(kKeyDuration, duration);
537 // default when no stream duration
// NOTE(review): no AV_NOPTS_VALUE check on mFormatCtx->duration is visible here — confirm.
538 meta->setInt64(kKeyDuration, mFormatCtx->duration);
// Opens stream `stream_index` of mFormatCtx as an extractor track. After validating the
// index, the codec and that no track for this stream exists yet, the stream is switched to
// AVDISCARD_DEFAULT. For video and audio streams the extradata is checked with
// check_extradata(), the format MetaData is built, and a TrackInfo (stream index, metadata,
// AVStream and packet queue) is filled in; the matching mDefersToCreate*Track flag is cleared.
542 int FFmpegExtractor::stream_component_open(int stream_index)
544 TrackInfo *trackInfo = NULL;
545 AVCodecContext *avctx = NULL;
546 sp<MetaData> meta = NULL;
547 bool supported = false;
549 const void *data = NULL;
553 ALOGI("stream_index: %d", stream_index);
// Range check of the requested stream index.
554 if (stream_index < 0 || stream_index >= (int)mFormatCtx->nb_streams)
556 avctx = mFormatCtx->streams[stream_index]->codec;
558 supported = is_codec_supported(avctx->codec_id);
561 ALOGE("unsupport the codec(%s)", avcodec_get_name(avctx->codec_id));
564 ALOGI("support the codec(%s)", avcodec_get_name(avctx->codec_id));
// A stream may back at most one track.
567 for (size_t i = 0; i < mTracks.size(); ++i) {
568 if (stream_index == mTracks.editItemAt(i).mIndex) {
569 ALOGE("this track already exists");
// Let the demuxer deliver packets of this stream again.
574 mFormatCtx->streams[stream_index]->discard = AVDISCARD_DEFAULT;
577 av_get_codec_tag_string(tagbuf, sizeof(tagbuf), avctx->codec_tag);
578 ALOGV("Tag %s/0x%08x with codec(%s)\n", tagbuf, avctx->codec_tag, avcodec_get_name(avctx->codec_id));
580 switch (avctx->codec_type) {
581 case AVMEDIA_TYPE_VIDEO:
// The first video stream opened becomes the extractor's video stream.
582 if (mVideoStreamIdx == -1)
583 mVideoStreamIdx = stream_index;
584 if (mVideoStream == NULL)
585 mVideoStream = mFormatCtx->streams[stream_index];
587 ret = check_extradata(avctx);
590 // disable the stream
591 mVideoStreamIdx = -1;
593 packet_queue_flush(&mVideoQ);
594 mFormatCtx->streams[stream_index]->discard = AVDISCARD_ALL;
599 if (avctx->extradata) {
600 ALOGV("video stream extradata:");
601 hexdump(avctx->extradata, avctx->extradata_size);
603 ALOGV("video stream no extradata, but we can ignore it.");
606 meta = setVideoFormat(mVideoStream);
608 ALOGE("setVideoFormat failed");
612 ALOGV("create a video track");
// Fill in the most recently added track entry.
614 trackInfo = &mTracks.editItemAt(mTracks.size() - 1);
615 trackInfo->mIndex = stream_index;
616 trackInfo->mMeta = meta;
617 trackInfo->mStream = mVideoStream;
618 trackInfo->mQueue = &mVideoQ;
620 mDefersToCreateVideoTrack = false;
623 case AVMEDIA_TYPE_AUDIO:
// The first audio stream opened becomes the extractor's audio stream.
624 if (mAudioStreamIdx == -1)
625 mAudioStreamIdx = stream_index;
626 if (mAudioStream == NULL)
627 mAudioStream = mFormatCtx->streams[stream_index];
629 ret = check_extradata(avctx);
632 // disable the stream
633 mAudioStreamIdx = -1;
635 packet_queue_flush(&mAudioQ);
636 mFormatCtx->streams[stream_index]->discard = AVDISCARD_ALL;
641 if (avctx->extradata) {
642 ALOGV("audio stream extradata(%d):", avctx->extradata_size);
643 hexdump(avctx->extradata, avctx->extradata_size);
645 ALOGV("audio stream no extradata, but we can ignore it.");
648 meta = setAudioFormat(mAudioStream);
650 ALOGE("setAudioFormat failed");
654 ALOGV("create a audio track");
// Fill in the most recently added track entry.
656 trackInfo = &mTracks.editItemAt(mTracks.size() - 1);
657 trackInfo->mIndex = stream_index;
658 trackInfo->mMeta = meta;
659 trackInfo->mStream = mAudioStream;
660 trackInfo->mQueue = &mAudioQ;
662 mDefersToCreateAudioTrack = false;
// Subtitle and any other media types are treated as programming errors.
665 case AVMEDIA_TYPE_SUBTITLE:
667 CHECK(!"Should not be here. Unsupported media type.");
670 CHECK(!"Should not be here. Unsupported media type.");
// Closes stream `stream_index`: the matching packet queue is aborted and flushed, the
// stream is set to AVDISCARD_ALL, the stream index member is reset to -1 and the
// bitstream filter of that media type is closed.
676 void FFmpegExtractor::stream_component_close(int stream_index)
678 AVCodecContext *avctx;
// Range check of the requested stream index.
680 if (stream_index < 0 || stream_index >= (int)mFormatCtx->nb_streams)
682 avctx = mFormatCtx->streams[stream_index]->codec;
// First pass: abort and drain the packet queue.
684 switch (avctx->codec_type) {
685 case AVMEDIA_TYPE_VIDEO:
686 ALOGV("packet_queue_abort videoq");
687 packet_queue_abort(&mVideoQ);
688 ALOGV("packet_queue_end videoq");
689 packet_queue_flush(&mVideoQ);
691 case AVMEDIA_TYPE_AUDIO:
692 ALOGV("packet_queue_abort audioq");
693 packet_queue_abort(&mAudioQ);
694 ALOGV("packet_queue_end audioq");
695 packet_queue_flush(&mAudioQ);
697 case AVMEDIA_TYPE_SUBTITLE:
// Second pass: stop demuxing the stream and release the per-stream state.
703 mFormatCtx->streams[stream_index]->discard = AVDISCARD_ALL;
704 switch (avctx->codec_type) {
705 case AVMEDIA_TYPE_VIDEO:
707 mVideoStreamIdx = -1;
709 av_bitstream_filter_close(mVideoBsfc);
713 case AVMEDIA_TYPE_AUDIO:
715 mAudioStreamIdx = -1;
717 av_bitstream_filter_close(mAudioBsfc);
721 case AVMEDIA_TYPE_SUBTITLE:
// Records, under mLock, that the track of the given media type has reached end of stream.
728 void FFmpegExtractor::reachedEOS(enum AVMediaType media_type)
730 Mutex::Autolock autoLock(mLock);
732 if (media_type == AVMEDIA_TYPE_VIDEO) {
733 mVideoEOSReceived = true;
734 } else if (media_type == AVMEDIA_TYPE_AUDIO) {
735 mAudioEOSReceived = true;
740 /* seek in the stream */
// Requests a seek to `pos` on behalf of the track of type `media_type`. The request is
// posted through mSeekIdx / mSeekMin / mSeekMax for the reader thread, and the caller
// then blocks on mCondition. FFmpegSource::read() compares the result against SEEK.
741 int FFmpegExtractor::stream_seek(int64_t pos, enum AVMediaType media_type,
742 MediaSource::ReadOptions::SeekMode mode)
744 Mutex::Autolock _l(mLock);
// Special-cased: a seek is already pending, or this is the audio track's request while a
// video track exists that has not yet reached end of stream.
746 if (mSeekIdx >= 0 || (mVideoStreamIdx >= 0
747 && mAudioStreamIdx >= 0
748 && media_type == AVMEDIA_TYPE_AUDIO
749 && !mVideoEOSReceived)) {
// Drop everything queued before the seek.
754 if (mAudioStreamIdx >= 0)
755 packet_queue_flush(&mAudioQ);
756 if (mVideoStreamIdx >= 0)
757 packet_queue_flush(&mVideoQ);
// A non-negative mSeekIdx is what readerEntry() tests to detect a pending seek.
759 mSeekIdx = media_type == AVMEDIA_TYPE_VIDEO ? mVideoStreamIdx : mAudioStreamIdx;
762 //mSeekFlags &= ~AVSEEK_FLAG_BYTE;
763 //if (mSeekByBytes) {
764 // mSeekFlags |= AVSEEK_FLAG_BYTE;
// Translate the stagefright seek mode into the min/max window passed to avformat_seek_file().
768 case MediaSource::ReadOptions::SEEK_PREVIOUS_SYNC:
769 mSeekMin = INT64_MIN;
772 case MediaSource::ReadOptions::SEEK_NEXT_SYNC:
774 mSeekMax = INT64_MAX;
776 case MediaSource::ReadOptions::SEEK_CLOSEST_SYNC:
777 mSeekMin = INT64_MIN;
778 mSeekMax = INT64_MAX;
780 case MediaSource::ReadOptions::SEEK_CLOSEST:
781 mSeekMin = INT64_MIN;
// Block until the reader thread signals mCondition (it does so after handling the seek).
788 mCondition.wait(mLock);
// Interrupt callback installed on mFormatCtx in initStreams(); `ctx` is the extractor
// instance. Returns the extractor's mAbortRequest value.
793 int FFmpegExtractor::decode_interrupt_cb(void *ctx)
795 FFmpegExtractor *extractor = static_cast<FFmpegExtractor *>(ctx);
796 return extractor->mAbortRequest;
// Copies the values left by the sniffer in `meta` into the extractor: the
// "extended-extractor-url" string goes to mFilename and the "extended-extractor-mime"
// string becomes the kKeyMIMEType of mMeta. Missing keys trip a CHECK.
799 void FFmpegExtractor::fetchStuffsFromSniffedMeta(const sp<AMessage> &meta)
805 CHECK(meta->findString("extended-extractor-url", &url));
806 CHECK(url.c_str() != NULL);
// The URL length is checked against PATH_MAX before the copy into mFilename.
807 CHECK(url.size() < PATH_MAX);
809 memcpy(mFilename, url.c_str(), url.size());
// memcpy() above does not copy the terminator, so it is written explicitly.
810 mFilename[url.size()] = '\0';
813 CHECK(meta->findString("extended-extractor-mime", &mime));
814 CHECK(mime.c_str() != NULL);
815 mMeta->setCString(kKeyMIMEType, mime.c_str());
// Resets the extractor's demuxing state to its defaults before the streams are opened:
// byte seeking off, unknown duration and seek position, an unbounded seek window,
// no selected video/audio stream and no deferred track creation.
818 void FFmpegExtractor::setFFmpegDefaultOpts()
// Debug-only sections selected by the DEBUG_DISABLE_* macros.
821 #if DEBUG_DISABLE_VIDEO
826 #if DEBUG_DISABLE_AUDIO
832 mSeekByBytes = 0; /* seek by bytes 0=off 1=on -1=auto" */
833 mDuration = AV_NOPTS_VALUE;
834 mSeekPos = AV_NOPTS_VALUE;
835 mSeekMin = INT64_MIN;
836 mSeekMax = INT64_MAX;
// -1 means "no stream selected".
839 mVideoStreamIdx = -1;
840 mAudioStreamIdx = -1;
843 mDefersToCreateVideoTrack = false;
844 mDefersToCreateAudioTrack = false;
// Opens the input named by mFilename with libavformat and prepares the audio and video
// streams: defaults are reset, initFFmpeg() is run, the format context is allocated and
// opened with decode_interrupt_cb installed, stream info is probed, every stream is set to
// AVDISCARD_ALL, the best video and audio streams are picked with av_find_best_stream(),
// both packet queues are initialized and the selected streams are opened through
// stream_component_open(). An error is logged when neither stream could be opened.
857 int FFmpegExtractor::initStreams()
861 status_t status = UNKNOWN_ERROR;
863 int ret = 0, audio_ret = -1, video_ret = -1;
864 int pkt_in_play_range = 0;
865 AVDictionaryEntry *t = NULL;
866 AVDictionary **opts = NULL;
867 int orig_nb_streams = 0;
// -1 in wanted_stream is passed to av_find_best_stream() as the wanted stream number;
// st_index holds the stream chosen per media type (-1 = none).
868 int st_index[AVMEDIA_TYPE_NB] = {0};
869 int wanted_stream[AVMEDIA_TYPE_NB] = {0};
870 st_index[AVMEDIA_TYPE_AUDIO] = -1;
871 st_index[AVMEDIA_TYPE_VIDEO] = -1;
872 wanted_stream[AVMEDIA_TYPE_AUDIO] = -1;
873 wanted_stream[AVMEDIA_TYPE_VIDEO] = -1;
874 const char *mime = NULL;
876 setFFmpegDefaultOpts();
878 status = initFFmpeg();
// Remembered so that deInitStreams() knows FFmpeg was initialized.
883 mFFmpegInited = true;
885 mFormatCtx = avformat_alloc_context();
888 ALOGE("oom for alloc avformat context");
// Lets blocking libavformat calls poll mAbortRequest through decode_interrupt_cb().
892 mFormatCtx->interrupt_callback.callback = decode_interrupt_cb;
893 mFormatCtx->interrupt_callback.opaque = this;
894 ALOGV("mFilename: %s", mFilename);
895 err = avformat_open_input(&mFormatCtx, mFilename, NULL, &format_opts);
897 ALOGE("%s: avformat_open_input failed, err:%s", mFilename, av_err2str(err));
// Any entry still left in format_opts was not consumed by avformat_open_input().
902 if ((t = av_dict_get(format_opts, "", NULL, AV_DICT_IGNORE_SUFFIX))) {
903 ALOGE("Option %s not found.\n", t->key);
904 //ret = AVERROR_OPTION_NOT_FOUND;
910 mFormatCtx->flags |= AVFMT_FLAG_GENPTS;
// One options dictionary per stream present before probing; orig_nb_streams is kept so
// that exactly those dictionaries are freed below.
912 opts = setup_find_stream_info_opts(mFormatCtx, codec_opts);
913 orig_nb_streams = mFormatCtx->nb_streams;
915 err = avformat_find_stream_info(mFormatCtx, opts);
917 ALOGE("%s: could not find stream info, err:%s", mFilename, av_err2str(err));
921 for (i = 0; i < orig_nb_streams; i++)
922 av_dict_free(&opts[i]);
// NOTE(review): mFormatCtx->pb is dereferenced here, while other code in this file treats
// pb as possibly NULL — confirm a NULL guard precedes this line.
926 mFormatCtx->pb->eof_reached = 0; // FIXME hack, ffplay maybe should not use url_feof() to test for the end
// Auto mode (-1): seek by bytes for formats with timestamp discontinuities, except "ogg".
928 if (mSeekByBytes < 0)
929 mSeekByBytes = !!(mFormatCtx->iformat->flags & AVFMT_TS_DISCONT)
930 && strcmp("ogg", mFormatCtx->iformat->name);
// Start with every stream discarded; stream_component_open() re-enables the chosen ones.
932 for (i = 0; i < (int)mFormatCtx->nb_streams; i++)
933 mFormatCtx->streams[i]->discard = AVDISCARD_ALL;
935 st_index[AVMEDIA_TYPE_VIDEO] =
936 av_find_best_stream(mFormatCtx, AVMEDIA_TYPE_VIDEO,
937 wanted_stream[AVMEDIA_TYPE_VIDEO], -1, NULL, 0);
// The chosen video stream is passed as the related stream for the audio selection.
939 st_index[AVMEDIA_TYPE_AUDIO] =
940 av_find_best_stream(mFormatCtx, AVMEDIA_TYPE_AUDIO,
941 wanted_stream[AVMEDIA_TYPE_AUDIO],
942 st_index[AVMEDIA_TYPE_VIDEO],
945 av_dump_format(mFormatCtx, 0, mFilename, 0);
// Record and log the container duration when both duration and start time are known.
948 if (mFormatCtx->duration != AV_NOPTS_VALUE &&
949 mFormatCtx->start_time != AV_NOPTS_VALUE) {
950 int hours, mins, secs, us;
952 ALOGV("file startTime: %lld", mFormatCtx->start_time);
954 mDuration = mFormatCtx->duration;
956 secs = mDuration / AV_TIME_BASE;
957 us = mDuration % AV_TIME_BASE;
962 ALOGI("the duration is %02d:%02d:%02d.%02d",
963 hours, mins, secs, (100 * us) / AV_TIME_BASE);
966 packet_queue_init(&mVideoQ);
967 packet_queue_init(&mAudioQ);
// Open whichever streams were found and start their packet queues.
969 if (st_index[AVMEDIA_TYPE_AUDIO] >= 0) {
970 audio_ret = stream_component_open(st_index[AVMEDIA_TYPE_AUDIO]);
972 packet_queue_start(&mAudioQ);
975 if (st_index[AVMEDIA_TYPE_VIDEO] >= 0) {
976 video_ret = stream_component_open(st_index[AVMEDIA_TYPE_VIDEO]);
978 packet_queue_start(&mVideoQ);
// Failure only when neither an audio nor a video stream could be opened.
981 if ( audio_ret < 0 && video_ret < 0) {
982 ALOGE("%s: could not open codecs\n", mFilename);
// Releases what initStreams() set up: both packet queues are destroyed and the format
// context is closed; further teardown is conditional on mFFmpegInited.
993 void FFmpegExtractor::deInitStreams()
995 packet_queue_destroy(&mVideoQ);
996 packet_queue_destroy(&mAudioQ);
999 avformat_close_input(&mFormatCtx);
1002 if (mFFmpegInited) {
// Spawns the joinable reader thread (entry point ReaderWrapper) unless it is already
// running, marks it as started and signals mCondition, which readerEntry() waits on.
1007 status_t FFmpegExtractor::startReaderThread() {
1008 ALOGV("Starting reader thread");
1010 if (mReaderThreadStarted)
// Joinable, because stopReaderThread() calls pthread_join() on mReaderThread.
1013 pthread_attr_t attr;
1014 pthread_attr_init(&attr);
1015 pthread_attr_setdetachstate(&attr, PTHREAD_CREATE_JOINABLE);
1017 ALOGD("Reader thread starting");
// NOTE(review): the return value of pthread_create() is not checked, so
// mReaderThreadStarted is set even if the thread could not be created.
1019 pthread_create(&mReaderThread, &attr, ReaderWrapper, this);
1020 pthread_attr_destroy(&attr);
1022 mReaderThreadStarted = true;
1023 mCondition.signal();
// Stops the reader thread if it is running: mCondition is signalled, the open audio and
// video streams are closed, the thread is joined and the format context is closed.
1028 void FFmpegExtractor::stopReaderThread() {
1029 ALOGV("Stopping reader thread");
1031 if (!mReaderThreadStarted) {
1032 ALOGD("Reader thread have been stopped");
// Wake the reader thread in case it is blocked on mCondition.
1037 mCondition.signal();
1039 /* close each stream */
1040 if (mAudioStreamIdx >= 0)
1041 stream_component_close(mAudioStreamIdx);
1042 if (mVideoStreamIdx >= 0)
1043 stream_component_close(mVideoStreamIdx);
// Wait for readerEntry() to return before the format context is torn down.
1045 pthread_join(mReaderThread, NULL);
1048 avformat_close_input(&mFormatCtx);
1051 mReaderThreadStarted = false;
1052 ALOGD("Reader thread stopped");
// pthread entry point: `me` is the FFmpegExtractor passed to pthread_create(); the call
// is forwarded to its readerEntry().
1056 void *FFmpegExtractor::ReaderWrapper(void *me) {
1057 ((FFmpegExtractor *)me)->readerEntry();
// Body of the reader thread. After setting the thread priority and name it waits until
// mReaderThreadStarted or mAbortRequest is set, then loops until mAbortRequest:
//  - forwards pause state changes to av_read_pause() / av_read_play(),
//  - services a pending seek (mSeekIdx >= 0) with avformat_seek_file() and pushes a flush
//    packet onto each active queue,
//  - backs off for 10 ms while the queues are considered full,
//  - reads the next packet with av_read_frame(), harvests extradata for deferred tracks,
//    and puts the packet on the audio or video queue (packets of other streams are freed).
1062 void FFmpegExtractor::readerEntry() {
1064 AVPacket pkt1, *pkt = &pkt1;
1066 int pkt_in_play_range = 0;
// Audio-only playback runs the reader at audio priority.
1070 pid_t tid = gettid();
1071 androidSetThreadPriority(tid,
1072 mVideoStreamIdx >= 0 ? ANDROID_PRIORITY_NORMAL : ANDROID_PRIORITY_AUDIO);
1073 prctl(PR_SET_NAME, (unsigned long)"FFmpegExtractor Thread", 0, 0, 0);
1075 ALOGV("FFmpegExtractor wait for signal");
// NOTE(review): mCondition.wait(mLock) expects mLock to be held — confirm it is acquired
// before this loop.
1076 while (!mReaderThreadStarted && !mAbortRequest) {
1077 mCondition.wait(mLock);
1079 ALOGV("FFmpegExtractor ready to run");
1081 if (mAbortRequest) {
1085 mVideoEOSReceived = false;
1086 mAudioEOSReceived = false;
1088 while (!mAbortRequest) {
// Propagate a pause/resume transition to the demuxer once per change.
1090 if (mPaused != mLastPaused) {
1091 mLastPaused = mPaused;
1093 mReadPauseReturn = av_read_pause(mFormatCtx);
1095 av_read_play(mFormatCtx);
1097 #if CONFIG_RTSP_DEMUXER || CONFIG_MMSH_PROTOCOL
1099 (!strcmp(mFormatCtx->iformat->name, "rtsp") ||
1100 (mFormatCtx->pb && !strncmp(mFilename, "mmsh:", 5)))) {
1101 /* wait 10 ms to avoid trying to get another packet */
// Pending seek posted by stream_seek().
1108 if (mSeekIdx >= 0) {
1109 Mutex::Autolock _l(mLock);
1110 ALOGV("readerEntry, mSeekIdx: %d mSeekPos: %lld (%lld/%lld)", mSeekIdx, mSeekPos, mSeekMin, mSeekMax);
1111 ret = avformat_seek_file(mFormatCtx, -1, mSeekMin, mSeekPos, mSeekMax, 0);
1113 ALOGE("%s: error while seeking", mFormatCtx->filename);
// Drop stale packets and enqueue a flush marker for each active stream.
1115 if (mAudioStreamIdx >= 0) {
1116 packet_queue_flush(&mAudioQ);
1117 packet_queue_put(&mAudioQ, &mAudioQ.flush_pkt);
1119 if (mVideoStreamIdx >= 0) {
1120 packet_queue_flush(&mVideoQ);
1121 packet_queue_put(&mVideoQ, &mVideoQ.flush_pkt);
// Releases the thread blocked in stream_seek().
1126 mCondition.signal();
1129 /* if the queue are full, no need to read more */
1130 if ( mAudioQ.size + mVideoQ.size > MAX_QUEUE_SIZE
1131 || ( (mAudioQ .size > MIN_AUDIOQ_SIZE || mAudioStreamIdx < 0)
1132 && (mVideoQ .nb_packets > MIN_FRAMES || mVideoStreamIdx < 0))) {
1133 #if DEBUG_READ_ENTRY
1134 ALOGV("readerEntry, full(wtf!!!), mVideoQ.size: %d, mVideoQ.nb_packets: %d, mAudioQ.size: %d, mAudioQ.nb_packets: %d",
1135 mVideoQ.size, mVideoQ.nb_packets, mAudioQ.size, mAudioQ.nb_packets);
// Sleep up to 10 ms (or until signalled) before re-checking the queues.
1138 mExtractorMutex.lock();
1139 mCondition.waitRelative(mExtractorMutex, milliseconds(10));
1140 mExtractorMutex.unlock();
// Null packets are queued for each active stream — presumably once end of file has been
// reached; confirm the guarding condition.
1145 if (mVideoStreamIdx >= 0) {
1146 packet_queue_put_nullpacket(&mVideoQ, mVideoStreamIdx);
1148 if (mAudioStreamIdx >= 0) {
1149 packet_queue_put_nullpacket(&mAudioQ, mAudioStreamIdx);
1152 mExtractorMutex.lock();
1153 mCondition.waitRelative(mExtractorMutex, milliseconds(10));
1155 mExtractorMutex.unlock();
1159 ret = av_read_frame(mFormatCtx, pkt);
// Read-failure handling: an I/O error on the AVIOContext is logged; the thread then waits
// up to 10 ms.
1165 if (mFormatCtx->pb && mFormatCtx->pb->error) {
1166 ALOGE("mFormatCtx->pb->error: %d", mFormatCtx->pb->error);
1170 mExtractorMutex.lock();
1171 mCondition.waitRelative(mExtractorMutex, milliseconds(10));
1172 mExtractorMutex.unlock();
1176 if (pkt->stream_index == mVideoStreamIdx) {
// Deferred video track: try to carve the codec headers out of this packet.
1177 if (mDefersToCreateVideoTrack) {
1178 AVCodecContext *avctx = mFormatCtx->streams[mVideoStreamIdx]->codec;
// `i` is the value reported by parser_split(); it is used as the extradata size below.
1180 int i = parser_split(avctx, pkt->data, pkt->size);
1181 if (i > 0 && i < FF_MAX_EXTRADATA_SIZE) {
1182 if (avctx->extradata)
1183 av_freep(&avctx->extradata);
1184 avctx->extradata_size= i;
1185 avctx->extradata = (uint8_t *)av_malloc(avctx->extradata_size + FF_INPUT_BUFFER_PADDING_SIZE);
1186 if (!avctx->extradata) {
1187 //return AVERROR(ENOMEM);
1188 ret = AVERROR(ENOMEM);
1191 // sps + pps(there may be sei in it)
// Copy the header bytes and zero the padding that follows them.
1192 memcpy(avctx->extradata, pkt->data, avctx->extradata_size);
1193 memset(avctx->extradata + i, 0, FF_INPUT_BUFFER_PADDING_SIZE);
1195 av_free_packet(pkt);
// Retry track creation now that extradata may be available.
1199 stream_component_open(mVideoStreamIdx);
1200 if (!mDefersToCreateVideoTrack)
1201 ALOGI("probe packet counter: %d when create video track ok", mProbePkts);
1202 if (mProbePkts == EXTRACTOR_MAX_PROBE_PACKETS)
1203 ALOGI("probe packet counter to max: %d, create video track: %d",
1204 mProbePkts, !mDefersToCreateVideoTrack);
1206 } else if (pkt->stream_index == mAudioStreamIdx) {
1210 AVCodecContext *avctx = mFormatCtx->streams[mAudioStreamIdx]->codec;
// Run the audio bitstream filter (opened by check_extradata()) over the packet.
1211 if (mAudioBsfc && pkt && pkt->data) {
1212 ret = av_bitstream_filter_filter(mAudioBsfc, avctx, NULL, &outbuf, &outbuf_size,
1213 pkt->data, pkt->size, pkt->flags & AV_PKT_FLAG_KEY);
1215 if (ret < 0 ||!outbuf_size) {
1216 av_free_packet(pkt);
// NOTE(review): the filtered output is copied into the packet's existing buffer with no
// visible check that outbuf_size <= pkt->size — confirm the filter never grows the payload.
1219 if (outbuf && outbuf != pkt->data) {
1220 memmove(pkt->data, outbuf, outbuf_size);
1221 pkt->size = outbuf_size;
// Deferred audio track: packets are dropped until the codec context has extradata.
1224 if (mDefersToCreateAudioTrack) {
1225 if (avctx->extradata_size <= 0) {
1226 av_free_packet(pkt);
1229 stream_component_open(mAudioStreamIdx);
1230 if (!mDefersToCreateAudioTrack)
1231 ALOGI("probe packet counter: %d when create audio track ok", mProbePkts);
1232 if (mProbePkts == EXTRACTOR_MAX_PROBE_PACKETS)
1233 ALOGI("probe packet counter to max: %d, create audio track: %d",
1234 mProbePkts, !mDefersToCreateAudioTrack);
// Dispatch the packet to its queue; packets of unselected streams are released.
1238 if (pkt->stream_index == mAudioStreamIdx) {
1239 packet_queue_put(&mAudioQ, pkt);
1240 } else if (pkt->stream_index == mVideoStreamIdx) {
1241 packet_queue_put(&mVideoQ, pkt);
1243 av_free_packet(pkt);
1250 ALOGV("FFmpegExtractor exit thread(readerEntry)");
1253 ////////////////////////////////////////////////////////////////////////////////
// Binds this source to track `index` of `extractor`: the AVStream and packet queue are
// taken from the extractor's TrackInfo. For H.264 streams whose extradata starts with the
// byte 1, the NAL length size is read from the track's kKeyAVCC data.
1255 FFmpegSource::FFmpegSource(
1256 const sp<FFmpegExtractor> &extractor, size_t index)
1257 : mExtractor(extractor),
1261 mStream(mExtractor->mTracks.itemAt(index).mStream),
1262 mQueue(mExtractor->mTracks.itemAt(index).mQueue),
1263 mLastPTS(AV_NOPTS_VALUE),
1264 mTargetTime(AV_NOPTS_VALUE) {
1265 sp<MetaData> meta = mExtractor->mTracks.itemAt(index).mMeta;
1268 AVCodecContext *avctx = mStream->codec;
1270 /* Parse codec specific data */
// The size check precedes the extradata[0] read.
1271 if (avctx->codec_id == AV_CODEC_ID_H264
1272 && avctx->extradata_size > 0
1273 && avctx->extradata[0] == 1) {
1279 CHECK(meta->findData(kKeyAVCC, &type, &data, &size));
1281 const uint8_t *ptr = (const uint8_t *)data;
// NOTE(review): ptr[4] is read below; confirm `size` is validated to cover at least 5 bytes.
1284 CHECK_EQ((unsigned)ptr[0], 1u); // configurationVersion == 1
1286 // The number of bytes used to encode the length of a NAL unit.
1287 mNALLengthSize = 1 + (ptr[4] & 3);
1289 ALOGV("the stream is AVC, the length of a NAL unit: %d", mNALLengthSize);
1295 mMediaType = mStream->codec->codec_type;
1296 mFirstKeyPktTimestamp = AV_NOPTS_VALUE;
// Destructor: logs the media type of the track being destroyed.
1299 FFmpegSource::~FFmpegSource() {
1300 ALOGV("FFmpegSource::~FFmpegSource %s",
1301 av_get_media_type_string(mMediaType));
// MediaSource::start() implementation; `params` is unused. Logs the media type of the track.
1305 status_t FFmpegSource::start(MetaData *params __unused) {
1306 ALOGV("FFmpegSource::start %s",
1307 av_get_media_type_string(mMediaType));
// MediaSource::stop() implementation. Logs the media type of the track.
1311 status_t FFmpegSource::stop() {
1312 ALOGV("FFmpegSource::stop %s",
1313 av_get_media_type_string(mMediaType));
// Returns the MetaData the extractor stored for this source's track (mTrackIndex).
1317 sp<MetaData> FFmpegSource::getFormat() {
// NOTE(review): the statement ends with a doubled semicolon; harmless, but could be cleaned up.
1318 return mExtractor->mTracks.itemAt(mTrackIndex).mMeta;;
// Reads the next packet of this track from mQueue and returns it to the
// caller as a newly allocated MediaBuffer through *buffer.
//
// buffer  - out parameter that receives the MediaBuffer built from the packet.
// options - optional read options; when it carries a seek request the seek is
//           forwarded to mExtractor->stream_seek() before a packet is read.
//
// Return values visible here: ERROR_END_OF_STREAM when packet_queue_get()
// fails or an EOS packet (NULL data, zero size) is dequeued, and
// ERROR_MALFORMED on the convertNal2AnnexB failure path.
1321 status_t FFmpegSource::read(
1322 MediaBuffer **buffer, const ReadOptions *options) {
1326 bool seeking = false;
1327 bool waitKeyPkt = false;
1328 ReadOptions::SeekMode mode;
1329 int64_t pktTS = AV_NOPTS_VALUE;
1330 int64_t seekTimeUs = AV_NOPTS_VALUE;
1331 int64_t timeUs = AV_NOPTS_VALUE;
1333 status_t status = OK;
// Stream start time rescaled from the stream time base to AV_TIME_BASE_Q;
// 0 when the stream does not declare a start time.
1335 int64_t startTimeUs = mStream->start_time == AV_NOPTS_VALUE ? 0 :
1336 av_rescale_q(mStream->start_time, mStream->time_base, AV_TIME_BASE_Q);
// Seek request: the caller's seek time is relative to the start of playback,
// so the stream start time is added before asking the extractor to seek.
1338 if (options && options->getSeekTo(&seekTimeUs, &mode)) {
1339 int64_t seekPTS = seekTimeUs;
1340 ALOGV("~~~%s seekTimeUs: %lld, seekPTS: %lld, mode: %d", av_get_media_type_string(mMediaType), seekTimeUs, seekPTS, mode);
1341 /* add the stream start time */
1342 if (mStream->start_time != AV_NOPTS_VALUE) {
1343 seekPTS += startTimeUs;
1345 ALOGV("~~~%s seekTimeUs[+startTime]: %lld, mode: %d start_time=%lld", av_get_media_type_string(mMediaType), seekPTS, mode, startTimeUs);
// 'seeking' is set only when stream_seek() reports SEEK.
1346 seeking = (mExtractor->stream_seek(seekPTS, mMediaType, mode) == SEEK);
// A negative result from packet_queue_get() is treated as an abort request
// and reported to the extractor as end of stream for this media type.
// NOTE(review): the third argument (1) presumably requests a blocking get —
// confirm against packet_queue_get().
1350 if (packet_queue_get(mQueue, &pkt, 1) < 0) {
1351 ALOGD("read %s abort reqeust", av_get_media_type_string(mMediaType));
1352 mExtractor->reachedEOS(mMediaType);
1353 return ERROR_END_OF_STREAM;
// Packets that are not the queue's flush marker are freed here.
// NOTE(review): presumably this discards packets queued before the flush
// marker while a seek is pending — confirm against the enclosing condition.
1357 if (pkt.data != mQueue->flush_pkt.data) {
1358 av_free_packet(&pkt);
1362 #if WAIT_KEY_PACKET_AFTER_SEEK
// The flush marker resets the remembered first key-packet timestamp.
1368 if (pkt.data == mQueue->flush_pkt.data) {
1369 ALOGV("read %s flush pkt", av_get_media_type_string(mMediaType));
1370 av_free_packet(&pkt);
1371 mFirstKeyPktTimestamp = AV_NOPTS_VALUE;
// A packet with no data and zero size marks end of stream.
1373 } else if (pkt.data == NULL && pkt.size == 0) {
1374 ALOGD("read %s eos pkt", av_get_media_type_string(mMediaType));
1375 av_free_packet(&pkt);
1376 mExtractor->reachedEOS(mMediaType);
1377 return ERROR_END_OF_STREAM;
1380 key = pkt.flags & AV_PKT_FLAG_KEY ? 1 : 0;
// Prefer the presentation timestamp; fall back to the decode timestamp.
1381 pktTS = pkt.pts == AV_NOPTS_VALUE ? pkt.dts : pkt.pts;
1385 ALOGV("drop the non-key packet");
1386 av_free_packet(&pkt);
1389 ALOGV("~~~~~~ got the key packet");
1394 if (pktTS != AV_NOPTS_VALUE && mFirstKeyPktTimestamp == AV_NOPTS_VALUE) {
1395 // update the first key timestamp
1396 mFirstKeyPktTimestamp = pktTS;
// The buffer is allocated with FF_INPUT_BUFFER_PADDING_SIZE extra bytes, but
// only the pkt.size payload bytes are exposed through set_range().
1399 MediaBuffer *mediaBuffer = new MediaBuffer(pkt.size + FF_INPUT_BUFFER_PADDING_SIZE);
1400 mediaBuffer->meta_data()->clear();
1401 mediaBuffer->set_range(0, pkt.size);
// AVC with NAL-to-Annex-B conversion enabled: the payload is converted while
// being copied; every other case is a plain memcpy of the packet data.
1404 if (mIsAVC && mNal2AnnexB) {
1405 /* This only works for NAL sizes 3-4 */
1406 CHECK(mNALLengthSize == 3 || mNALLengthSize == 4);
1408 uint8_t *dst = (uint8_t *)mediaBuffer->data();
1409 /* Convert H.264 NAL format to annex b */
1410 status = convertNal2AnnexB(dst, pkt.size, pkt.data, pkt.size, mNALLengthSize);
// Failure path: both the MediaBuffer and the packet are released before
// returning ERROR_MALFORMED.
1412 ALOGE("convertNal2AnnexB failed");
1413 mediaBuffer->release();
1415 av_free_packet(&pkt);
1416 return ERROR_MALFORMED;
1419 memcpy(mediaBuffer->data(), pkt.data, pkt.size);
// Buffer timestamp: packet timestamp rescaled to AV_TIME_BASE_Q and made
// relative to the stream start time.
1422 if (pktTS != AV_NOPTS_VALUE)
1423 timeUs = av_rescale_q(pktTS, mStream->time_base, AV_TIME_BASE_Q) - startTimeUs;
1425 timeUs = SF_NOPTS_VALUE; //FIXME AV_NOPTS_VALUE is negative, but stagefright need positive
1427 // predict the next PTS to use for exact-frame seek below
1428 int64_t nextPTS = AV_NOPTS_VALUE;
// Prediction: current timestamp plus the distance to the previous timestamp.
1429 if (mLastPTS != AV_NOPTS_VALUE && timeUs > mLastPTS) {
1430 nextPTS = timeUs + (timeUs - mLastPTS);
1432 } else if (mLastPTS == AV_NOPTS_VALUE) {
1437 if (pktTS != AV_NOPTS_VALUE)
1438 ALOGV("read %s pkt, size:%d, key:%d, pktPTS: %lld, pts:%lld, dts:%lld, timeUs[-startTime]:%lld us (%.2f secs) start_time=%lld",
1439 av_get_media_type_string(mMediaType), pkt.size, key, pktTS, pkt.pts, pkt.dts, timeUs, timeUs/1E6, startTimeUs);
1441 ALOGV("read %s pkt, size:%d, key:%d, pts:N/A, dts:N/A, timeUs[-startTime]:N/A",
1442 av_get_media_type_string(mMediaType), pkt.size, key);
1445 mediaBuffer->meta_data()->setInt64(kKeyTime, timeUs);
1446 mediaBuffer->meta_data()->setInt32(kKeyIsSyncFrame, key);
1448 // deal with seek-to-exact-frame, we might be off a bit and Stagefright will assert on us
// For SEEK_CLOSEST, a buffer that precedes the requested time is tagged with
// kKeyTargetTime and the target is remembered in mTargetTime.
1449 if (seekTimeUs != AV_NOPTS_VALUE && timeUs < seekTimeUs &&
1450 mode == MediaSource::ReadOptions::SEEK_CLOSEST) {
1451 mTargetTime = seekTimeUs;
1452 mediaBuffer->meta_data()->setInt64(kKeyTargetTime, seekTimeUs);
// While a target is pending: an exact hit clears it; if the predicted next
// timestamp would pass the target, this buffer is stamped with the target time.
1455 if (mTargetTime != AV_NOPTS_VALUE) {
1456 if (timeUs == mTargetTime) {
1457 mTargetTime = AV_NOPTS_VALUE;
1458 } else if (nextPTS != AV_NOPTS_VALUE && nextPTS > mTargetTime) {
// NOTE(review): the log prints timeUs although kKeyTime is set to mTargetTime.
1459 ALOGV("adjust target frame time to %lld", timeUs);
1460 mediaBuffer->meta_data()->setInt64(kKeyTime, mTargetTime);
1461 mTargetTime = AV_NOPTS_VALUE;
// Hand the buffer to the caller; the packet itself is no longer needed
// because its payload was copied into the MediaBuffer above.
1465 *buffer = mediaBuffer;
1467 av_free_packet(&pkt);
1472 ////////////////////////////////////////////////////////////////////////////////
// MIME type string reported for the matching format name.
1476 const char *container;
// Table mapping FFmpeg input-format names (matched against ic->iformat->name
// by findMatchingContainer()) to the MIME type reported for that container.
// NOTE(review): findMatchingContainer() compares only the first
// strlen(format) characters of the name, so the "mpeg" row also matches the
// name "mpegts"; row order therefore matters for that pair.
1479 static formatmap FILE_FORMATS[] = {
1480 {"mpeg", MEDIA_MIMETYPE_CONTAINER_MPEG2PS },
1481 {"mpegts", MEDIA_MIMETYPE_CONTAINER_TS },
1482 {"mov,mp4,m4a,3gp,3g2,mj2", MEDIA_MIMETYPE_CONTAINER_MPEG4 },
1483 {"matroska,webm", MEDIA_MIMETYPE_CONTAINER_MATROSKA },
1484 {"asf", MEDIA_MIMETYPE_CONTAINER_ASF },
1485 {"rm", MEDIA_MIMETYPE_CONTAINER_RM },
1486 {"flv", MEDIA_MIMETYPE_CONTAINER_FLV },
// "swf" is deliberately reported with the FLV container MIME type.
1487 {"swf", MEDIA_MIMETYPE_CONTAINER_FLV },
1488 {"avi", MEDIA_MIMETYPE_CONTAINER_AVI },
1489 {"ape", MEDIA_MIMETYPE_CONTAINER_APE },
1490 {"dts", MEDIA_MIMETYPE_CONTAINER_DTS },
1491 {"flac", MEDIA_MIMETYPE_CONTAINER_FLAC },
// "ac3" and "mp3" map directly to audio MIME types rather than container ones.
1492 {"ac3", MEDIA_MIMETYPE_AUDIO_AC3 },
1493 {"mp3", MEDIA_MIMETYPE_AUDIO_MPEG },
1494 {"wav", MEDIA_MIMETYPE_CONTAINER_WAV },
1495 {"ogg", MEDIA_MIMETYPE_CONTAINER_OGG },
1496 {"vc1", MEDIA_MIMETYPE_CONTAINER_VC1 },
1497 {"hevc", MEDIA_MIMETYPE_CONTAINER_HEVC },
1498 {"divx", MEDIA_MIMETYPE_CONTAINER_DIVX },
1501 static AVCodecContext* getCodecContext(AVFormatContext *ic, AVMediaType codec_type)
1503 unsigned int idx = 0;
1504 AVCodecContext *avctx = NULL;
1506 for (idx = 0; idx < ic->nb_streams; idx++) {
1507 if (ic->streams[idx]->disposition & AV_DISPOSITION_ATTACHED_PIC) {
1508 // FFMPEG converts album art to MJPEG, but we don't want to
1509 // include that in the parsing as MJPEG is not supported by
1510 // Android, which forces the media to be extracted by FFMPEG
1511 // while in fact, Android supports it.
1515 avctx = ic->streams[idx]->codec;
1516 if (avctx->codec_type == codec_type) {
1524 static enum AVCodecID getCodecId(AVFormatContext *ic, AVMediaType codec_type)
1526 AVCodecContext *avctx = getCodecContext(ic, codec_type);
1527 return avctx == NULL ? AV_CODEC_ID_NONE : avctx->codec_id;
1530 static bool hasAudioCodecOnly(AVFormatContext *ic)
1532 enum AVCodecID codec_id = AV_CODEC_ID_NONE;
1533 bool haveVideo = false;
1534 bool haveAudio = false;
1536 if (getCodecId(ic, AVMEDIA_TYPE_VIDEO) != AV_CODEC_ID_NONE) {
1539 if (getCodecId(ic, AVMEDIA_TYPE_AUDIO) != AV_CODEC_ID_NONE) {
1543 if (!haveVideo && haveAudio) {
1550 //FIXME all codecs: frameworks/av/media/libstagefright/codecs/*
1551 static bool isCodecSupportedByStagefright(enum AVCodecID codec_id)
1553 bool supported = false;
1557 case AV_CODEC_ID_HEVC:
1558 case AV_CODEC_ID_H264:
1559 case AV_CODEC_ID_MPEG4:
1560 case AV_CODEC_ID_H263:
1561 case AV_CODEC_ID_H263P:
1562 case AV_CODEC_ID_H263I:
1563 case AV_CODEC_ID_VP6:
1564 case AV_CODEC_ID_VP8:
1565 case AV_CODEC_ID_VP9:
1567 case AV_CODEC_ID_AAC:
1568 case AV_CODEC_ID_MP3:
1569 case AV_CODEC_ID_AMR_NB:
1570 case AV_CODEC_ID_AMR_WB:
1571 case AV_CODEC_ID_FLAC:
1572 case AV_CODEC_ID_VORBIS:
1573 case AV_CODEC_ID_PCM_MULAW: //g711
1574 case AV_CODEC_ID_PCM_ALAW: //g711
1575 case AV_CODEC_ID_GSM_MS:
1576 case AV_CODEC_ID_PCM_U8:
1577 case AV_CODEC_ID_PCM_S16LE:
1578 case AV_CODEC_ID_PCM_S24LE:
1586 ALOGD("%ssuppoted codec(%s) by official Stagefright",
1587 (supported ? "" : "un"),
1588 avcodec_get_name(codec_id));
1593 static void adjustMPEG4Confidence(AVFormatContext *ic, float *confidence)
1595 AVDictionary *tags = NULL;
1596 AVDictionaryEntry *tag = NULL;
1597 enum AVCodecID codec_id = AV_CODEC_ID_NONE;
1600 codec_id = getCodecId(ic, AVMEDIA_TYPE_VIDEO);
1601 if (codec_id != AV_CODEC_ID_NONE
1602 && codec_id != AV_CODEC_ID_HEVC
1603 && codec_id != AV_CODEC_ID_H264
1604 && codec_id != AV_CODEC_ID_MPEG4
1605 && codec_id != AV_CODEC_ID_H263
1606 && codec_id != AV_CODEC_ID_H263P
1607 && codec_id != AV_CODEC_ID_H263I) {
1608 //the MEDIA_MIMETYPE_CONTAINER_MPEG4 of confidence is 0.4f
1609 ALOGI("[mp4]video codec(%s), confidence should be larger than MPEG4Extractor",
1610 avcodec_get_name(codec_id));
1611 *confidence = 0.41f;
1614 codec_id = getCodecId(ic, AVMEDIA_TYPE_AUDIO);
1615 if (codec_id != AV_CODEC_ID_NONE
1616 && codec_id != AV_CODEC_ID_MP3
1617 && codec_id != AV_CODEC_ID_AAC
1618 && codec_id != AV_CODEC_ID_AMR_NB
1619 && codec_id != AV_CODEC_ID_AMR_WB) {
1620 ALOGI("[mp4]audio codec(%s), confidence should be larger than MPEG4Extractor",
1621 avcodec_get_name(codec_id));
1622 *confidence = 0.41f;
1626 tags = ic->metadata;
1627 //NOTE: You can use command to show these tags,
1628 //e.g. "ffprobe -show_format 2012.mov"
1629 tag = av_dict_get(tags, "major_brand", NULL, 0);
1634 ALOGV("major_brand tag is:%s", tag->value);
1636 //when MEDIA_MIMETYPE_CONTAINER_MPEG4
1637 //WTF, MPEG4Extractor.cpp can not extractor mov format
1638 //NOTE: isCompatibleBrand(MPEG4Extractor.cpp)
1639 // Won't promise that the following file types can be played.
1640 // Just give these file types a chance.
1641 // FOURCC('q', 't', ' ', ' '), // Apple's QuickTime
1643 if (!strcmp(tag->value, "qt ")) {
1644 ALOGI("[mp4]format is mov, confidence should be larger than mpeg4");
1645 *confidence = 0.41f;
1649 static void adjustMPEG2TSConfidence(AVFormatContext *ic, float *confidence)
1651 enum AVCodecID codec_id = AV_CODEC_ID_NONE;
1653 codec_id = getCodecId(ic, AVMEDIA_TYPE_VIDEO);
1654 if (codec_id != AV_CODEC_ID_NONE
1655 && codec_id != AV_CODEC_ID_H264
1656 && codec_id != AV_CODEC_ID_MPEG4
1657 && codec_id != AV_CODEC_ID_MPEG1VIDEO
1658 && codec_id != AV_CODEC_ID_MPEG2VIDEO) {
1659 //the MEDIA_MIMETYPE_CONTAINER_MPEG2TS of confidence is 0.1f
1660 ALOGI("[mpeg2ts]video codec(%s), confidence should be larger than MPEG2TSExtractor",
1661 avcodec_get_name(codec_id));
1662 *confidence = 0.11f;
1665 codec_id = getCodecId(ic, AVMEDIA_TYPE_AUDIO);
1666 if (codec_id != AV_CODEC_ID_NONE
1667 && codec_id != AV_CODEC_ID_AAC
1668 && codec_id != AV_CODEC_ID_PCM_S16LE
1669 && codec_id != AV_CODEC_ID_PCM_S24LE
1670 && codec_id != AV_CODEC_ID_MP1
1671 && codec_id != AV_CODEC_ID_MP2
1672 && codec_id != AV_CODEC_ID_MP3) {
1673 ALOGI("[mpeg2ts]audio codec(%s), confidence should be larger than MPEG2TSExtractor",
1674 avcodec_get_name(codec_id));
1675 *confidence = 0.11f;
1679 static void adjustMKVConfidence(AVFormatContext *ic, float *confidence)
1681 enum AVCodecID codec_id = AV_CODEC_ID_NONE;
1683 codec_id = getCodecId(ic, AVMEDIA_TYPE_VIDEO);
1684 if (codec_id != AV_CODEC_ID_NONE
1685 && codec_id != AV_CODEC_ID_H264
1686 && codec_id != AV_CODEC_ID_MPEG4
1687 && codec_id != AV_CODEC_ID_VP6
1688 && codec_id != AV_CODEC_ID_VP8
1689 && codec_id != AV_CODEC_ID_VP9) {
1690 //the MEDIA_MIMETYPE_CONTAINER_MATROSKA of confidence is 0.6f
1691 ALOGI("[mkv]video codec(%s), confidence should be larger than MatroskaExtractor",
1692 avcodec_get_name(codec_id));
1693 *confidence = 0.61f;
1696 codec_id = getCodecId(ic, AVMEDIA_TYPE_AUDIO);
1697 if (codec_id != AV_CODEC_ID_NONE
1698 && codec_id != AV_CODEC_ID_AAC
1699 && codec_id != AV_CODEC_ID_MP3
1700 && codec_id != AV_CODEC_ID_VORBIS) {
1701 ALOGI("[mkv]audio codec(%s), confidence should be larger than MatroskaExtractor",
1702 avcodec_get_name(codec_id));
1703 *confidence = 0.61f;
1707 static void adjustCodecConfidence(AVFormatContext *ic, float *confidence)
1709 enum AVCodecID codec_id = AV_CODEC_ID_NONE;
1711 codec_id = getCodecId(ic, AVMEDIA_TYPE_VIDEO);
1712 if (codec_id != AV_CODEC_ID_NONE) {
1713 if (!isCodecSupportedByStagefright(codec_id)) {
1714 *confidence = 0.88f;
1718 codec_id = getCodecId(ic, AVMEDIA_TYPE_AUDIO);
1719 if (codec_id != AV_CODEC_ID_NONE) {
1720 if (!isCodecSupportedByStagefright(codec_id)) {
1721 *confidence = 0.88f;
1725 if (getCodecId(ic, AVMEDIA_TYPE_VIDEO) != AV_CODEC_ID_NONE
1726 && getCodecId(ic, AVMEDIA_TYPE_AUDIO) == AV_CODEC_ID_MP3) {
1727 *confidence = 0.22f; //larger than MP3Extractor
1731 //TODO need more checks
// Adjusts *confidence for media sniffed as container `mime`.
//
// mime       - container MIME type, compared case-insensitively.
// ic         - opened format context handed to the per-container adjusters.
// confidence - in/out sniff confidence.
//
// The container-specific adjuster for MPEG4, MPEG2-TS or Matroska runs when
// `mime` names that container; the codec-based adjustment is delegated to
// adjustCodecConfidence().
1732 static void adjustConfidenceIfNeeded(const char *mime,
1733 AVFormatContext *ic, float *confidence)
1736 if (!strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_MPEG4)) {
1737 adjustMPEG4Confidence(ic, confidence);
// NOTE(review): FILE_FORMATS maps "mpegts" to MEDIA_MIMETYPE_CONTAINER_TS,
// while this branch tests MEDIA_MIMETYPE_CONTAINER_MPEG2TS — confirm both
// names resolve to the same MIME string.
1738 } else if (!strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_MPEG2TS)) {
1739 adjustMPEG2TSConfidence(ic, confidence);
1740 } else if (!strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_MATROSKA)) {
1741 adjustMKVConfidence(ic, confidence);
// 0.08f is the default "last resort" confidence assigned in SniffFFMPEG; the
// container adjusters above only ever set larger values (0.11f/0.41f/0.61f),
// so this test detects that one of them already fired.
1746 if (*confidence > 0.08) {
1751 adjustCodecConfidence(ic, confidence);
// Refines the sniffed container MIME type from the stream contents.
//
// mime - in/out MIME type; read as the starting value of the candidate.
// ic   - opened format context to inspect.
//
// A video stream for which getDivXVersion() returns >= 0 selects the DivX MIME
// type; otherwise, media with audio but no video select an audio MIME type
// from the audio codec id. A change of MIME type is logged.
1754 static void adjustContainerIfNeeded(const char **mime, AVFormatContext *ic)
1756 const char *newMime = *mime;
1757 enum AVCodecID codec_id = AV_CODEC_ID_NONE;
1759 AVCodecContext *avctx = getCodecContext(ic, AVMEDIA_TYPE_VIDEO);
// NOTE(review): CreateFFmpegExtractor() accepts MEDIA_MIMETYPE_CONTAINER_DIVX;
// confirm MEDIA_MIMETYPE_VIDEO_DIVX resolves to a MIME string it accepts.
1760 if (avctx != NULL && getDivXVersion(avctx) >= 0) {
1761 newMime = MEDIA_MIMETYPE_VIDEO_DIVX;
1763 } else if (hasAudioCodecOnly(ic)) {
1764 codec_id = getCodecId(ic, AVMEDIA_TYPE_AUDIO);
// hasAudioCodecOnly() returned true, so an audio codec id must exist.
1765 CHECK(codec_id != AV_CODEC_ID_NONE);
1767 case AV_CODEC_ID_MP3:
1768 newMime = MEDIA_MIMETYPE_AUDIO_MPEG;
1770 case AV_CODEC_ID_AAC:
1771 newMime = MEDIA_MIMETYPE_AUDIO_AAC;
1773 case AV_CODEC_ID_VORBIS:
1774 newMime = MEDIA_MIMETYPE_AUDIO_VORBIS;
1776 case AV_CODEC_ID_FLAC:
1777 newMime = MEDIA_MIMETYPE_AUDIO_FLAC;
1779 case AV_CODEC_ID_AC3:
1780 newMime = MEDIA_MIMETYPE_AUDIO_AC3;
1782 case AV_CODEC_ID_APE:
1783 newMime = MEDIA_MIMETYPE_AUDIO_APE;
1785 case AV_CODEC_ID_DTS:
1786 newMime = MEDIA_MIMETYPE_AUDIO_DTS;
1788 case AV_CODEC_ID_MP2:
1789 newMime = MEDIA_MIMETYPE_AUDIO_MPEG_LAYER_II;
1791 case AV_CODEC_ID_COOK:
1792 newMime = MEDIA_MIMETYPE_AUDIO_RA;
// All four WMA variants share one MIME type.
1794 case AV_CODEC_ID_WMAV1:
1795 case AV_CODEC_ID_WMAV2:
1796 case AV_CODEC_ID_WMAPRO:
1797 case AV_CODEC_ID_WMALOSSLESS:
1798 newMime = MEDIA_MIMETYPE_AUDIO_WMA;
// An unknown ("FFMPEG") container holding only audio is reported with the
// generic FFmpeg audio MIME type.
1804 if (!strcmp(*mime, MEDIA_MIMETYPE_CONTAINER_FFMPEG)) {
1805 newMime = MEDIA_MIMETYPE_AUDIO_FFMPEG;
// strcmp() is non-zero when the candidate differs from the incoming MIME type.
// NOTE(review): confirm *mime is assigned newMime in this branch.
1809 if (strcmp(*mime, newMime)) {
1810 ALOGI("adjust mime(%s -> %s)", *mime, newMime);
1815 static const char *findMatchingContainer(const char *name)
1818 #if SUPPOURT_UNKNOWN_FORMAT
1819 //The FFmpegExtractor support all ffmpeg formats!!!
1820 //Unknown format is defined as MEDIA_MIMETYPE_CONTAINER_FFMPEG
1821 const char *container = MEDIA_MIMETYPE_CONTAINER_FFMPEG;
1823 const char *container = NULL;
1826 ALOGV("list the formats suppoted by ffmpeg: ");
1827 ALOGV("========================================");
1828 for (i = 0; i < NELEM(FILE_FORMATS); ++i) {
1829 ALOGV("format_names[%02d]: %s", i, FILE_FORMATS[i].format);
1831 ALOGV("========================================");
1833 for (i = 0; i < NELEM(FILE_FORMATS); ++i) {
1834 int len = strlen(FILE_FORMATS[i].format);
1835 if (!strncasecmp(name, FILE_FORMATS[i].format, len)) {
1836 container = FILE_FORMATS[i].container;
// Opens `url` with FFmpeg, probes it, and returns the container MIME type that
// FILE_FORMATS associates with the detected input format.
//
// url        - FFmpeg URL to open with avformat_open_input().
// confidence - in/out sniff confidence, updated by adjustConfidenceIfNeeded().
// fastMPEG4  - not referenced on the lines shown here.
//              NOTE(review): presumably gates the MPEG4 shortcut below — confirm.
//
// Failures of initFFmpeg(), context allocation, avformat_open_input() and
// avformat_find_stream_info() are each logged with ALOGE.
1844 static const char *SniffFFMPEGCommon(const char *url, float *confidence, bool fastMPEG4)
1848 size_t nb_streams = 0;
1849 const char *container = NULL;
1850 AVFormatContext *ic = NULL;
1851 AVDictionary **opts = NULL;
1853 status_t status = initFFmpeg();
1855 ALOGE("could not init ffmpeg");
1859 ic = avformat_alloc_context();
1862 ALOGE("oom for alloc avformat context");
1866 err = avformat_open_input(&ic, url, NULL, NULL);
1869 ALOGE("%s: avformat_open_input failed, err:%s", url, av_err2str(err));
// MPEG4 shortcut: when the format name already maps to the MPEG4 container,
// the container is taken from the name alone. findMatchingContainer() is
// evaluated up to three times for the same name in this statement and its body.
1873 if (ic->iformat != NULL && ic->iformat->name != NULL &&
1874 findMatchingContainer(ic->iformat->name) != NULL &&
1875 !strcasecmp(findMatchingContainer(ic->iformat->name),
1876 MEDIA_MIMETYPE_CONTAINER_MPEG4)) {
1878 container = findMatchingContainer(ic->iformat->name);
// The stream count is captured BEFORE avformat_find_stream_info(), so the
// loop below frees exactly the option dictionaries that were set up here.
1883 opts = setup_find_stream_info_opts(ic, codec_opts);
1884 nb_streams = ic->nb_streams;
1885 err = avformat_find_stream_info(ic, opts);
1887 ALOGE("%s: could not find stream info, err:%s", url, av_err2str(err));
1890 for (i = 0; i < nb_streams; i++) {
1891 av_dict_free(&opts[i]);
1895 av_dump_format(ic, 0, url, 0);
1897 ALOGD("FFmpegExtrator, url: %s, format_name: %s, format_long_name: %s",
1898 url, ic->iformat->name, ic->iformat->long_name);
// Full path: map the format name, then refine the container and the
// confidence from the stream contents.
1900 container = findMatchingContainer(ic->iformat->name);
1902 adjustContainerIfNeeded(&container, ic);
1903 adjustConfidenceIfNeeded(container, ic, confidence);
1908 avformat_close_input(&ic);
1917 static const char *BetterSniffFFMPEG(const sp<DataSource> &source,
1918 float *confidence, sp<AMessage> meta)
1920 const char *ret = NULL;
1921 char url[PATH_MAX] = {0};
1923 ALOGI("android-source:%p", source.get());
1925 // pass the addr of smart pointer("source")
1926 snprintf(url, sizeof(url), "android-source:%p", source.get());
1928 ret = SniffFFMPEGCommon(url, confidence, (source->flags() & DataSource::kIsCachingDataSource));
1930 meta->setString("extended-extractor-url", url);
1936 static const char *LegacySniffFFMPEG(const sp<DataSource> &source,
1937 float *confidence, sp<AMessage> meta)
1939 const char *ret = NULL;
1940 char url[PATH_MAX] = {0};
1942 String8 uri = source->getUri();
1943 if (!uri.string()) {
1947 ALOGV("source url:%s", uri.string());
1949 // pass the addr of smart pointer("source") + file name
1950 snprintf(url, sizeof(url), "android-source:%p|file:%s", source.get(), uri.string());
1952 ret = SniffFFMPEGCommon(url, confidence, false);
1954 meta->setString("extended-extractor-url", url);
1961 const sp<DataSource> &source, String8 *mimeType, float *confidence,
1962 sp<AMessage> *meta) {
// Sniffer entry point registered by getExtractorPlugin().
//
// source     - data source to probe.
// mimeType   - out: set to the detected container MIME type.
// confidence - out: sniff confidence, starting at the 0.08f default.
// meta       - out: new AMessage carrying the "extended-extractor*" keys.
1963 ALOGV("SniffFFMPEG");
1965 *meta = new AMessage;
1966 *confidence = 0.08f; // be the last resort, by default
// BetterSniffFFMPEG() is tried first; LegacySniffFFMPEG() is the fallback.
1968 const char *container = BetterSniffFFMPEG(source, confidence, *meta);
1970 ALOGW("sniff through BetterSniffFFMPEG failed, try LegacySniffFFMPEG");
1971 container = LegacySniffFFMPEG(source, confidence, *meta);
1973 ALOGV("sniff through LegacySniffFFMPEG success");
1976 ALOGV("sniff through BetterSniffFFMPEG success");
1979 if (container == NULL) {
1980 ALOGD("SniffFFMPEG failed to sniff this source");
1986 ALOGD("ffmpeg detected media content as '%s' with confidence %.2f",
1987 container, *confidence);
1989 /* use MPEG4Extractor(not extended extractor) for HTTP source only */
1990 if (!strcasecmp(container, MEDIA_MIMETYPE_CONTAINER_MPEG4)
1991 && (source->flags() & DataSource::kIsCachingDataSource)) {
1992 ALOGI("support container: %s, but it is caching data source, "
1993 "Don't use ffmpegextractor", container);
1999 mimeType->setTo(container);
// CreateFFmpegExtractor() requires the "extended-extractor" key to be present
// in the metadata it receives.
2001 (*meta)->setString("extended-extractor", "extended-extractor");
2002 (*meta)->setString("extended-extractor-subtype", "ffmpegextractor");
2003 (*meta)->setString("extended-extractor-mime", container);
// Debug override driven by the "sys.media.parser.ffmpeg" system property
// (default "0"); the override raises the confidence to 0.88f.
2006 char value[PROPERTY_VALUE_MAX];
2007 property_get("sys.media.parser.ffmpeg", value, "0");
2009 ALOGD("[debug] use ffmpeg parser");
2010 *confidence = 0.88f;
// Any confidence above the 0.08f default marks this extractor as the one to use.
2013 if (*confidence > 0.08f) {
2014 (*meta)->setString("extended-extractor-use", "ffmpegextractor");
2020 MediaExtractor *CreateFFmpegExtractor(const sp<DataSource> &source, const char *mime, const sp<AMessage> &meta) {
2021 MediaExtractor *ret = NULL;
2023 if (meta.get() && meta->findString("extended-extractor", ¬use) && (
2024 !strcasecmp(mime, MEDIA_MIMETYPE_AUDIO_MPEG) ||
2025 !strcasecmp(mime, MEDIA_MIMETYPE_AUDIO_AAC) ||
2026 !strcasecmp(mime, MEDIA_MIMETYPE_AUDIO_VORBIS) ||
2027 !strcasecmp(mime, MEDIA_MIMETYPE_AUDIO_FLAC) ||
2028 !strcasecmp(mime, MEDIA_MIMETYPE_AUDIO_AC3) ||
2029 !strcasecmp(mime, MEDIA_MIMETYPE_AUDIO_APE) ||
2030 !strcasecmp(mime, MEDIA_MIMETYPE_AUDIO_DTS) ||
2031 !strcasecmp(mime, MEDIA_MIMETYPE_AUDIO_MPEG_LAYER_II) ||
2032 !strcasecmp(mime, MEDIA_MIMETYPE_AUDIO_RA) ||
2033 !strcasecmp(mime, MEDIA_MIMETYPE_AUDIO_WMA) ||
2034 !strcasecmp(mime, MEDIA_MIMETYPE_AUDIO_FFMPEG) ||
2035 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_MPEG4) ||
2036 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_MOV) ||
2037 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_MATROSKA) ||
2038 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_TS) ||
2039 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_MPEG2PS) ||
2040 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_AVI) ||
2041 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_ASF) ||
2042 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_WEBM) ||
2043 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_WMV) ||
2044 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_MPG) ||
2045 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_FLV) ||
2046 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_DIVX) ||
2047 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_RM) ||
2048 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_WAV) ||
2049 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_FLAC) ||
2050 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_APE) ||
2051 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_DTS) ||
2052 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_MP2) ||
2053 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_RA) ||
2054 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_OGG) ||
2055 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_VC1) ||
2056 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_HEVC) ||
2057 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_WMA) ||
2058 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_FFMPEG))) {
2059 ret = new FFmpegExtractor(source, meta);
2062 ALOGD("%ssupported mime: %s", (ret ? "" : "un"), mime);
2066 } // namespace android
// Plugin entry point with C linkage: fills the extractor plugin table with
// this module's sniffer (SniffFFMPEG) and factory (CreateFFmpegExtractor).
2068 extern "C" void getExtractorPlugin(android::MediaExtractor::Plugin *plugin)
2070 plugin->sniff = android::SniffFFMPEG;
2071 plugin->create = android::CreateFFmpegExtractor;