2 * Copyright 2012 Michael Chen <omxcodec@gmail.com>
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
8 * http://www.apache.org/licenses/LICENSE-2.0
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
18 #define LOG_TAG "FFmpegExtractor"
19 #include <utils/Log.h>
22 #include <limits.h> /* INT_MAX */
25 #include <utils/misc.h>
26 #include <utils/String8.h>
27 #include <cutils/properties.h>
28 #include <media/stagefright/foundation/ABitReader.h>
29 #include <media/stagefright/foundation/ABuffer.h>
30 #include <media/stagefright/foundation/ADebug.h>
31 #include <media/stagefright/foundation/AMessage.h>
32 #include <media/stagefright/foundation/hexdump.h>
33 #include <media/stagefright/DataSource.h>
34 #include <media/stagefright/MediaBuffer.h>
35 #include <media/stagefright/foundation/ADebug.h>
36 #include <media/stagefright/MediaDefs.h>
37 #include <media/stagefright/MediaErrors.h>
38 #include <media/stagefright/MediaSource.h>
39 #include <media/stagefright/MetaData.h>
40 #include <media/stagefright/Utils.h>
41 #include "include/avc_utils.h"
43 #include "utils/codec_utils.h"
44 #include "utils/ffmpeg_cmdutils.h"
46 #include "FFmpegExtractor.h"
// Tuning limits and debug switches for the extractor.
// Upper bound in bytes (15 MiB) on the combined audio + video packet-queue size;
// readerEntry() stops reading more packets while the queues exceed it.
48 #define MAX_QUEUE_SIZE (15 * 1024 * 1024)
// Audio queue byte size (320 KiB) above which readerEntry() treats the audio queue as filled.
49 #define MIN_AUDIOQ_SIZE (20 * 16 * 1024)
// Probe-packet budget: the constructor keeps waiting for deferred tracks only while
// mProbePkts has not exceeded this value.
51 #define EXTRACTOR_MAX_PROBE_PACKETS 200
// Largest extradata size accepted when extradata is split out of a video packet.
52 #define FF_MAX_EXTRADATA_SIZE ((1 << 28) - FF_INPUT_BUFFER_PADDING_SIZE)
// Set to 1 to enable the extra queue-state logging in readerEntry().
55 #define DEBUG_READ_ENTRY 0
// Tested in setFFmpegDefaultOpts(); the guarded code is not visible in this view.
56 #define DEBUG_DISABLE_VIDEO 0
57 #define DEBUG_DISABLE_AUDIO 0
// Tested in Track::read(); the guarded code is only partly visible in this view.
58 #define WAIT_KEY_PACKET_AFTER_SEEK 1
// NOTE(review): no use of this switch is visible in this view.
60 #define DEBUG_FORMATS 0
// MediaSource implementation for one demuxed stream of the extractor.
// NOTE(review): only part of this declaration is visible in this view (access
// specifiers, the destructor declaration and several members are not shown).
69 struct FFmpegExtractor::Track : public MediaSource {
// Takes the owning extractor, the track's format metadata, the FFmpeg stream
// and the packet queue the track reads from.
70 Track(FFmpegExtractor *extractor, sp<MetaData> meta,
71 AVStream *stream, PacketQueue *queue);
// MediaSource interface.
73 virtual status_t start(MetaData *params);
74 virtual status_t stop();
75 virtual sp<MetaData> getFormat();
77 virtual status_t read(
78 MediaBuffer **buffer, const ReadOptions *options);
84 friend struct FFmpegExtractor;
// Owning extractor; read() calls back into it for seeking and EOS reporting.
86 FFmpegExtractor *mExtractor;
// Media type of the stream, copied from the stream's codec context in the constructor.
89 enum AVMediaType mMediaType;
// Byte width of the NAL length prefix for AVC streams (1 + low two bits of avcC byte 4).
94 size_t mNALLengthSize;
// Timestamp of the first key packet seen; reset to AV_NOPTS_VALUE in the
// constructor and whenever read() consumes a flush packet.
100 int64_t mFirstKeyPktTimestamp;
102 DISALLOW_EVIL_CONSTRUCTORS(Track);
105 ////////////////////////////////////////////////////////////////////////////////
// Constructs the extractor from a data source and the sniffed metadata message:
// copies the sniffed information, initialises the FFmpeg streams, and then loops
// while track creation is still deferred.
// NOTE(review): parts of the initializer list and of the body (error handling,
// starting the reader, the loop body) are not visible in this view.
107 FFmpegExtractor::FFmpegExtractor(const sp<DataSource> &source, const sp<AMessage> &meta)
108 : mDataSource(source),
111 mFFmpegInited(false),
113 mReaderThreadStarted(false) {
114 ALOGV("FFmpegExtractor::FFmpegExtractor");
116 fetchStuffsFromSniffedMeta(meta);
118 int err = initStreams();
120 ALOGE("failed to init ffmpeg");
124 // start reader here, as we want to extract extradata from bitstream if no extradata
// Keep looping while all of these hold: the probe-packet budget is not exceeded,
// EOF has not been flagged, the I/O context (if any) reports no error, and a
// video or audio track is still deferred.
127 while(mProbePkts <= EXTRACTOR_MAX_PROBE_PACKETS && !mEOF &&
128 (mFormatCtx->pb ? !mFormatCtx->pb->error : 1) &&
129 (mDefersToCreateVideoTrack || mDefersToCreateAudioTrack)) {
130 // FIXME: should use pthread_cond_wait to wait for these conditions instead of looping
134 ALOGV("mProbePkts: %d, mEOF: %d, pb->error(if has): %d, mDefersToCreateVideoTrack: %d, mDefersToCreateAudioTrack: %d",
135 mProbePkts, mEOF, mFormatCtx->pb ? mFormatCtx->pb->error : 0, mDefersToCreateVideoTrack, mDefersToCreateAudioTrack);
// Destructor. Per the comment below it is responsible for stopping the reader;
// NOTE(review): the teardown statements themselves are not visible in this view.
140 FFmpegExtractor::~FFmpegExtractor() {
141 ALOGV("FFmpegExtractor::~FFmpegExtractor");
143 // stop reader here if no track!
// Returns the number of tracks created so far, or 0 when initialisation
// did not succeed (mInitCheck != OK).
149 size_t FFmpegExtractor::countTracks() {
150 return mInitCheck == OK ? mTracks.size() : 0;
// Returns the track stored at position `index` in mTracks.
// Two guards run first (initialisation failed, index out of range); what they
// return is not visible in this view.
153 sp<MediaSource> FFmpegExtractor::getTrack(size_t index) {
154 ALOGV("FFmpegExtractor::getTrack[%d]", index);
156 if (mInitCheck != OK) {
160 if (index >= mTracks.size()) {
// `index` is a position in the keyed vector, not the FFmpeg stream index used as key.
164 return mTracks.valueAt(index);
// Returns the format metadata of the track at position `index` in mTracks.
// Two guards run first (initialisation failed, index out of range); what they
// return is not visible in this view. `flags` is not referenced in the visible lines.
167 sp<MetaData> FFmpegExtractor::getTrackMetaData(size_t index, uint32_t flags) {
168 ALOGV("FFmpegExtractor::getTrackMetaData[%d]", index);
170 if (mInitCheck != OK) {
174 if (index >= mTracks.size()) {
178 return mTracks.valueAt(index)->getFormat();
// Returns the container-level metadata.
// NOTE(review): only the mInitCheck guard is visible in this view; the returned
// values for both paths are not shown.
181 sp<MetaData> FFmpegExtractor::getMetaData() {
182 ALOGV("FFmpegExtractor::getMetaData");
184 if (mInitCheck != OK) {
// Reports the extractor capabilities: always CAN_PAUSE, plus the three seek
// flags when the container reports a duration.
// NOTE(review): the value returned when mInitCheck != OK and the final return
// are not visible in this view.
191 uint32_t FFmpegExtractor::flags() const {
192 ALOGV("FFmpegExtractor::flags");
194 if (mInitCheck != OK) {
198 uint32_t flags = CAN_PAUSE;
// Seeking is only advertised when the duration is known.
200 if (mFormatCtx->duration != AV_NOPTS_VALUE) {
201 flags |= CAN_SEEK_BACKWARD | CAN_SEEK_FORWARD | CAN_SEEK;
// Decides whether the track for `avctx` can be created right away or must be
// deferred until extradata has been obtained from the bitstream.
// Sets the matching mDefersToCreate{Video,Audio}Track flag through
// `defersToCreateTrack` and may open a bitstream filter through `bsfc`.
// NOTE(review): the return statements and the assignments to `bsfc` are not
// visible in this view, so the meaning of the int result cannot be stated here
// (callers store it in `ret`).
207 int FFmpegExtractor::check_extradata(AVCodecContext *avctx)
209 enum AVCodecID codec_id = AV_CODEC_ID_NONE;
210 const char *name = NULL;
211 bool *defersToCreateTrack = NULL;
212 AVBitStreamFilterContext **bsfc = NULL;
// Select the per-media-type state to update.
// NOTE(review): for any other media type both pointers appear to stay NULL in the
// visible lines; confirm callers only pass audio/video contexts.
215 if (avctx->codec_type == AVMEDIA_TYPE_VIDEO) {
217 defersToCreateTrack = &mDefersToCreateVideoTrack;
218 } else if (avctx->codec_type == AVMEDIA_TYPE_AUDIO){
220 defersToCreateTrack = &mDefersToCreateAudioTrack;
223 codec_id = avctx->codec_id;
// Only these five codecs are examined further; the branch body for every other
// codec is not visible in this view.
226 if (codec_id != AV_CODEC_ID_H264
227 && codec_id != AV_CODEC_ID_MPEG4
228 && codec_id != AV_CODEC_ID_MPEG1VIDEO
229 && codec_id != AV_CODEC_ID_MPEG2VIDEO
230 && codec_id != AV_CODEC_ID_AAC) {
234 // is extradata compatible with android?
235 if (codec_id != AV_CODEC_ID_AAC) {
236 int is_compatible = is_extradata_compatible_with_android(avctx);
237 if (!is_compatible) {
238 ALOGI("%s extradata is not compatible with android, should to extract it from bitstream",
239 av_get_media_type_string(avctx->codec_type));
240 *defersToCreateTrack = true;
241 *bsfc = NULL; // H264 don't need bsfc, only AAC?
// AAC is the only codec here that gets a bitstream filter name.
247 if (codec_id == AV_CODEC_ID_AAC) {
248 name = "aac_adtstoasc";
// No extradata at all: defer track creation and, when a filter name was chosen
// and no filter is open yet, open it.
251 if (avctx->extradata_size <= 0) {
252 ALOGI("No %s extradata found, should to extract it from bitstream",
253 av_get_media_type_string(avctx->codec_type));
254 *defersToCreateTrack = true;
255 //CHECK(name != NULL);
256 if (!*bsfc && name) {
257 *bsfc = av_bitstream_filter_init(name);
// On the failure path logged here the deferral is cancelled again.
259 ALOGE("Cannot open the %s BSF!", name);
260 *defersToCreateTrack = false;
263 ALOGV("open the %s bsf", name);
// Logs `time` (expressed in AV_TIME_BASE units) as hours:minutes:seconds.hundredths.
// NOTE(review): the handling of AV_NOPTS_VALUE and the computation of `hours`
// and `mins` are not visible in this view.
273 void FFmpegExtractor::printTime(int64_t time)
275 int hours, mins, secs, us;
277 if (time == AV_NOPTS_VALUE)
// Split into whole seconds and the sub-second remainder.
280 secs = time / AV_TIME_BASE;
281 us = time % AV_TIME_BASE;
// The last field is the remainder scaled to hundredths of a second.
286 ALOGI("the time is %02d:%02d:%02d.%02d",
287 hours, mins, secs, (100 * us) / AV_TIME_BASE);
// Reports whether `codec_id` can be handled by this extractor.
// The case labels below enumerate the explicitly known codecs. The log line and
// comments after them say that other codecs are still "given a chance".
// NOTE(review): the switch header, the assignments to `supported` and the return
// are not visible in this view.
290 bool FFmpegExtractor::is_codec_supported(enum AVCodecID codec_id)
292 bool supported = false;
295 case AV_CODEC_ID_H264:
296 case AV_CODEC_ID_MPEG4:
297 case AV_CODEC_ID_H263:
298 case AV_CODEC_ID_H263P:
299 case AV_CODEC_ID_H263I:
300 case AV_CODEC_ID_AAC:
301 case AV_CODEC_ID_AC3:
302 case AV_CODEC_ID_MP2:
303 case AV_CODEC_ID_MP3:
304 case AV_CODEC_ID_MPEG1VIDEO:
305 case AV_CODEC_ID_MPEG2VIDEO:
306 case AV_CODEC_ID_WMV1:
307 case AV_CODEC_ID_WMV2:
308 case AV_CODEC_ID_WMV3:
309 case AV_CODEC_ID_VC1:
310 case AV_CODEC_ID_WMAV1:
311 case AV_CODEC_ID_WMAV2:
312 case AV_CODEC_ID_WMAPRO:
313 case AV_CODEC_ID_WMALOSSLESS:
314 case AV_CODEC_ID_RV20:
315 case AV_CODEC_ID_RV30:
316 case AV_CODEC_ID_RV40:
317 case AV_CODEC_ID_COOK:
318 case AV_CODEC_ID_APE:
319 case AV_CODEC_ID_DTS:
320 case AV_CODEC_ID_FLAC:
321 case AV_CODEC_ID_FLV1:
322 case AV_CODEC_ID_VORBIS:
323 case AV_CODEC_ID_HEVC:
// presumably the default branch: codecs not listed above — confirm against the full file.
328 ALOGD("unsuppoted codec(%s), but give it a chance",
329 avcodec_get_name(codec_id));
330 // No promise that the following codec id can be supported.
331 // Just give these codecs a chance.
// Builds the MetaData describing a video stream.
// Dispatches on the codec id to a codec-specific helper, falls back to a generic
// FFmpeg video MIME type for unknown codecs, then adds width, height, bit rate
// (when positive) and duration.
// `stream` must be a video stream (enforced with CHECK_EQ).
// NOTE(review): break statements, the default label, the creation of `meta` in
// the fallback path and the return are not visible in this view.
339 sp<MetaData> FFmpegExtractor::setVideoFormat(AVStream *stream)
341 AVCodecContext *avctx = NULL;
342 sp<MetaData> meta = NULL;
344 avctx = stream->codec;
345 CHECK_EQ(avctx->codec_type, AVMEDIA_TYPE_VIDEO);
347 switch(avctx->codec_id) {
348 case AV_CODEC_ID_H264:
// First extradata byte == 1 selects the AVC helper, anything else the H264 helper.
// NOTE(review): extradata is dereferenced without a null/size check in the
// visible lines — confirm it is guaranteed to be present here.
349 if (avctx->extradata[0] == 1) {
350 meta = setAVCFormat(avctx);
352 meta = setH264Format(avctx);
355 case AV_CODEC_ID_MPEG4:
356 meta = setMPEG4Format(avctx);
358 case AV_CODEC_ID_H263:
359 case AV_CODEC_ID_H263P:
360 case AV_CODEC_ID_H263I:
361 meta = setH263Format(avctx);
363 case AV_CODEC_ID_MPEG1VIDEO:
364 case AV_CODEC_ID_MPEG2VIDEO:
365 meta = setMPEG2VIDEOFormat(avctx);
367 case AV_CODEC_ID_VC1:
368 meta = setVC1Format(avctx);
370 case AV_CODEC_ID_WMV1:
371 meta = setWMV1Format(avctx);
373 case AV_CODEC_ID_WMV2:
374 meta = setWMV2Format(avctx);
376 case AV_CODEC_ID_WMV3:
377 meta = setWMV3Format(avctx);
379 case AV_CODEC_ID_RV20:
380 meta = setRV20Format(avctx);
382 case AV_CODEC_ID_RV30:
383 meta = setRV30Format(avctx);
385 case AV_CODEC_ID_RV40:
386 meta = setRV40Format(avctx);
388 case AV_CODEC_ID_FLV1:
389 meta = setFLV1Format(avctx);
391 case AV_CODEC_ID_HEVC:
392 meta = setHEVCFormat(avctx);
394 case AV_CODEC_ID_VP8:
395 meta = setVP8Format(avctx);
397 case AV_CODEC_ID_VP9:
398 meta = setVP9Format(avctx);
// Fallback for codecs without a dedicated helper: tag the track with the raw
// codec id, the generic FFmpeg video MIME type and any extradata as-is.
401 ALOGD("unsuppoted video codec(id:%d, name:%s), but give it a chance",
402 avctx->codec_id, avcodec_get_name(avctx->codec_id));
404 meta->setInt32(kKeyCodecId, avctx->codec_id);
405 meta->setCString(kKeyMIMEType, MEDIA_MIMETYPE_VIDEO_FFMPEG);
406 if (avctx->extradata_size > 0) {
407 meta->setData(kKeyRawCodecSpecificData, 0, avctx->extradata, avctx->extradata_size);
409 //CHECK(!"Should not be here. Unsupported codec.");
// Properties common to every video codec.
414 ALOGI("width: %d, height: %d, bit_rate: %d",
415 avctx->width, avctx->height, avctx->bit_rate);
417 meta->setInt32(kKeyWidth, avctx->width);
418 meta->setInt32(kKeyHeight, avctx->height);
// The bit rate is only recorded when the codec context reports a positive value.
419 if (avctx->bit_rate > 0) {
420 meta->setInt32(kKeyBitRate, avctx->bit_rate);
422 setDurationMetaData(stream, meta);
// Builds the MetaData describing an audio stream.
// Dispatches on the codec id to a codec-specific helper, falls back to a generic
// FFmpeg audio MIME type for unknown codecs, then adds channel count, bit rate,
// bits per sample, sample rate, block alignment, sample format and duration.
// `stream` must be an audio stream (enforced with CHECK_EQ).
// NOTE(review): break statements, the default label, the creation of `meta` in
// the fallback path and the return are not visible in this view.
428 sp<MetaData> FFmpegExtractor::setAudioFormat(AVStream *stream)
430 AVCodecContext *avctx = NULL;
431 sp<MetaData> meta = NULL;
433 avctx = stream->codec;
434 CHECK_EQ(avctx->codec_type, AVMEDIA_TYPE_AUDIO);
436 switch(avctx->codec_id) {
437 case AV_CODEC_ID_MP2:
438 meta = setMP2Format(avctx);
440 case AV_CODEC_ID_MP3:
441 meta = setMP3Format(avctx);
443 case AV_CODEC_ID_VORBIS:
444 meta = setVORBISFormat(avctx);
446 case AV_CODEC_ID_AC3:
447 meta = setAC3Format(avctx);
449 case AV_CODEC_ID_AAC:
450 meta = setAACFormat(avctx);
452 case AV_CODEC_ID_WMAV1:
453 meta = setWMAV1Format(avctx);
455 case AV_CODEC_ID_WMAV2:
456 meta = setWMAV2Format(avctx);
458 case AV_CODEC_ID_WMAPRO:
459 meta = setWMAProFormat(avctx);
461 case AV_CODEC_ID_WMALOSSLESS:
462 meta = setWMALossLessFormat(avctx);
// COOK is mapped to the RA helper.
464 case AV_CODEC_ID_COOK:
465 meta = setRAFormat(avctx);
467 case AV_CODEC_ID_APE:
468 meta = setAPEFormat(avctx);
470 case AV_CODEC_ID_DTS:
471 meta = setDTSFormat(avctx);
473 case AV_CODEC_ID_FLAC:
474 meta = setFLACFormat(avctx);
// Fallback for codecs without a dedicated helper: tag the track with the raw
// codec id, the generic FFmpeg audio MIME type and any extradata as-is.
477 ALOGD("unsuppoted audio codec(id:%d, name:%s), but give it a chance",
478 avctx->codec_id, avcodec_get_name(avctx->codec_id));
480 meta->setInt32(kKeyCodecId, avctx->codec_id);
481 meta->setCString(kKeyMIMEType, MEDIA_MIMETYPE_AUDIO_FFMPEG);
482 if (avctx->extradata_size > 0) {
483 meta->setData(kKeyRawCodecSpecificData, 0, avctx->extradata, avctx->extradata_size);
485 //CHECK(!"Should not be here. Unsupported codec.");
// Properties common to every audio codec.
490 ALOGI("bit_rate: %d, sample_rate: %d, channels: %d, "
491 "bits_per_coded_sample: %d, block_align:%d",
492 avctx->bit_rate, avctx->sample_rate, avctx->channels,
493 avctx->bits_per_coded_sample, avctx->block_align);
495 meta->setInt32(kKeyChannelCount, avctx->channels);
// Unlike the video path, the bit rate is stored without a "> 0" check.
496 meta->setInt32(kKeyBitRate, avctx->bit_rate);
497 meta->setInt32(kKeyBitspersample, avctx->bits_per_coded_sample);
498 meta->setInt32(kKeySampleRate, avctx->sample_rate);
499 meta->setInt32(kKeyBlockAlign, avctx->block_align);
500 meta->setInt32(kKeySampleFormat, avctx->sample_fmt);
501 setDurationMetaData(stream, meta);
// Stores kKeyDuration in `meta`.
// When the stream carries its own duration, it is converted from stream
// time-base ticks to microseconds; otherwise the container duration
// (mFormatCtx->duration) is stored unchanged.
507 void FFmpegExtractor::setDurationMetaData(AVStream *stream, sp<MetaData> &meta)
509 AVCodecContext *avctx = stream->codec;
511 if (stream->duration != AV_NOPTS_VALUE) {
// ticks * seconds-per-tick * 1e6; computed in floating point, then truncated to int64_t.
512 int64_t duration = stream->duration * av_q2d(stream->time_base) * 1000000;
// The start time is only logged here; it does not affect the stored duration.
514 const char *s = av_get_media_type_string(avctx->codec_type);
515 if (stream->start_time != AV_NOPTS_VALUE) {
516 ALOGV("%s startTime:%lld", s, stream->start_time);
518 ALOGV("%s startTime:N/A", s);
520 meta->setInt64(kKeyDuration, duration);
522 // default when no stream duration
// NOTE(review): assumes mFormatCtx->duration is already in microseconds
// (AV_TIME_BASE units) — confirm.
523 meta->setInt64(kKeyDuration, mFormatCtx->duration);
// Opens one stream of the container: validates the index and codec, enables the
// stream, checks its extradata and, for audio and video streams, builds the
// format metadata and registers a new Track in mTracks keyed by `stream_index`.
// NOTE(review): return statements, several local declarations, condition lines
// and break statements are not visible in this view. Callers treat a negative
// result as failure.
527 int FFmpegExtractor::stream_component_open(int stream_index)
529 AVCodecContext *avctx = NULL;
530 sp<MetaData> meta = NULL;
531 bool supported = false;
533 const void *data = NULL;
537 ALOGI("stream_index: %d", stream_index);
// Reject indices outside the container's stream table.
538 if (stream_index < 0 || stream_index >= (int)mFormatCtx->nb_streams)
540 avctx = mFormatCtx->streams[stream_index]->codec;
542 supported = is_codec_supported(avctx->codec_id);
545 ALOGE("unsupport the codec(%s)", avcodec_get_name(avctx->codec_id));
548 ALOGI("support the codec(%s)", avcodec_get_name(avctx->codec_id));
// A stream may only be opened once; mTracks is keyed by stream index.
551 ssize_t index = mTracks.indexOfKey(stream_index);
554 ALOGE("this track already exists");
// Re-enable the stream.
558 mFormatCtx->streams[stream_index]->discard = AVDISCARD_DEFAULT;
561 av_get_codec_tag_string(tagbuf, sizeof(tagbuf), avctx->codec_tag);
562 ALOGV("Tag %s/0x%08x with codec(%s)\n", tagbuf, avctx->codec_tag, avcodec_get_name(avctx->codec_id));
564 switch (avctx->codec_type) {
565 case AVMEDIA_TYPE_VIDEO:
// Remember the first video stream opened; later calls keep the existing selection.
566 if (mVideoStreamIdx == -1)
567 mVideoStreamIdx = stream_index;
568 if (mVideoStream == NULL)
569 mVideoStream = mFormatCtx->streams[stream_index];
571 ret = check_extradata(avctx);
// Failure/deferral path (its guarding condition is not visible in this view).
574 // disable the stream
575 mVideoStreamIdx = -1;
577 packet_queue_end(&mVideoQ);
578 mFormatCtx->streams[stream_index]->discard = AVDISCARD_ALL;
583 if (avctx->extradata) {
584 ALOGV("video stream extradata:");
585 hexdump(avctx->extradata, avctx->extradata_size);
587 ALOGV("video stream no extradata, but we can ignore it.");
590 meta = setVideoFormat(mVideoStream);
592 ALOGE("setVideoFormat failed");
596 ALOGV("create a video track");
598 stream_index, new Track(this, meta, mVideoStream, &mVideoQ));
// The track now exists, so creation is no longer deferred.
600 mDefersToCreateVideoTrack = false;
603 case AVMEDIA_TYPE_AUDIO:
// Same sequence as the video case, using the audio members.
604 if (mAudioStreamIdx == -1)
605 mAudioStreamIdx = stream_index;
606 if (mAudioStream == NULL)
607 mAudioStream = mFormatCtx->streams[stream_index];
609 ret = check_extradata(avctx);
612 // disable the stream
613 mAudioStreamIdx = -1;
615 packet_queue_end(&mAudioQ);
616 mFormatCtx->streams[stream_index]->discard = AVDISCARD_ALL;
621 if (avctx->extradata) {
622 ALOGV("audio stream extradata(%d):", avctx->extradata_size);
623 hexdump(avctx->extradata, avctx->extradata_size);
625 ALOGV("audio stream no extradata, but we can ignore it.");
628 meta = setAudioFormat(mAudioStream);
630 ALOGE("setAudioFormat failed");
634 ALOGV("create a audio track");
636 stream_index, new Track(this, meta, mAudioStream, &mAudioQ));
638 mDefersToCreateAudioTrack = false;
// Subtitle and any other media type are treated as a programming error (CHECK aborts).
641 case AVMEDIA_TYPE_SUBTITLE:
643 CHECK(!"Should not be here. Unsupported media type.");
646 CHECK(!"Should not be here. Unsupported media type.");
// Shuts down one stream: aborts its packet queue, waits until the consumer has
// signalled end-of-stream (or an abort was requested), ends the queue, marks the
// stream as discarded and releases the per-type state (stream index, bitstream filter).
// NOTE(review): the bodies of the wait loops, the break statements and some
// clean-up lines are not visible in this view.
652 void FFmpegExtractor::stream_component_close(int stream_index)
654 AVCodecContext *avctx;
// Ignore indices outside the container's stream table.
656 if (stream_index < 0 || stream_index >= (int)mFormatCtx->nb_streams)
658 avctx = mFormatCtx->streams[stream_index]->codec;
// Phase 1: stop and drain the queue for this media type.
660 switch (avctx->codec_type) {
661 case AVMEDIA_TYPE_VIDEO:
662 ALOGV("packet_queue_abort videoq");
663 packet_queue_abort(&mVideoQ);
664 /* wait until the end */
// mVideoEOSReceived is set by reachedEOS(), which Track::read() calls.
665 while (!mAbortRequest && !mVideoEOSReceived) {
666 ALOGV("wait for video received");
669 ALOGV("packet_queue_end videoq");
670 packet_queue_end(&mVideoQ);
672 case AVMEDIA_TYPE_AUDIO:
673 ALOGV("packet_queue_abort audioq");
674 packet_queue_abort(&mAudioQ);
675 while (!mAbortRequest && !mAudioEOSReceived) {
676 ALOGV("wait for audio received");
679 ALOGV("packet_queue_end audioq");
680 packet_queue_end(&mAudioQ);
682 case AVMEDIA_TYPE_SUBTITLE:
// Phase 2: tell the demuxer to drop this stream's packets and reset bookkeeping.
688 mFormatCtx->streams[stream_index]->discard = AVDISCARD_ALL;
689 switch (avctx->codec_type) {
690 case AVMEDIA_TYPE_VIDEO:
692 mVideoStreamIdx = -1;
694 av_bitstream_filter_close(mVideoBsfc);
698 case AVMEDIA_TYPE_AUDIO:
700 mAudioStreamIdx = -1;
702 av_bitstream_filter_close(mAudioBsfc);
706 case AVMEDIA_TYPE_SUBTITLE:
// Records, under mLock, that the consumer of the given media type has reached
// end-of-stream. stream_component_close() waits on these flags.
// Media types other than video and audio are ignored in the visible lines.
713 void FFmpegExtractor::reachedEOS(enum AVMediaType media_type)
715 Mutex::Autolock autoLock(mLock);
717 if (media_type == AVMEDIA_TYPE_VIDEO) {
718 mVideoEOSReceived = true;
719 } else if (media_type == AVMEDIA_TYPE_AUDIO) {
720 mAudioEOSReceived = true;
724 /* seek in the stream */
// Handles a seek issued by the track of `media_type` to position `pos`.
// Runs under mLock, flushes the active packet queues and clears the byte-seek flag.
// NOTE(review): the body of the first branch, the statements that record the
// request and the return values are not visible in this view. Track::read()
// compares the result against SEEK.
725 int FFmpegExtractor::stream_seek(int64_t pos, enum AVMediaType media_type)
727 Mutex::Autolock autoLock(mLock);
// Special case: both streams are active, the request comes from the audio track
// and video has not yet reached end-of-stream.
729 if (mVideoStreamIdx >= 0
730 && mAudioStreamIdx >= 0
731 && media_type == AVMEDIA_TYPE_AUDIO
732 && !mVideoEOSReceived) {
// Drop everything queued before the seek.
737 if (mAudioStreamIdx >= 0)
738 packet_queue_flush(&mAudioQ);
739 if (mVideoStreamIdx >= 0)
740 packet_queue_flush(&mVideoQ);
// Seek by timestamp, not by byte offset.
743 mSeekFlags &= ~AVSEEK_FLAG_BYTE;
// Interrupt callback installed on the format context in initStreams().
// `ctx` is the extractor itself (set as the callback's opaque pointer); the
// callback returns the extractor's mAbortRequest flag.
750 int FFmpegExtractor::decode_interrupt_cb(void *ctx)
752 FFmpegExtractor *extrator = static_cast<FFmpegExtractor *>(ctx);
753 return extrator->mAbortRequest;
// Copies what the sniffer stored in `meta` into the extractor: the URL goes into
// mFilename and the MIME type into mMeta.
// Both keys are mandatory; a missing key aborts via CHECK.
// NOTE(review): the declarations of `url` and `mime` and the creation of mMeta
// are not visible in this view.
756 void FFmpegExtractor::fetchStuffsFromSniffedMeta(const sp<AMessage> &meta)
762 CHECK(meta->findString("extended-extractor-url", &url));
763 CHECK(url.c_str() != NULL);
// Strictly smaller than PATH_MAX, so the terminating NUL written below still
// fits when mFilename is PATH_MAX bytes — TODO confirm the buffer size.
764 CHECK(url.size() < PATH_MAX);
766 memcpy(mFilename, url.c_str(), url.size());
767 mFilename[url.size()] = '\0';
770 CHECK(meta->findString("extended-extractor-mime", &mime));
771 CHECK(mime.c_str() != NULL);
772 mMeta->setCString(kKeyMIMEType, mime.c_str());
// Resets the extractor's demuxing state to its defaults before streams are opened.
// NOTE(review): many assignments, including those guarded by the two DEBUG
// switches, are not visible in this view.
775 void FFmpegExtractor::setFFmpegDefaultOpts()
778 #if DEBUG_DISABLE_VIDEO
783 #if DEBUG_DISABLE_AUDIO
789 mSeekByBytes = 0; /* seek by bytes 0=off 1=on -1=auto" */
// Unknown until initStreams() reads it from the container.
790 mDuration = AV_NOPTS_VALUE;
791 mSeekPos = AV_NOPTS_VALUE;
// -1 means "no stream selected".
795 mVideoStreamIdx = -1;
796 mAudioStreamIdx = -1;
// Track creation is only deferred once check_extradata() decides it must be.
799 mDefersToCreateVideoTrack = false;
800 mDefersToCreateAudioTrack = false;
// Opens the input named by mFilename with FFmpeg and prepares the streams:
//   1. reset defaults and initialise FFmpeg,
//   2. allocate the format context and install the interrupt callback,
//   3. open the input and probe stream information,
//   4. mark every stream as discarded, then pick the best video and audio stream,
//   5. initialise both packet queues and open the selected streams.
// Opening counts as failed only when both the audio and the video stream failed.
// NOTE(review): error checks, return statements and some declarations
// (`err`, `i`, `format_opts`, `codec_opts`) are not visible in this view.
813 int FFmpegExtractor::initStreams()
817 status_t status = UNKNOWN_ERROR;
819 int ret = 0, audio_ret = -1, video_ret = -1;
820 int pkt_in_play_range = 0;
821 AVDictionaryEntry *t = NULL;
822 AVDictionary **opts = NULL;
823 int orig_nb_streams = 0;
// -1 means "no stream chosen" / "no preference" respectively.
824 int st_index[AVMEDIA_TYPE_NB] = {0};
825 int wanted_stream[AVMEDIA_TYPE_NB] = {0};
826 st_index[AVMEDIA_TYPE_AUDIO] = -1;
827 st_index[AVMEDIA_TYPE_VIDEO] = -1;
828 wanted_stream[AVMEDIA_TYPE_AUDIO] = -1;
829 wanted_stream[AVMEDIA_TYPE_VIDEO] = -1;
830 const char *mime = NULL;
832 setFFmpegDefaultOpts();
834 status = initFFmpeg();
839 mFFmpegInited = true;
841 mFormatCtx = avformat_alloc_context();
844 ALOGE("oom for alloc avformat context");
// Lets blocking FFmpeg I/O be interrupted once mAbortRequest is set.
848 mFormatCtx->interrupt_callback.callback = decode_interrupt_cb;
849 mFormatCtx->interrupt_callback.opaque = this;
850 ALOGV("mFilename: %s", mFilename);
851 err = avformat_open_input(&mFormatCtx, mFilename, NULL, &format_opts);
853 ALOGE("%s: avformat_open_input failed, err:%s", mFilename, av_err2str(err));
// Any entry still left in format_opts was not consumed by the demuxer.
858 if ((t = av_dict_get(format_opts, "", NULL, AV_DICT_IGNORE_SUFFIX))) {
859 ALOGE("Option %s not found.\n", t->key);
860 //ret = AVERROR_OPTION_NOT_FOUND;
// Ask the demuxer to generate missing presentation timestamps.
866 mFormatCtx->flags |= AVFMT_FLAG_GENPTS;
868 opts = setup_find_stream_info_opts(mFormatCtx, codec_opts);
// Remember the stream count before probing so that exactly the per-stream
// option dictionaries created above are freed below.
869 orig_nb_streams = mFormatCtx->nb_streams;
871 err = avformat_find_stream_info(mFormatCtx, opts);
873 ALOGE("%s: could not find stream info, err:%s", mFilename, av_err2str(err));
877 for (i = 0; i < orig_nb_streams; i++)
878 av_dict_free(&opts[i]);
882 mFormatCtx->pb->eof_reached = 0; // FIXME hack, ffplay maybe should not use url_feof() to test for the end
// "auto" byte seeking: enabled when the format has timestamp discontinuities.
884 if (mSeekByBytes < 0)
885 mSeekByBytes = !!(mFormatCtx->iformat->flags & AVFMT_TS_DISCONT);
// Discard everything by default; stream_component_open() re-enables chosen streams.
887 for (i = 0; i < (int)mFormatCtx->nb_streams; i++)
888 mFormatCtx->streams[i]->discard = AVDISCARD_ALL;
890 st_index[AVMEDIA_TYPE_VIDEO] =
891 av_find_best_stream(mFormatCtx, AVMEDIA_TYPE_VIDEO,
892 wanted_stream[AVMEDIA_TYPE_VIDEO], -1, NULL, 0);
// The chosen video stream is passed as the related stream for the audio selection.
894 st_index[AVMEDIA_TYPE_AUDIO] =
895 av_find_best_stream(mFormatCtx, AVMEDIA_TYPE_AUDIO,
896 wanted_stream[AVMEDIA_TYPE_AUDIO],
897 st_index[AVMEDIA_TYPE_VIDEO],
900 av_dump_format(mFormatCtx, 0, mFilename, 0);
// Cache and log the container duration when both duration and start time are known.
903 if (mFormatCtx->duration != AV_NOPTS_VALUE &&
904 mFormatCtx->start_time != AV_NOPTS_VALUE) {
905 int hours, mins, secs, us;
907 ALOGV("file startTime: %lld", mFormatCtx->start_time);
909 mDuration = mFormatCtx->duration;
911 secs = mDuration / AV_TIME_BASE;
912 us = mDuration % AV_TIME_BASE;
917 ALOGI("the duration is %02d:%02d:%02d.%02d",
918 hours, mins, secs, (100 * us) / AV_TIME_BASE);
921 packet_queue_init(&mVideoQ);
922 packet_queue_init(&mAudioQ);
924 if (st_index[AVMEDIA_TYPE_AUDIO] >= 0) {
925 audio_ret = stream_component_open(st_index[AVMEDIA_TYPE_AUDIO]);
928 if (st_index[AVMEDIA_TYPE_VIDEO] >= 0) {
929 video_ret = stream_component_open(st_index[AVMEDIA_TYPE_VIDEO]);
// One usable stream is enough; fail only when neither could be opened.
932 if ( audio_ret < 0 && video_ret < 0) {
933 ALOGE("%s: could not open codecs\n", mFilename);
// Releases what initStreams() set up: destroys both packet queues and closes
// the input.
// NOTE(review): any guards around these calls and further clean-up are not
// visible in this view.
944 void FFmpegExtractor::deInitStreams()
946 packet_queue_destroy(&mVideoQ);
947 packet_queue_destroy(&mAudioQ);
950 avformat_close_input(&mFormatCtx);
// Starts the reader thread (ReaderWrapper -> readerEntry) if it is not running yet.
// Runs under mLock. The thread is created joinable so stopReaderThread() can join it.
// NOTE(review): the return values and the declaration of `attr` are not visible
// in this view. The result of pthread_create is not checked in the visible lines.
958 status_t FFmpegExtractor::startReaderThread() {
959 ALOGV("Starting reader thread");
960 Mutex::Autolock autoLock(mLock);
// Already running: nothing to start.
962 if (mReaderThreadStarted)
966 pthread_attr_init(&attr);
967 pthread_attr_setdetachstate(&attr, PTHREAD_CREATE_JOINABLE);
968 pthread_create(&mReaderThread, &attr, ReaderWrapper, this);
969 pthread_attr_destroy(&attr);
970 mReaderThreadStarted = true;
971 ALOGD("Reader thread started");
// Stops the reader thread and waits for it to exit. Runs under mLock.
// NOTE(review): the statement that asks the thread to stop and the declaration
// of `dummy` are not visible in this view.
976 void FFmpegExtractor::stopReaderThread() {
977 ALOGV("Stopping reader thread");
978 Mutex::Autolock autoLock(mLock);
// Nothing to do when the thread was never started or is already stopped.
980 if (!mReaderThreadStarted) {
981 ALOGD("Reader thread have been stopped");
// Blocks until readerEntry() has returned.
988 pthread_join(mReaderThread, &dummy);
989 mReaderThreadStarted = false;
990 ALOGD("Reader thread stopped");
// pthread entry point: `me` is the FFmpegExtractor passed to pthread_create;
// forwards to its readerEntry().
// NOTE(review): the return statement is not visible in this view.
994 void *FFmpegExtractor::ReaderWrapper(void *me) {
995 ((FFmpegExtractor *)me)->readerEntry();
// Body of the reader thread. Repeatedly:
//   - applies pause/resume changes to the demuxer,
//   - executes pending seek requests and pushes flush packets into the queues,
//   - stops reading more while the packet queues are considered full,
//   - reads the next packet with av_read_frame(),
//   - while a track is still deferred, tries to obtain its extradata from the
//     bitstream and then creates the track,
//   - hands the packet to the audio or video queue, or frees it.
// After the loop it closes the open streams and the input.
// NOTE(review): the loop header, many conditions, sleeps, `continue`/`break`/`goto`
// statements and several declarations are not visible in this view; the comments
// below describe only the visible statements.
1000 void FFmpegExtractor::readerEntry() {
1002 AVPacket pkt1, *pkt = &pkt1;
1004 int pkt_in_play_range = 0;
1006 ALOGV("FFmpegExtractor enter thread(readerEntry)");
1008 mVideoEOSReceived = false;
1009 mAudioEOSReceived = false;
// Propagate a pause-state change to the demuxer.
1015 if (mPaused != mLastPaused) {
1016 mLastPaused = mPaused;
1018 mReadPauseReturn = av_read_pause(mFormatCtx);
1020 av_read_play(mFormatCtx);
1022 #if CONFIG_RTSP_DEMUXER || CONFIG_MMSH_PROTOCOL
1024 (!strcmp(mFormatCtx->iformat->name, "rtsp") ||
1025 (mFormatCtx->pb && !strncmp(mFilename, "mmsh:", 5)))) {
1026 /* wait 10 ms to avoid trying to get another packet */
// Pending seek: target mSeekPos with no lower/upper bound restriction.
1034 ALOGV("readerEntry, mSeekReq: %d", mSeekReq);
1035 ret = avformat_seek_file(mFormatCtx, -1, INT64_MIN, mSeekPos, INT64_MAX, mSeekFlags);
1037 ALOGE("%s: error while seeking", mFormatCtx->filename);
// Empty each active queue and insert its flush packet so the consumer
// (Track::read) can tell where post-seek data starts.
1039 if (mAudioStreamIdx >= 0) {
1040 packet_queue_flush(&mAudioQ);
1041 packet_queue_put(&mAudioQ, &mAudioQ.flush_pkt);
1043 if (mVideoStreamIdx >= 0) {
1044 packet_queue_flush(&mVideoQ);
1045 packet_queue_put(&mVideoQ, &mVideoQ.flush_pkt);
1052 /* if the queue are full, no need to read more */
// Full means: total bytes over MAX_QUEUE_SIZE, or both queues individually
// satisfied (audio by byte size, video by packet count); an inactive stream
// counts as satisfied.
1053 if ( mAudioQ.size + mVideoQ.size > MAX_QUEUE_SIZE
1054 || ( (mAudioQ .size > MIN_AUDIOQ_SIZE || mAudioStreamIdx < 0)
1055 && (mVideoQ .nb_packets > MIN_FRAMES || mVideoStreamIdx < 0))) {
1056 #if DEBUG_READ_ENTRY
1057 ALOGV("readerEntry, full(wtf!!!), mVideoQ.size: %d, mVideoQ.nb_packets: %d, mAudioQ.size: %d, mAudioQ.nb_packets: %d",
1058 mVideoQ.size, mVideoQ.nb_packets, mAudioQ.size, mAudioQ.nb_packets);
// End-of-file handling: queue a null packet for each active stream
// (Track::read treats a packet with no data and size 0 as end-of-stream).
1066 if (mVideoStreamIdx >= 0) {
1067 packet_queue_put_nullpacket(&mVideoQ, mVideoStreamIdx);
1069 if (mAudioStreamIdx >= 0) {
1070 packet_queue_put_nullpacket(&mAudioQ, mAudioStreamIdx);
1073 #if DEBUG_READ_ENTRY
1074 ALOGV("readerEntry, eof = 1, mVideoQ.size: %d, mVideoQ.nb_packets: %d, mAudioQ.size: %d, mAudioQ.nb_packets: %d",
1075 mVideoQ.size, mVideoQ.nb_packets, mAudioQ.size, mAudioQ.nb_packets);
1077 if (mAudioQ.size + mVideoQ.size == 0) {
1087 ret = av_read_frame(mFormatCtx, pkt);
// Read failure: distinguish end-of-file from an I/O error on the AVIOContext.
1090 if (ret == AVERROR_EOF || url_feof(mFormatCtx->pb))
1091 if (ret == AVERROR_EOF) {
1092 //ALOGV("ret == AVERROR_EOF");
1094 if (url_feof(mFormatCtx->pb)) {
1095 //ALOGV("url_feof(mFormatCtx->pb)");
1100 if (mFormatCtx->pb && mFormatCtx->pb->error) {
1101 ALOGE("mFormatCtx->pb->error: %d", mFormatCtx->pb->error);
1108 if (pkt->stream_index == mVideoStreamIdx) {
// Video track still deferred: try to split the extradata off this packet.
1109 if (mDefersToCreateVideoTrack) {
1110 AVCodecContext *avctx = mFormatCtx->streams[mVideoStreamIdx]->codec;
// `i` is the number of leading bytes of the packet to use as extradata.
1112 int i = parser_split(avctx, pkt->data, pkt->size);
1113 if (i > 0 && i < FF_MAX_EXTRADATA_SIZE) {
// Replace any previous extradata with a padded copy of those bytes.
1114 if (avctx->extradata)
1115 av_freep(&avctx->extradata);
1116 avctx->extradata_size= i;
1117 avctx->extradata = (uint8_t *)av_malloc(avctx->extradata_size + FF_INPUT_BUFFER_PADDING_SIZE);
1118 if (!avctx->extradata) {
1119 //return AVERROR(ENOMEM);
1120 ret = AVERROR(ENOMEM);
1123 // sps + pps(there may be sei in it)
1124 memcpy(avctx->extradata, pkt->data, avctx->extradata_size);
// Zero the padding that follows the extradata.
1125 memset(avctx->extradata + i, 0, FF_INPUT_BUFFER_PADDING_SIZE);
1127 av_free_packet(pkt);
// Retry track creation now that extradata may be available.
1131 stream_component_open(mVideoStreamIdx);
1132 if (!mDefersToCreateVideoTrack)
1133 ALOGI("probe packet counter: %d when create video track ok", mProbePkts);
1134 if (mProbePkts == EXTRACTOR_MAX_PROBE_PACKETS)
1135 ALOGI("probe packet counter to max: %d, create video track: %d",
1136 mProbePkts, !mDefersToCreateVideoTrack);
1138 } else if (pkt->stream_index == mAudioStreamIdx) {
1142 AVCodecContext *avctx = mFormatCtx->streams[mAudioStreamIdx]->codec;
// Run the packet through the audio bitstream filter when one is open.
1143 if (mAudioBsfc && pkt && pkt->data) {
1144 ret = av_bitstream_filter_filter(mAudioBsfc, avctx, NULL, &outbuf, &outbuf_size,
1145 pkt->data, pkt->size, pkt->flags & AV_PKT_FLAG_KEY);
// Filter failure or empty output: drop the packet.
1147 if (ret < 0 ||!outbuf_size) {
1148 av_free_packet(pkt);
// The filter produced a separate buffer: copy its content back into the packet.
// NOTE(review): assumes outbuf_size never exceeds the packet's buffer — confirm.
1151 if (outbuf && outbuf != pkt->data) {
1152 memmove(pkt->data, outbuf, outbuf_size);
1153 pkt->size = outbuf_size;
// Audio track still deferred: packets are dropped until the codec context has extradata.
1156 if (mDefersToCreateAudioTrack) {
1157 if (avctx->extradata_size <= 0) {
1158 av_free_packet(pkt);
1161 stream_component_open(mAudioStreamIdx);
1162 if (!mDefersToCreateAudioTrack)
1163 ALOGI("probe packet counter: %d when create audio track ok", mProbePkts);
1164 if (mProbePkts == EXTRACTOR_MAX_PROBE_PACKETS)
1165 ALOGI("probe packet counter to max: %d, create audio track: %d",
1166 mProbePkts, !mDefersToCreateAudioTrack);
// Route the packet to its queue; packets of other streams are freed.
1170 if (pkt->stream_index == mAudioStreamIdx) {
1171 packet_queue_put(&mAudioQ, pkt);
1172 } else if (pkt->stream_index == mVideoStreamIdx) {
1173 packet_queue_put(&mVideoQ, pkt);
1175 av_free_packet(pkt);
1178 /* wait until the end */
1179 while (!mAbortRequest) {
1185 ALOGI("reader thread goto end...");
1187 /* close each stream */
1188 if (mAudioStreamIdx >= 0)
1189 stream_component_close(mAudioStreamIdx);
1190 if (mVideoStreamIdx >= 0)
1191 stream_component_close(mVideoStreamIdx);
1193 avformat_close_input(&mFormatCtx);
1196 ALOGV("FFmpegExtractor exit thread(readerEntry)");
1199 ////////////////////////////////////////////////////////////////////////////////
// Creates a track for `stream`. For H.264 streams whose extradata starts with
// byte 1 (avcC layout), the NAL length-prefix size is read from the kKeyAVCC
// data stored in `meta`.
// NOTE(review): most of the initializer list and the lines that set the AVC
// flags are not visible in this view.
1201 FFmpegExtractor::Track::Track(
1202 FFmpegExtractor *extractor, sp<MetaData> meta,
1203 AVStream *stream, PacketQueue *queue)
1204 : mExtractor(extractor),
1212 /* H.264 Video Types */
1214 AVCodecContext *avctx = stream->codec;
// extradata_size is checked before extradata[0] is read.
1216 if (avctx->codec_id == AV_CODEC_ID_H264
1217 && avctx->extradata_size > 0
1218 && avctx->extradata[0] == 1) {
// The metadata for such a stream is required to carry kKeyAVCC.
1224 CHECK(meta->findData(kKeyAVCC, &type, &data, &size));
1226 const uint8_t *ptr = (const uint8_t *)data;
1229 CHECK_EQ((unsigned)ptr[0], 1u); // configurationVersion == 1
1231 // The number of bytes used to encode the length of a NAL unit.
// The low two bits of byte 4 hold (length size - 1).
// NOTE(review): no check that `size` is at least 5 is visible here — confirm.
1232 mNALLengthSize = 1 + (ptr[4] & 3);
1234 ALOGV("the stream is AVC, the length of a NAL unit: %d", mNALLengthSize);
1240 mMediaType = mStream->codec->codec_type;
// No key packet seen yet.
1241 mFirstKeyPktTimestamp = AV_NOPTS_VALUE;
// Destructor; logs the media type of the track being destroyed.
// NOTE(review): any clean-up statements are not visible in this view.
1244 FFmpegExtractor::Track::~Track() {
1245 ALOGV("FFmpegExtractor::Track::~Track %s",
1246 av_get_media_type_string(mMediaType));
// MediaSource::start. Takes the track lock and logs; starting the reader thread
// from here is disabled (commented out). `params` is not used in the visible lines.
// NOTE(review): the return statement is not visible in this view.
1251 status_t FFmpegExtractor::Track::start(MetaData *params) {
1252 ALOGV("FFmpegExtractor::Track::start %s",
1253 av_get_media_type_string(mMediaType));
1254 Mutex::Autolock autoLock(mLock);
1255 //mExtractor->startReaderThread();
// MediaSource::stop. Takes the track lock and logs; stopping the reader thread
// from here is disabled (commented out).
// NOTE(review): the return statement is not visible in this view.
1259 status_t FFmpegExtractor::Track::stop() {
1260 ALOGV("FFmpegExtractor::Track::stop %s",
1261 av_get_media_type_string(mMediaType));
1262 Mutex::Autolock autoLock(mLock);
1263 //mExtractor->stopReaderThread();
// MediaSource::getFormat. Takes the track lock before returning the format.
// NOTE(review): the return statement is not visible in this view.
1267 sp<MetaData> FFmpegExtractor::Track::getFormat() {
1268 Mutex::Autolock autoLock(mLock);
// MediaSource::read. Delivers the next packet of this track as a MediaBuffer.
//   - An optional seek request in `options` is forwarded to the extractor.
//   - Packets are taken from the track's queue; a flush packet resets the
//     first-key-packet timestamp, and a packet with no data and size 0 means
//     end-of-stream.
//   - Packets with a negative timestamp, or a timestamp earlier than the first
//     key packet, are dropped.
//   - AVC payloads are converted from length-prefixed NAL units to Annex B when
//     that conversion is enabled; otherwise the payload is copied unchanged.
//   - The buffer is tagged with kKeyTime (microseconds relative to the stream
//     start time) and kKeyIsSyncFrame.
// Visible return codes: ERROR_END_OF_STREAM at end of stream and ERROR_MALFORMED
// when the NAL conversion fails.
// NOTE(review): loop headers, `goto`/`continue` statements, several declarations
// and the final return are not visible in this view.
1273 status_t FFmpegExtractor::Track::read(
1274 MediaBuffer **buffer, const ReadOptions *options) {
1277 Mutex::Autolock autoLock(mLock);
1280 bool seeking = false;
1281 bool waitKeyPkt = false;
1282 ReadOptions::SeekMode mode;
1283 int64_t pktTS = AV_NOPTS_VALUE;
1284 int64_t seekTimeUs = AV_NOPTS_VALUE;
1285 int64_t timeUs = AV_NOPTS_VALUE;
1287 status_t status = OK;
1289 if (options && options->getSeekTo(&seekTimeUs, &mode)) {
1290 ALOGV("~~~%s seekTimeUs: %lld, mode: %d", av_get_media_type_string(mMediaType), seekTimeUs, mode);
1291 /* add the stream start time */
// The start time is converted from stream ticks to microseconds before adding.
1292 if (mStream->start_time != AV_NOPTS_VALUE)
1293 seekTimeUs += mStream->start_time * av_q2d(mStream->time_base) * 1000000;
1294 ALOGV("~~~%s seekTimeUs[+startTime]: %lld, mode: %d", av_get_media_type_string(mMediaType), seekTimeUs, mode);
1296 if (mExtractor->stream_seek(seekTimeUs, mMediaType) == SEEK)
// Blocking get (third argument 1); a negative result is treated as end-of-stream.
1301 if (packet_queue_get(mQueue, &pkt, 1) < 0) {
1302 mExtractor->reachedEOS(mMediaType);
1303 return ERROR_END_OF_STREAM;
// Packets other than the flush packet are freed here; the enclosing condition
// is not visible (presumably: while a seek is pending — confirm).
1307 if (pkt.data != mQueue->flush_pkt.data) {
1308 av_free_packet(&pkt);
1312 #if WAIT_KEY_PACKET_AFTER_SEEK
// Flush packet: data after a seek starts here, so forget the previous key timestamp.
1318 if (pkt.data == mQueue->flush_pkt.data) {
1319 ALOGV("read %s flush pkt", av_get_media_type_string(mMediaType));
1320 av_free_packet(&pkt);
1321 mFirstKeyPktTimestamp = AV_NOPTS_VALUE;
// Null packet queued by the reader at end-of-file.
1323 } else if (pkt.data == NULL && pkt.size == 0) {
1324 ALOGD("read %s eos pkt", av_get_media_type_string(mMediaType));
1325 av_free_packet(&pkt);
1326 mExtractor->reachedEOS(mMediaType);
1327 return ERROR_END_OF_STREAM;
1330 key = pkt.flags & AV_PKT_FLAG_KEY ? 1 : 0;
1331 pktTS = pkt.pts; //FIXME AV_NOPTS_VALUE??
1334 if (pkt.pts == AV_NOPTS_VALUE)
1337 //FIXME, drop, omxcodec requires a positive timestamp! e.g. vorbis
1338 if (pktTS != AV_NOPTS_VALUE && pktTS < 0) {
1339 ALOGW("drop the packet with negative timestamp(pts:%lld)", pktTS);
1340 av_free_packet(&pkt);
1346 ALOGV("drop the non-key packet");
1347 av_free_packet(&pkt);
1350 ALOGV("~~~~~~ got the key packet");
1355 if (pktTS != AV_NOPTS_VALUE && mFirstKeyPktTimestamp == AV_NOPTS_VALUE) {
1356 // update the first key timestamp
1357 mFirstKeyPktTimestamp = pktTS;
1360 if (pktTS != AV_NOPTS_VALUE && pktTS < mFirstKeyPktTimestamp) {
1361 ALOGV("drop the packet with the backward timestamp, maybe they are B-frames after I-frame ^_^");
1362 av_free_packet(&pkt);
// Allocate with FFmpeg's input padding, but expose only pkt.size bytes as payload.
1366 MediaBuffer *mediaBuffer = new MediaBuffer(pkt.size + FF_INPUT_BUFFER_PADDING_SIZE);
1367 mediaBuffer->meta_data()->clear();
1368 mediaBuffer->set_range(0, pkt.size);
1371 if (mIsAVC && mNal2AnnexB) {
1372 /* This only works for NAL sizes 3-4 */
1373 CHECK(mNALLengthSize == 3 || mNALLengthSize == 4);
1375 uint8_t *dst = (uint8_t *)mediaBuffer->data();
1376 /* Convert H.264 NAL format to annex b */
1377 status = convertNal2AnnexB(dst, pkt.size, pkt.data, pkt.size, mNALLengthSize);
// Conversion failed: release both the buffer and the packet before reporting.
1379 ALOGE("convertNal2AnnexB failed");
1380 mediaBuffer->release();
1382 av_free_packet(&pkt);
1383 return ERROR_MALFORMED;
1386 memcpy(mediaBuffer->data(), pkt.data, pkt.size);
// Presentation time in microseconds, relative to the stream start time.
1389 int64_t start_time = mStream->start_time != AV_NOPTS_VALUE ? mStream->start_time : 0;
1390 if (pktTS != AV_NOPTS_VALUE)
1391 timeUs = (int64_t)((pktTS - start_time) * av_q2d(mStream->time_base) * 1000000);
1393 timeUs = SF_NOPTS_VALUE; //FIXME AV_NOPTS_VALUE is negative, but stagefright need positive
1396 if (pktTS != AV_NOPTS_VALUE)
1397 ALOGV("read %s pkt, size:%d, key:%d, pts:%lld, dts:%lld, timeUs[-startTime]:%lld us (%.2f secs)",
1398 av_get_media_type_string(mMediaType), pkt.size, key, pkt.pts, pkt.dts, timeUs, timeUs/1E6);
1400 ALOGV("read %s pkt, size:%d, key:%d, pts:N/A, dts:N/A, timeUs[-startTime]:N/A",
1401 av_get_media_type_string(mMediaType), pkt.size, key);
1404 mediaBuffer->meta_data()->setInt64(kKeyTime, timeUs);
1405 mediaBuffer->meta_data()->setInt32(kKeyIsSyncFrame, key);
// The buffer is handed to the caller; the packet's data was copied, so the packet is freed.
1407 *buffer = mediaBuffer;
1409 av_free_packet(&pkt);
1414 ////////////////////////////////////////////////////////////////////////////////
1418 const char *container;
// Table pairing an FFmpeg input-format name string (first field) with the MIME
// string reported for it (second field). findMatchingContainer() walks this
// table in order and compares each name case-insensitively over the length of
// the table entry only, so an input name such as "mpegts" matches both the
// "mpeg" and the "mpegts" rows; entry order therefore matters.
// NOTE(review): the "ac3" and "mp3" rows map to MEDIA_MIMETYPE_AUDIO_* values
// while every other row maps to a MEDIA_MIMETYPE_CONTAINER_* value.
// NOTE(review): "mpegts" maps to MEDIA_MIMETYPE_CONTAINER_TS, whereas
// adjustConfidenceIfNeeded() tests for MEDIA_MIMETYPE_CONTAINER_MPEG2TS --
// confirm the two constants name the same MIME string.
1421 static formatmap FILE_FORMATS[] = {
1422 {"mpeg", MEDIA_MIMETYPE_CONTAINER_MPEG2PS },
1423 {"mpegts", MEDIA_MIMETYPE_CONTAINER_TS },
1424 {"mov,mp4,m4a,3gp,3g2,mj2", MEDIA_MIMETYPE_CONTAINER_MPEG4 },
1425 {"matroska,webm", MEDIA_MIMETYPE_CONTAINER_MATROSKA },
1426 {"asf", MEDIA_MIMETYPE_CONTAINER_ASF },
1427 {"rm", MEDIA_MIMETYPE_CONTAINER_RM },
1428 {"flv", MEDIA_MIMETYPE_CONTAINER_FLV },
1429 {"swf", MEDIA_MIMETYPE_CONTAINER_FLV },
1430 {"avi", MEDIA_MIMETYPE_CONTAINER_AVI },
1431 {"ape", MEDIA_MIMETYPE_CONTAINER_APE },
1432 {"dts", MEDIA_MIMETYPE_CONTAINER_DTS },
1433 {"flac", MEDIA_MIMETYPE_CONTAINER_FLAC },
1434 {"ac3", MEDIA_MIMETYPE_AUDIO_AC3 },
1435 {"mp3", MEDIA_MIMETYPE_AUDIO_MPEG },
1436 {"wav", MEDIA_MIMETYPE_CONTAINER_WAV },
1437 {"ogg", MEDIA_MIMETYPE_CONTAINER_OGG },
1438 {"vc1", MEDIA_MIMETYPE_CONTAINER_VC1 },
1439 {"hevc", MEDIA_MIMETYPE_CONTAINER_HEVC },
// Walks ic->streams in index order and returns the codec_id of a stream whose
// codec context has the requested codec_type. Falls through to
// AV_CODEC_ID_NONE when the loop finishes without returning.
//
// ic:         opened format context whose streams are inspected.
// codec_type: media type to look for (callers pass AVMEDIA_TYPE_VIDEO/AUDIO).
//
// NOTE(review): the statement inside the AV_DISPOSITION_ATTACHED_PIC branch is
// not visible in this excerpt; going by the comment it presumably skips such
// streams (embedded album art) -- confirm.
1442 static enum AVCodecID getCodecId(AVFormatContext *ic, AVMediaType codec_type)
1444 unsigned int idx = 0;
1445 AVCodecContext *avctx = NULL;
1447 for (idx = 0; idx < ic->nb_streams; idx++) {
1448 if (ic->streams[idx]->disposition & AV_DISPOSITION_ATTACHED_PIC) {
1449 // FFMPEG converts album art to MJPEG, but we don't want to
1450 // include that in the parsing as MJPEG is not supported by
1451 // Android, which forces the media to be extracted by FFMPEG
1452 // while in fact, Android supports it.
1456 avctx = ic->streams[idx]->codec;
1457 if (avctx->codec_type == codec_type) {
1458 return avctx->codec_id;
1462 return AV_CODEC_ID_NONE;
// Checks, via getCodecId(), whether the input exposes a video codec and/or an
// audio codec, and evaluates the "audio but no video" condition.
// NOTE(review): the assignments to haveVideo/haveAudio and the return
// statements are not visible in this excerpt; presumably the function returns
// true exactly when (!haveVideo && haveAudio) holds -- confirm.
// NOTE(review): codec_id is declared but not used in any visible line.
1465 static bool hasAudioCodecOnly(AVFormatContext *ic)
1467 enum AVCodecID codec_id = AV_CODEC_ID_NONE;
1468 bool haveVideo = false;
1469 bool haveAudio = false;
1471 if (getCodecId(ic, AVMEDIA_TYPE_VIDEO) != AV_CODEC_ID_NONE) {
1474 if (getCodecId(ic, AVMEDIA_TYPE_AUDIO) != AV_CODEC_ID_NONE) {
1478 if (!haveVideo && haveAudio) {
// Classifies codec_id against the hard-coded case list below (video codecs
// first, then audio codecs) and logs the verdict with ALOGD.
// NOTE(review): the switch header, the statements that set `supported`, any
// default branch and the return are not visible in this excerpt; presumably
// the listed ids yield true and everything else false -- confirm.
// NOTE(review): the log text spells "suppoted"; it is a runtime string and is
// left untouched here.
1485 //FIXME all codecs: frameworks/av/media/libstagefright/codecs/*
1486 static bool isCodecSupportedByStagefright(enum AVCodecID codec_id)
1488 bool supported = false;
1492 case AV_CODEC_ID_H264:
1493 case AV_CODEC_ID_MPEG4:
1494 case AV_CODEC_ID_H263:
1495 case AV_CODEC_ID_H263P:
1496 case AV_CODEC_ID_H263I:
1497 case AV_CODEC_ID_VP6:
1498 case AV_CODEC_ID_VP8:
1499 case AV_CODEC_ID_VP9:
1501 case AV_CODEC_ID_AAC:
1502 case AV_CODEC_ID_MP3:
1503 case AV_CODEC_ID_AMR_NB:
1504 case AV_CODEC_ID_AMR_WB:
1505 case AV_CODEC_ID_FLAC:
1506 case AV_CODEC_ID_VORBIS:
1507 case AV_CODEC_ID_PCM_MULAW: //g711
1508 case AV_CODEC_ID_PCM_ALAW: //g711
1509 case AV_CODEC_ID_GSM_MS:
1510 case AV_CODEC_ID_PCM_U8:
1511 case AV_CODEC_ID_PCM_S16LE:
1512 case AV_CODEC_ID_PCM_S24LE:
1520 ALOGD("%ssuppoted codec(%s) by official Stagefright",
1521 (supported ? "" : "un"),
1522 avcodec_get_name(codec_id));
// Confidence tuning for input already classified as the MPEG4 container.
// Writes 0.41f to *confidence (just above the 0.4f the inline comment
// attributes to the stock MPEG4 extractor) in three situations:
//   1. the video codec reported by getCodecId() is present and is not one of
//      H264 / MPEG4 / H263 / H263P / H263I;
//   2. the audio codec reported by getCodecId() is present and is not one of
//      MP3 / AAC / AMR_NB / AMR_WB;
//   3. the "major_brand" metadata tag equals the QuickTime brand string.
// NOTE(review): lines between the visible statements are missing from this
// excerpt. In particular it cannot be seen whether each case returns early,
// or whether `tag` is null-checked before tag->value is read -- confirm.
1527 static void adjustMPEG4Confidence(AVFormatContext *ic, float *confidence)
1529 AVDictionary *tags = NULL;
1530 AVDictionaryEntry *tag = NULL;
1531 enum AVCodecID codec_id = AV_CODEC_ID_NONE;
1534 codec_id = getCodecId(ic, AVMEDIA_TYPE_VIDEO);
1535 if (codec_id != AV_CODEC_ID_NONE
1536 && codec_id != AV_CODEC_ID_H264
1537 && codec_id != AV_CODEC_ID_MPEG4
1538 && codec_id != AV_CODEC_ID_H263
1539 && codec_id != AV_CODEC_ID_H263P
1540 && codec_id != AV_CODEC_ID_H263I) {
1541 //the MEDIA_MIMETYPE_CONTAINER_MPEG4 of confidence is 0.4f
1542 ALOGI("[mp4]video codec(%s), confidence should be larger than MPEG4Extractor",
1543 avcodec_get_name(codec_id));
1544 *confidence = 0.41f;
1547 codec_id = getCodecId(ic, AVMEDIA_TYPE_AUDIO);
1548 if (codec_id != AV_CODEC_ID_NONE
1549 && codec_id != AV_CODEC_ID_MP3
1550 && codec_id != AV_CODEC_ID_AAC
1551 && codec_id != AV_CODEC_ID_AMR_NB
1552 && codec_id != AV_CODEC_ID_AMR_WB) {
1553 ALOGI("[mp4]audio codec(%s), confidence should be larger than MPEG4Extractor",
1554 avcodec_get_name(codec_id));
1555 *confidence = 0.41f;
1559 tags = ic->metadata;
1560 //NOTE: You can use command to show these tags,
1561 //e.g. "ffprobe -show_format 2012.mov"
1562 tag = av_dict_get(tags, "major_brand", NULL, 0);
1567 ALOGV("major_brand tag is:%s", tag->value);
1569 //when MEDIA_MIMETYPE_CONTAINER_MPEG4
1570 //WTF, MPEG4Extractor.cpp can not extractor mov format
1571 //NOTE: isCompatibleBrand(MPEG4Extractor.cpp)
1572 // Won't promise that the following file types can be played.
1573 // Just give these file types a chance.
1574 // FOURCC('q', 't', ' ', ' '), // Apple's QuickTime
1576 if (!strcmp(tag->value, "qt ")) {
1577 ALOGI("[mp4]format is mov, confidence should be larger than mpeg4");
1578 *confidence = 0.41f;
// Confidence tuning for input classified as MPEG2-TS. Writes 0.11f to
// *confidence (just above the 0.1f the inline comment attributes to the stock
// MPEG2-TS extractor) when:
//   - the video codec reported by getCodecId() is present and is not one of
//     H264 / MPEG4 / MPEG1VIDEO / MPEG2VIDEO; or
//   - the audio codec reported by getCodecId() is present and is not one of
//     AAC / PCM_S16LE / MP1 / MP2 / MP3.
// NOTE(review): the lines following each assignment are missing from this
// excerpt, so whether the video case returns before the audio check cannot be
// seen; both cases write the same value either way.
1582 static void adjustMPEG2TSConfidence(AVFormatContext *ic, float *confidence)
1584 enum AVCodecID codec_id = AV_CODEC_ID_NONE;
1586 codec_id = getCodecId(ic, AVMEDIA_TYPE_VIDEO);
1587 if (codec_id != AV_CODEC_ID_NONE
1588 && codec_id != AV_CODEC_ID_H264
1589 && codec_id != AV_CODEC_ID_MPEG4
1590 && codec_id != AV_CODEC_ID_MPEG1VIDEO
1591 && codec_id != AV_CODEC_ID_MPEG2VIDEO) {
1592 //the MEDIA_MIMETYPE_CONTAINER_MPEG2TS of confidence is 0.1f
1593 ALOGI("[mpeg2ts]video codec(%s), confidence should be larger than MPEG2TSExtractor",
1594 avcodec_get_name(codec_id));
1595 *confidence = 0.11f;
1598 codec_id = getCodecId(ic, AVMEDIA_TYPE_AUDIO);
1599 if (codec_id != AV_CODEC_ID_NONE
1600 && codec_id != AV_CODEC_ID_AAC
1601 && codec_id != AV_CODEC_ID_PCM_S16LE //FIXME, AV_CODEC_ID_PCM_S24LE, AV_CODEC_ID_PCM_S32LE?
1602 && codec_id != AV_CODEC_ID_MP1
1603 && codec_id != AV_CODEC_ID_MP2
1604 && codec_id != AV_CODEC_ID_MP3) {
1605 ALOGI("[mpeg2ts]audio codec(%s), confidence should be larger than MPEG2TSExtractor",
1606 avcodec_get_name(codec_id));
1607 *confidence = 0.11f;
// Confidence tuning for input classified as Matroska. Writes 0.61f to
// *confidence (just above the 0.6f the inline comment attributes to the stock
// Matroska extractor) when:
//   - the video codec reported by getCodecId() is present and is not one of
//     H264 / MPEG4 / VP6 / VP8 / VP9; or
//   - the audio codec reported by getCodecId() is present and is not one of
//     AAC / MP3 / VORBIS.
// NOTE(review): the lines following each assignment are missing from this
// excerpt, so whether the video case returns before the audio check cannot be
// seen; both cases write the same value either way.
1611 static void adjustMKVConfidence(AVFormatContext *ic, float *confidence)
1613 enum AVCodecID codec_id = AV_CODEC_ID_NONE;
1615 codec_id = getCodecId(ic, AVMEDIA_TYPE_VIDEO);
1616 if (codec_id != AV_CODEC_ID_NONE
1617 && codec_id != AV_CODEC_ID_H264
1618 && codec_id != AV_CODEC_ID_MPEG4
1619 && codec_id != AV_CODEC_ID_VP6
1620 && codec_id != AV_CODEC_ID_VP8
1621 && codec_id != AV_CODEC_ID_VP9) {
1622 //the MEDIA_MIMETYPE_CONTAINER_MATROSKA of confidence is 0.6f
1623 ALOGI("[mkv]video codec(%s), confidence should be larger than MatroskaExtractor",
1624 avcodec_get_name(codec_id));
1625 *confidence = 0.61f;
1628 codec_id = getCodecId(ic, AVMEDIA_TYPE_AUDIO);
1629 if (codec_id != AV_CODEC_ID_NONE
1630 && codec_id != AV_CODEC_ID_AAC
1631 && codec_id != AV_CODEC_ID_MP3
1632 && codec_id != AV_CODEC_ID_VORBIS) {
1633 ALOGI("[mkv]audio codec(%s), confidence should be larger than MatroskaExtractor",
1634 avcodec_get_name(codec_id));
1635 *confidence = 0.61f;
// Container-independent confidence tuning based on the codecs in the input:
//   - writes 0.88f when the video codec reported by getCodecId() is present
//     and rejected by isCodecSupportedByStagefright();
//   - does the same for the audio codec;
//   - writes 0.22f when a video codec is present and the audio codec is MP3
//     (per the inline comment, chosen to exceed the MP3 extractor's value).
// NOTE(review): the lines between these steps are missing from this excerpt,
// so it cannot be seen whether the 0.88f cases return early or whether the
// final 0.22f assignment can overwrite them -- confirm.
1639 static void adjustCodecConfidence(AVFormatContext *ic, float *confidence)
1641 enum AVCodecID codec_id = AV_CODEC_ID_NONE;
1643 codec_id = getCodecId(ic, AVMEDIA_TYPE_VIDEO);
1644 if (codec_id != AV_CODEC_ID_NONE) {
1645 if (!isCodecSupportedByStagefright(codec_id)) {
1646 *confidence = 0.88f;
1650 codec_id = getCodecId(ic, AVMEDIA_TYPE_AUDIO);
1651 if (codec_id != AV_CODEC_ID_NONE) {
1652 if (!isCodecSupportedByStagefright(codec_id)) {
1653 *confidence = 0.88f;
1657 if (getCodecId(ic, AVMEDIA_TYPE_VIDEO) != AV_CODEC_ID_NONE
1658 && getCodecId(ic, AVMEDIA_TYPE_AUDIO) == AV_CODEC_ID_MP3) {
1659 *confidence = 0.22f; //larger than MP3Extractor
// Entry point for confidence tuning. Selects a container-specific adjuster by
// comparing `mime` case-insensitively against the MPEG4, MPEG2TS and MATROSKA
// container MIME constants, then tests *confidence and calls
// adjustCodecConfidence().
// NOTE(review): the body of the `*confidence > 0.08` branch is missing from
// this excerpt; presumably it returns so that the codec-based adjustment only
// runs when no container-specific rule fired -- confirm.
// NOTE(review): the comparison uses the double literal 0.08, while
// SniffFFMPEG() initialises and compares the same value as 0.08f.
1663 //TODO need more checks
1664 static void adjustConfidenceIfNeeded(const char *mime,
1665 AVFormatContext *ic, float *confidence)
1668 if (!strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_MPEG4)) {
1669 adjustMPEG4Confidence(ic, confidence);
1670 } else if (!strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_MPEG2TS)) {
1671 adjustMPEG2TSConfidence(ic, confidence);
1672 } else if (!strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_MATROSKA)) {
1673 adjustMKVConfidence(ic, confidence);
1678 if (*confidence > 0.08) {
1683 adjustCodecConfidence(ic, confidence);
// Picks a replacement MIME for audio-only input. Starting from *mime, the
// audio codec id reported by getCodecId() selects one of the
// MEDIA_MIMETYPE_AUDIO_* constants in the case list below; when *mime is
// MEDIA_MIMETYPE_CONTAINER_FFMPEG the choice is MEDIA_MIMETYPE_AUDIO_FFMPEG.
// A change from *mime to the new value is logged with ALOGI.
// CHECK() aborts if no audio codec is found at that point.
// NOTE(review): several lines are missing from this excerpt -- the body of
// the !hasAudioCodecOnly() branch (presumably an early return), the switch
// header, the break/default statements, and the write-back of newMime into
// *mime -- confirm against the full file.
1686 static void adjustContainerIfNeeded(const char **mime, AVFormatContext *ic)
1688 const char *newMime = *mime;
1689 enum AVCodecID codec_id = AV_CODEC_ID_NONE;
1691 if (!hasAudioCodecOnly(ic)) {
1695 codec_id = getCodecId(ic, AVMEDIA_TYPE_AUDIO);
1696 CHECK(codec_id != AV_CODEC_ID_NONE);
1698 case AV_CODEC_ID_MP3:
1699 newMime = MEDIA_MIMETYPE_AUDIO_MPEG;
1701 case AV_CODEC_ID_AAC:
1702 newMime = MEDIA_MIMETYPE_AUDIO_AAC;
1704 case AV_CODEC_ID_VORBIS:
1705 newMime = MEDIA_MIMETYPE_AUDIO_VORBIS;
1707 case AV_CODEC_ID_FLAC:
1708 newMime = MEDIA_MIMETYPE_AUDIO_FLAC;
1710 case AV_CODEC_ID_AC3:
1711 newMime = MEDIA_MIMETYPE_AUDIO_AC3;
1713 case AV_CODEC_ID_APE:
1714 newMime = MEDIA_MIMETYPE_AUDIO_APE;
1716 case AV_CODEC_ID_DTS:
1717 newMime = MEDIA_MIMETYPE_AUDIO_DTS;
1719 case AV_CODEC_ID_MP2:
1720 newMime = MEDIA_MIMETYPE_AUDIO_MPEG_LAYER_II;
1722 case AV_CODEC_ID_COOK:
1723 newMime = MEDIA_MIMETYPE_AUDIO_RA;
1725 case AV_CODEC_ID_WMAV1:
1726 case AV_CODEC_ID_WMAV2:
1727 case AV_CODEC_ID_WMAPRO:
1728 case AV_CODEC_ID_WMALOSSLESS:
1729 newMime = MEDIA_MIMETYPE_AUDIO_WMA;
1735 if (!strcmp(*mime, MEDIA_MIMETYPE_CONTAINER_FFMPEG)) {
1736 newMime = MEDIA_MIMETYPE_AUDIO_FFMPEG;
1739 if (strcmp(*mime, newMime)) {
1740 ALOGI("adjust mime(%s -> %s)", *mime, newMime);
// Maps an FFmpeg input-format name to the MIME string stored in FILE_FORMATS.
// Each table entry is compared with strncasecmp() over the length of the
// table entry, i.e. an entry matches when `name` starts with it
// (case-insensitively). `container` starts out as NULL and is only assigned
// on a match.
// The first loop only logs the table contents.
// NOTE(review): because this is a prefix test, "mpegts" matches the earlier
// "mpeg" row as well as its own row; which row wins depends on whether the
// loop breaks on the first hit, and that line is not visible in this
// excerpt -- confirm.
// NOTE(review): the declaration of `i`, any preprocessor guard around the
// listing loop, and the return statement are not visible here. The log text
// spells "suppoted"; it is a runtime string and is left untouched.
1745 static const char *findMatchingContainer(const char *name)
1748 const char *container = NULL;
1751 ALOGI("list the formats suppoted by ffmpeg: ");
1752 ALOGI("========================================");
1753 for (i = 0; i < NELEM(FILE_FORMATS); ++i) {
1754 ALOGV("format_names[%02d]: %s", i, FILE_FORMATS[i].format);
1756 ALOGI("========================================");
1759 for (i = 0; i < NELEM(FILE_FORMATS); ++i) {
1760 int len = strlen(FILE_FORMATS[i].format);
1761 if (!strncasecmp(name, FILE_FORMATS[i].format, len)) {
1762 container = FILE_FORMATS[i].container;
// Shared sniffing routine: opens `url` through libavformat, probes the
// streams, and derives a container MIME plus a confidence value.
//
// Visible sequence:
//   1. initFFmpeg(), then avformat_alloc_context() and avformat_open_input().
//   2. A check on ic->iformat->name that resolves the container straight from
//      findMatchingContainer() when it is the MPEG4 container.
//   3. setup_find_stream_info_opts() + avformat_find_stream_info(); the
//      per-stream option dictionaries are freed for the stream count captured
//      before the probe (nb_streams), not the count after it.
//   4. av_dump_format() and a log line, then findMatchingContainer() followed
//      by adjustContainerIfNeeded() / adjustConfidenceIfNeeded().
//   5. avformat_close_input().
//
// url:        location string handed to avformat_open_input().
// confidence: in/out confidence value, updated by adjustConfidenceIfNeeded().
// fastMPEG4:  not referenced in any visible line; presumably gates step 2 so
//             MPEG4 input can skip the stream probe -- confirm.
//
// NOTE(review): many lines are missing from this excerpt, including the error
// checks on `status`/`err`/`ic`, the declarations of `err`, `i` and
// `codec_opts`, any guard that `container` is non-NULL before the adjust*
// calls, the cleanup label(s) and the return -- confirm against the full file.
// NOTE(review): step 2 calls findMatchingContainer() three times with the
// same argument.
1770 static const char *SniffFFMPEGCommon(const char *url, float *confidence, bool fastMPEG4)
1774 size_t nb_streams = 0;
1775 const char *container = NULL;
1776 AVFormatContext *ic = NULL;
1777 AVDictionary **opts = NULL;
1779 status_t status = initFFmpeg();
1781 ALOGE("could not init ffmpeg");
1785 ic = avformat_alloc_context();
1788 ALOGE("oom for alloc avformat context");
1792 err = avformat_open_input(&ic, url, NULL, NULL);
1794 if (ic->iformat != NULL && ic->iformat->name != NULL &&
1795 findMatchingContainer(ic->iformat->name) != NULL &&
1796 !strcasecmp(findMatchingContainer(ic->iformat->name),
1797 MEDIA_MIMETYPE_CONTAINER_MPEG4)) {
1799 container = findMatchingContainer(ic->iformat->name);
1805 ALOGE("%s: avformat_open_input failed, err:%s", url, av_err2str(err));
1809 opts = setup_find_stream_info_opts(ic, codec_opts);
1810 nb_streams = ic->nb_streams;
1811 err = avformat_find_stream_info(ic, opts);
1813 ALOGE("%s: could not find stream info, err:%s", url, av_err2str(err));
1816 for (i = 0; i < nb_streams; i++) {
1817 av_dict_free(&opts[i]);
1821 av_dump_format(ic, 0, url, 0);
1823 ALOGI("FFmpegExtrator, url: %s, format_name: %s, format_long_name: %s",
1824 url, ic->iformat->name, ic->iformat->long_name);
1826 container = findMatchingContainer(ic->iformat->name);
1829 adjustContainerIfNeeded(&container, ic);
1830 adjustConfidenceIfNeeded(container, ic, confidence);
1835 avformat_close_input(&ic);
// Sniffs `source` by encoding the DataSource pointer into an
// "android-source:%p" URL and passing it to SniffFFMPEGCommon(). The
// fastMPEG4 argument is set from the source's kIsCachingDataSource flag.
// The URL is recorded in `meta` under "extended-extractor-url".
// NOTE(review): the condition guarding the setString() call and the return
// statement are not visible in this excerpt; presumably the URL is stored
// only on success and `ret` is returned -- confirm.
1844 static const char *BetterSniffFFMPEG(const sp<DataSource> &source,
1845 float *confidence, sp<AMessage> meta)
1847 const char *ret = NULL;
1848 char url[PATH_MAX] = {0};
1850 ALOGI("android-source:%p", source.get());
1852 // pass the addr of smart pointer("source")
1853 snprintf(url, sizeof(url), "android-source:%p", source.get());
1855 ret = SniffFFMPEGCommon(url, confidence, (source->flags() & DataSource::kIsCachingDataSource));
1857 meta->setString("extended-extractor-url", url);
// Fallback sniffing path that also passes the source's URI. Builds an
// "android-source:%p|file:%s" URL from the DataSource pointer and
// source->getUri(), then calls SniffFFMPEGCommon() with fastMPEG4 = false.
// The URL is recorded in `meta` under "extended-extractor-url".
// snprintf() bounds the URL to sizeof(url) (PATH_MAX), so a long URI is
// truncated rather than overflowing the buffer.
// NOTE(review): the body of the !uri.string() branch, the condition guarding
// setString(), and the return statement are not visible in this excerpt --
// confirm.
1863 static const char *LegacySniffFFMPEG(const sp<DataSource> &source,
1864 float *confidence, sp<AMessage> meta)
1866 const char *ret = NULL;
1867 char url[PATH_MAX] = {0};
1869 String8 uri = source->getUri();
1870 if (!uri.string()) {
1874 ALOGI("source url:%s", uri.string());
1876 // pass the addr of smart pointer("source") + file name
1877 snprintf(url, sizeof(url), "android-source:%p|file:%s", source.get(), uri.string());
1879 ret = SniffFFMPEGCommon(url, confidence, false);
1881 meta->setString("extended-extractor-url", url);
1888 const sp<DataSource> &source, String8 *mimeType, float *confidence,
1889 sp<AMessage> *meta) {
// Sniffer entry point (installed as plugin->sniff in getExtractorPlugin()).
// Allocates a fresh AMessage into *meta, seeds *confidence with 0.08f (the
// "last resort" default), then tries BetterSniffFFMPEG() and falls back to
// LegacySniffFFMPEG(). On a detected container it writes the MIME into
// *mimeType and tags *meta with the "extended-extractor*" keys; the
// "extended-extractor-use" key is only set when *confidence ended above 0.08f.
// An MPEG4 container on a caching data source is handled separately (see the
// comment and log message below).
// The "sys.media.parser.ffmpeg" system property is read as a debug override
// that sets *confidence to 0.88f.
// NOTE(review): the first line of the signature, the branch conditions around
// the fallback, the property-value test and all return statements are missing
// from this excerpt -- confirm against the full file.
1890 ALOGV("SniffFFMPEG");
1892 *meta = new AMessage;
1893 *confidence = 0.08f; // be the last resort, by default
1895 const char *container = BetterSniffFFMPEG(source, confidence, *meta);
1897 ALOGW("sniff through BetterSniffFFMPEG failed, try LegacySniffFFMPEG");
1898 container = LegacySniffFFMPEG(source, confidence, *meta);
1900 ALOGI("sniff through LegacySniffFFMPEG success");
1903 ALOGI("sniff through BetterSniffFFMPEG success");
1906 if (container == NULL) {
1907 ALOGD("SniffFFMPEG failed to sniff this source");
1913 ALOGD("ffmpeg detected media content as '%s' with confidence %.2f",
1914 container, *confidence);
1916 /* use MPEG4Extractor(not extended extractor) for HTTP source only */
1917 if (!strcasecmp(container, MEDIA_MIMETYPE_CONTAINER_MPEG4)
1918 && (source->flags() & DataSource::kIsCachingDataSource)) {
1919 ALOGI("support container: %s, but it is caching data source, "
1920 "Don't use ffmpegextractor", container);
1926 mimeType->setTo(container);
1928 (*meta)->setString("extended-extractor", "extended-extractor");
1929 (*meta)->setString("extended-extractor-subtype", "ffmpegextractor");
1930 (*meta)->setString("extended-extractor-mime", container);
1933 char value[PROPERTY_VALUE_MAX];
1934 property_get("sys.media.parser.ffmpeg", value, "0");
1936 ALOGI("[debug] use ffmpeg parser");
1937 *confidence = 0.88f;
1940 if (*confidence > 0.08f) {
1941 (*meta)->setString("extended-extractor-use", "ffmpegextractor");
// Factory installed as plugin->create in getExtractorPlugin(). Constructs an
// FFmpegExtractor for `source` only when `meta` is non-null, carries the
// "extended-extractor" key, and `mime` matches (case-insensitively) one of
// the audio/container MIME constants listed below. Otherwise `ret` keeps its
// initial NULL value. The outcome is logged with ALOGD.
// NOTE(review): `¬use` in the findString() call looks like a mis-encoded
// `&notuse` (the "&not" sequence rendered as an HTML entity), and the
// declaration of `notuse` is not visible in this excerpt -- restore from the
// original file.
// NOTE(review): the return statement is not visible here; presumably `ret`
// is returned -- confirm.
1947 MediaExtractor *CreateFFmpegExtractor(const sp<DataSource> &source, const char *mime, const sp<AMessage> &meta) {
1948 MediaExtractor *ret = NULL;
1950 if (meta.get() && meta->findString("extended-extractor", ¬use) && (
1951 !strcasecmp(mime, MEDIA_MIMETYPE_AUDIO_MPEG) ||
1952 !strcasecmp(mime, MEDIA_MIMETYPE_AUDIO_AAC) ||
1953 !strcasecmp(mime, MEDIA_MIMETYPE_AUDIO_VORBIS) ||
1954 !strcasecmp(mime, MEDIA_MIMETYPE_AUDIO_FLAC) ||
1955 !strcasecmp(mime, MEDIA_MIMETYPE_AUDIO_AC3) ||
1956 !strcasecmp(mime, MEDIA_MIMETYPE_AUDIO_APE) ||
1957 !strcasecmp(mime, MEDIA_MIMETYPE_AUDIO_DTS) ||
1958 !strcasecmp(mime, MEDIA_MIMETYPE_AUDIO_MPEG_LAYER_II) ||
1959 !strcasecmp(mime, MEDIA_MIMETYPE_AUDIO_RA) ||
1960 !strcasecmp(mime, MEDIA_MIMETYPE_AUDIO_WMA) ||
1961 !strcasecmp(mime, MEDIA_MIMETYPE_AUDIO_FFMPEG) ||
1962 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_MPEG4) ||
1963 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_MOV) ||
1964 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_MATROSKA) ||
1965 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_TS) ||
1966 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_MPEG2PS) ||
1967 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_AVI) ||
1968 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_ASF) ||
1969 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_WEBM) ||
1970 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_WMV) ||
1971 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_MPG) ||
1972 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_FLV) ||
1973 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_DIVX) ||
1974 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_RM) ||
1975 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_WAV) ||
1976 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_FLAC) ||
1977 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_APE) ||
1978 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_DTS) ||
1979 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_MP2) ||
1980 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_RA) ||
1981 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_OGG) ||
1982 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_VC1) ||
1983 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_HEVC) ||
1984 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_WMA) ||
1985 !strcasecmp(mime, MEDIA_MIMETYPE_CONTAINER_FFMPEG))) {
1986 ret = new FFmpegExtractor(source, meta);
1989 ALOGD("%ssupported mime: %s", (ret ? "" : "un"), mime);
1993 } // namespace android
// C-linkage entry point that fills in the extractor plugin descriptor:
// registers android::SniffFFMPEG as the sniffer and
// android::CreateFFmpegExtractor as the factory.
// NOTE(review): presumably looked up by name by the framework's plugin
// loader; the caller is not visible in this file excerpt.
1995 extern "C" void getExtractorPlugin(android::MediaExtractor::Plugin *plugin)
1997 plugin->sniff = android::SniffFFMPEG;
1998 plugin->create = android::CreateFFmpegExtractor;