| // Copyright 2018 The Cobalt Authors. All Rights Reserved. |
| // |
| // Licensed under the Apache License, Version 2.0 (the "License"); |
| // you may not use this file except in compliance with the License. |
| // You may obtain a copy of the License at |
| // |
| // http://www.apache.org/licenses/LICENSE-2.0 |
| // |
| // Unless required by applicable law or agreed to in writing, software |
| // distributed under the License is distributed on an "AS IS" BASIS, |
| // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| // See the License for the specific language governing permissions and |
| // limitations under the License. |
| |
| // This file contains the explicit specialization of the AudioDecoderImpl class |
| // for the value 'FFMPEG'. |
| |
| #include "starboard/shared/ffmpeg/ffmpeg_audio_decoder_impl.h" |
| |
| #include <string> |
| |
| #include "starboard/audio_sink.h" |
| #include "starboard/common/log.h" |
| #include "starboard/common/string.h" |
| #include "starboard/media.h" |
| #include "starboard/memory.h" |
| #include "starboard/shared/starboard/media/media_util.h" |
| |
| namespace starboard { |
| namespace shared { |
| namespace ffmpeg { |
| |
| namespace { |
| |
| SbMediaAudioSampleType GetSupportedSampleType() { |
| if (SbAudioSinkIsAudioSampleTypeSupported(kSbMediaAudioSampleTypeFloat32)) { |
| return kSbMediaAudioSampleTypeFloat32; |
| } |
| return kSbMediaAudioSampleTypeInt16Deprecated; |
| } |
| |
| AVCodecID GetFfmpegCodecIdByMediaCodec( |
| starboard::media::AudioStreamInfo stream_info) { |
| SbMediaAudioCodec audio_codec = stream_info.codec; |
| |
| switch (audio_codec) { |
| case kSbMediaAudioCodecAac: |
| return AV_CODEC_ID_AAC; |
| case kSbMediaAudioCodecAc3: |
| #if SB_API_VERSION < 15 |
| return kSbHasAc3Audio ? AV_CODEC_ID_AC3 : AV_CODEC_ID_NONE; |
| #endif // SB_API_VERSION < 15 |
| return AV_CODEC_ID_AC3; |
| case kSbMediaAudioCodecEac3: |
| #if SB_API_VERSION < 15 |
| return kSbHasAc3Audio ? AV_CODEC_ID_EAC3 : AV_CODEC_ID_NONE; |
| #endif // SB_API_VERSION < 15 |
| return AV_CODEC_ID_EAC3; |
| case kSbMediaAudioCodecOpus: |
| return AV_CODEC_ID_OPUS; |
| case kSbMediaAudioCodecVorbis: |
| return AV_CODEC_ID_VORBIS; |
| case kSbMediaAudioCodecMp3: |
| return AV_CODEC_ID_MP3; |
| case kSbMediaAudioCodecPcm: |
| if (stream_info.bits_per_sample == 16) { |
| return AV_CODEC_ID_PCM_S16LE; |
| } else { |
| SB_LOG(ERROR) << "PCM is only supported for 16-bit audio (" |
| << stream_info.bits_per_sample |
| << " bits per sample was requested)"; |
| return AV_CODEC_ID_NONE; |
| } |
| case kSbMediaAudioCodecFlac: |
| if (stream_info.bits_per_sample == 16) { |
| return AV_CODEC_ID_FLAC; |
| } else { |
| SB_LOG(ERROR) << "FLAC is only supported for 16-bit audio (" |
| << stream_info.bits_per_sample |
| << " bits per sample was requested)"; |
| return AV_CODEC_ID_NONE; |
| } |
| default: |
| return AV_CODEC_ID_NONE; |
| } |
| } |
| |
| const bool g_registered = |
| FFMPEGDispatch::RegisterSpecialization(FFMPEG, |
| LIBAVCODEC_VERSION_MAJOR, |
| LIBAVFORMAT_VERSION_MAJOR, |
| LIBAVUTIL_VERSION_MAJOR); |
| |
| } // namespace |
| |
| AudioDecoderImpl<FFMPEG>::AudioDecoderImpl( |
| const AudioStreamInfo& audio_stream_info) |
| : codec_context_(NULL), |
| av_frame_(NULL), |
| stream_ended_(false), |
| audio_stream_info_(audio_stream_info) { |
| SB_DCHECK(g_registered) << "Decoder Specialization registration failed."; |
| SB_DCHECK(GetFfmpegCodecIdByMediaCodec(audio_stream_info_) != |
| AV_CODEC_ID_NONE) |
| << "Unsupported audio codec " << audio_stream_info_.codec; |
| ffmpeg_ = FFMPEGDispatch::GetInstance(); |
| SB_DCHECK(ffmpeg_); |
| if ((ffmpeg_->specialization_version()) == FFMPEG) { |
| InitializeCodec(); |
| } |
| } |
| |
| AudioDecoderImpl<FFMPEG>::~AudioDecoderImpl() { |
| TeardownCodec(); |
| } |
| |
| // static |
| AudioDecoder* AudioDecoderImpl<FFMPEG>::Create( |
| const AudioStreamInfo& audio_stream_info) { |
| return new AudioDecoderImpl<FFMPEG>(audio_stream_info); |
| } |
| |
| void AudioDecoderImpl<FFMPEG>::Initialize(const OutputCB& output_cb, |
| const ErrorCB& error_cb) { |
| SB_DCHECK(BelongsToCurrentThread()); |
| SB_DCHECK(output_cb); |
| SB_DCHECK(!output_cb_); |
| SB_DCHECK(error_cb); |
| SB_DCHECK(!error_cb_); |
| |
| output_cb_ = output_cb; |
| error_cb_ = error_cb; |
| } |
| |
| void AudioDecoderImpl<FFMPEG>::Decode(const InputBuffers& input_buffers, |
| const ConsumedCB& consumed_cb) { |
| SB_DCHECK(BelongsToCurrentThread()); |
| SB_DCHECK(input_buffers.size() == 1); |
| SB_DCHECK(input_buffers[0]); |
| SB_DCHECK(output_cb_); |
| SB_CHECK(codec_context_ != NULL); |
| |
| Schedule(consumed_cb); |
| |
| if (input_buffers.empty() || !input_buffers[0]) { |
| SB_LOG(ERROR) << "No input buffer to decode."; |
| return; |
| } |
| if (stream_ended_) { |
| SB_LOG(ERROR) << "Decode() is called after WriteEndOfStream() is called."; |
| return; |
| } |
| const auto& input_buffer = input_buffers[0]; |
| |
| AVPacket packet; |
| ffmpeg_->av_init_packet(&packet); |
| packet.data = const_cast<uint8_t*>(input_buffer->data()); |
| packet.size = input_buffer->size(); |
| |
| #if LIBAVUTIL_VERSION_INT < LIBAVUTIL_VERSION_52_8 |
| ffmpeg_->avcodec_get_frame_defaults(av_frame_); |
| #endif // LIBAVUTIL_VERSION_INT < LIBAVUTIL_VERSION_52_8 |
| |
| int result = 0; |
| if (ffmpeg_->avcodec_version() < kAVCodecHasUniformDecodeAPI) { |
| int frame_decoded = 0; |
| result = ffmpeg_->avcodec_decode_audio4(codec_context_, av_frame_, |
| &frame_decoded, &packet); |
| if (result != input_buffer->size()) { |
| // TODO: Consider fill it with silence. |
| SB_DLOG(WARNING) << "avcodec_decode_audio4() failed with result: " |
| << result |
| << " with input buffer size: " << input_buffer->size() |
| << " and frame decoded: " << frame_decoded; |
| error_cb_(kSbPlayerErrorDecode, |
| FormatString("avcodec_decode_audio4() failed with result %d.", |
| result)); |
| return; |
| } |
| |
| if (frame_decoded != 1) { |
| // TODO: Adjust timestamp accordingly when decoding result is shifted. |
| SB_DCHECK(frame_decoded == 0); |
| SB_DLOG(WARNING) << "avcodec_decode_audio4()/avcodec_receive_frame() " |
| "returns with 0 frames decoded"; |
| return; |
| } |
| |
| ProcessDecodedFrame(*input_buffer, *av_frame_); |
| return; |
| } |
| |
| // Newer decode API. |
| const int send_packet_result = |
| ffmpeg_->avcodec_send_packet(codec_context_, &packet); |
| if (send_packet_result != 0) { |
| const std::string error_message = FormatString( |
| "avcodec_send_packet() failed with result %d.", send_packet_result); |
| SB_DLOG(WARNING) << error_message; |
| error_cb_(kSbPlayerErrorDecode, error_message); |
| return; |
| } |
| |
| // Keep receiving frames until the decoder has processed the entire packet. |
| for (;;) { |
| result = ffmpeg_->avcodec_receive_frame(codec_context_, av_frame_); |
| if (result != 0) { |
| // We either hit an error or are done processing packet. |
| break; |
| } |
| ProcessDecodedFrame(*input_buffer, *av_frame_); |
| } |
| |
| // A return value of AVERROR(EAGAIN) signifies that the decoder needs |
| // another packet, so we are done processing the existing packet at that |
| // point. |
| if (result != AVERROR(EAGAIN)) { |
| SB_DLOG(WARNING) << "avcodec_receive_frame() failed with result: " |
| << result; |
| error_cb_( |
| kSbPlayerErrorDecode, |
| FormatString("avcodec_receive_frame() failed with result %d.", result)); |
| } |
| } |
| |
| void AudioDecoderImpl<FFMPEG>::ProcessDecodedFrame( |
| const InputBuffer& input_buffer, |
| const AVFrame& av_frame) { |
| int decoded_audio_size = ffmpeg_->av_samples_get_buffer_size( |
| NULL, codec_context_->channels, av_frame.nb_samples, |
| codec_context_->sample_fmt, 1); |
| audio_stream_info_.samples_per_second = codec_context_->sample_rate; |
| |
| if (decoded_audio_size <= 0) { |
| // TODO: Consider fill it with silence. |
| SB_LOG(ERROR) << "Decoded audio frame is empty."; |
| return; |
| } |
| |
| scoped_refptr<DecodedAudio> decoded_audio = new DecodedAudio( |
| codec_context_->channels, GetSampleType(), GetStorageType(), |
| input_buffer.timestamp(), |
| codec_context_->channels * av_frame.nb_samples * |
| starboard::media::GetBytesPerSample(GetSampleType())); |
| if (GetStorageType() == kSbMediaAudioFrameStorageTypeInterleaved) { |
| memcpy(decoded_audio->data(), *av_frame.extended_data, |
| decoded_audio->size_in_bytes()); |
| } else { |
| SB_DCHECK(GetStorageType() == kSbMediaAudioFrameStorageTypePlanar); |
| const int per_channel_size_in_bytes = |
| decoded_audio->size_in_bytes() / decoded_audio->channels(); |
| for (int i = 0; i < decoded_audio->channels(); ++i) { |
| memcpy(decoded_audio->data() + per_channel_size_in_bytes * i, |
| av_frame.extended_data[i], per_channel_size_in_bytes); |
| } |
| decoded_audio = decoded_audio->SwitchFormatTo( |
| GetSampleType(), kSbMediaAudioFrameStorageTypeInterleaved); |
| } |
| decoded_audio->AdjustForDiscardedDurations( |
| audio_stream_info_.samples_per_second, |
| input_buffer.audio_sample_info().discarded_duration_from_front, |
| input_buffer.audio_sample_info().discarded_duration_from_back); |
| decoded_audios_.push(decoded_audio); |
| Schedule(output_cb_); |
| } |
| |
| void AudioDecoderImpl<FFMPEG>::WriteEndOfStream() { |
| SB_DCHECK(BelongsToCurrentThread()); |
| SB_DCHECK(output_cb_); |
| |
| // AAC has no dependent frames so we needn't flush the decoder. Set the flag |
| // to ensure that Decode() is not called when the stream is ended. |
| stream_ended_ = true; |
| // Put EOS into the queue. |
| decoded_audios_.push(new DecodedAudio); |
| |
| Schedule(output_cb_); |
| } |
| |
| scoped_refptr<AudioDecoderImpl<FFMPEG>::DecodedAudio> |
| AudioDecoderImpl<FFMPEG>::Read(int* samples_per_second) { |
| SB_DCHECK(BelongsToCurrentThread()); |
| SB_DCHECK(output_cb_); |
| SB_DCHECK(!decoded_audios_.empty()); |
| |
| scoped_refptr<DecodedAudio> result; |
| if (!decoded_audios_.empty()) { |
| result = decoded_audios_.front(); |
| decoded_audios_.pop(); |
| } |
| *samples_per_second = audio_stream_info_.samples_per_second; |
| return result; |
| } |
| |
| void AudioDecoderImpl<FFMPEG>::Reset() { |
| SB_DCHECK(BelongsToCurrentThread()); |
| |
| TeardownCodec(); |
| if ((ffmpeg_->specialization_version()) == FFMPEG) { |
| InitializeCodec(); |
| } |
| |
| stream_ended_ = false; |
| while (!decoded_audios_.empty()) { |
| decoded_audios_.pop(); |
| } |
| |
| CancelPendingJobs(); |
| } |
| |
| bool AudioDecoderImpl<FFMPEG>::is_valid() const { |
| return (ffmpeg_ != NULL) && ffmpeg_->is_valid() && (codec_context_ != NULL); |
| } |
| |
| SbMediaAudioSampleType AudioDecoderImpl<FFMPEG>::GetSampleType() const { |
| SB_DCHECK(BelongsToCurrentThread()); |
| |
| if (codec_context_->sample_fmt == AV_SAMPLE_FMT_S16 || |
| codec_context_->sample_fmt == AV_SAMPLE_FMT_S16P) { |
| return kSbMediaAudioSampleTypeInt16Deprecated; |
| } else if (codec_context_->sample_fmt == AV_SAMPLE_FMT_FLT || |
| codec_context_->sample_fmt == AV_SAMPLE_FMT_FLTP) { |
| return kSbMediaAudioSampleTypeFloat32; |
| } |
| |
| SB_NOTREACHED(); |
| |
| return kSbMediaAudioSampleTypeFloat32; |
| } |
| |
| SbMediaAudioFrameStorageType AudioDecoderImpl<FFMPEG>::GetStorageType() const { |
| SB_DCHECK(BelongsToCurrentThread()); |
| |
| if (codec_context_->sample_fmt == AV_SAMPLE_FMT_S16 || |
| codec_context_->sample_fmt == AV_SAMPLE_FMT_FLT) { |
| return kSbMediaAudioFrameStorageTypeInterleaved; |
| } |
| if (codec_context_->sample_fmt == AV_SAMPLE_FMT_S16P || |
| codec_context_->sample_fmt == AV_SAMPLE_FMT_FLTP) { |
| return kSbMediaAudioFrameStorageTypePlanar; |
| } |
| |
| SB_NOTREACHED(); |
| return kSbMediaAudioFrameStorageTypeInterleaved; |
| } |
| |
| void AudioDecoderImpl<FFMPEG>::InitializeCodec() { |
| codec_context_ = ffmpeg_->avcodec_alloc_context3(NULL); |
| |
| if (codec_context_ == NULL) { |
| SB_LOG(ERROR) << "Unable to allocate ffmpeg codec context"; |
| return; |
| } |
| |
| codec_context_->codec_type = AVMEDIA_TYPE_AUDIO; |
| codec_context_->codec_id = GetFfmpegCodecIdByMediaCodec(audio_stream_info_); |
| // Request_sample_fmt is set by us, but sample_fmt is set by the decoder. |
| if (GetSupportedSampleType() == kSbMediaAudioSampleTypeInt16Deprecated |
| // If we request FLT for 16-bit FLAC, FFmpeg will pick S32 as the closest |
| // option. Since the rest of this pipeline doesn't support S32, we should |
| // use S16 as the desired format. |
| || audio_stream_info_.codec == kSbMediaAudioCodecFlac) { |
| codec_context_->request_sample_fmt = AV_SAMPLE_FMT_S16; |
| } else { |
| codec_context_->request_sample_fmt = AV_SAMPLE_FMT_FLT; |
| } |
| |
| codec_context_->channels = audio_stream_info_.number_of_channels; |
| codec_context_->sample_rate = audio_stream_info_.samples_per_second; |
| codec_context_->extradata = NULL; |
| codec_context_->extradata_size = 0; |
| |
| if ((codec_context_->codec_id == AV_CODEC_ID_OPUS || |
| codec_context_->codec_id == AV_CODEC_ID_VORBIS) && |
| !audio_stream_info_.audio_specific_config.empty()) { |
| // AV_INPUT_BUFFER_PADDING_SIZE is not defined in ancient avcodec.h. Use a |
| // large enough padding here explicitly. |
| const int kAvInputBufferPaddingSize = 256; |
| codec_context_->extradata_size = |
| audio_stream_info_.audio_specific_config.size(); |
| codec_context_->extradata = static_cast<uint8_t*>(ffmpeg_->av_malloc( |
| codec_context_->extradata_size + kAvInputBufferPaddingSize)); |
| SB_DCHECK(codec_context_->extradata); |
| memcpy(codec_context_->extradata, |
| audio_stream_info_.audio_specific_config.data(), |
| codec_context_->extradata_size); |
| memset(codec_context_->extradata + codec_context_->extradata_size, 0, |
| kAvInputBufferPaddingSize); |
| } |
| |
| AVCodec* codec = ffmpeg_->avcodec_find_decoder(codec_context_->codec_id); |
| |
| if (codec == NULL) { |
| SB_LOG(ERROR) << "Unable to allocate ffmpeg codec context"; |
| TeardownCodec(); |
| return; |
| } |
| |
| int rv = ffmpeg_->OpenCodec(codec_context_, codec); |
| if (rv < 0) { |
| SB_LOG(ERROR) << "Unable to open codec"; |
| TeardownCodec(); |
| return; |
| } |
| |
| if (ffmpeg_->avcodec_version() > kAVCodecSupportsAvFrameAlloc) { |
| av_frame_ = ffmpeg_->av_frame_alloc(); |
| } else { |
| av_frame_ = ffmpeg_->avcodec_alloc_frame(); |
| } |
| if (av_frame_ == NULL) { |
| SB_LOG(ERROR) << "Unable to allocate audio frame"; |
| TeardownCodec(); |
| } |
| } |
| |
| void AudioDecoderImpl<FFMPEG>::TeardownCodec() { |
| if (codec_context_) { |
| ffmpeg_->CloseCodec(codec_context_); |
| ffmpeg_->FreeContext(&codec_context_); |
| } |
| ffmpeg_->FreeFrame(&av_frame_); |
| } |
| |
| } // namespace ffmpeg |
| } // namespace shared |
| } // namespace starboard |