third_party/chromium/media/formats/mp4/mp4_stream_parser_unittest.cc - cobalt - Git at Google

 // Copyright 2014 The Chromium Authors. All rights reserved.
 // Use of this source code is governed by a BSD-style license that can be
 // found in the LICENSE file.

 #include "media/formats/mp4/mp4_stream_parser.h"

 #include <stddef.h>
 #include <stdint.h>

 #include <algorithm>
 #include <memory>
 #include <string>
 #include <tuple>

 #include "base/bind.h"
 #include "base/callback_helpers.h"
 #include "base/logging.h"
 #include "base/memory/ref_counted.h"
 #include "base/test/metrics/histogram_tester.h"
 #include "base/test/mock_callback.h"
 #include "base/time/time.h"
 #include "media/base/audio_decoder_config.h"
 #include "media/base/decoder_buffer.h"
 #include "media/base/media_switches.h"
 #include "media/base/media_track.h"
 #include "media/base/media_tracks.h"
 #include "media/base/mock_media_log.h"
 #include "media/base/stream_parser.h"
 #include "media/base/stream_parser_buffer.h"
 #include "media/base/test_data_util.h"
 #include "media/base/test_helpers.h"
 #include "media/base/text_track_config.h"
 #include "media/base/video_decoder_config.h"
 #include "media/formats/mp4/es_descriptor.h"
 #include "media/formats/mp4/fourccs.h"
 #include "media/media_buildflags.h"
 #include "testing/gmock/include/gmock/gmock.h"
 #include "testing/gtest/include/gtest/gtest-param-test.h"
 #include "testing/gtest/include/gtest/gtest.h"

 using ::testing::InSequence;
 using ::testing::StrictMock;

 namespace media {
 namespace mp4 {
 namespace {

 // Useful in single-track test media cases that need to verify
 // keyframe/non-keyframe sequence in output of parse.
 enum class Keyframeness {
   kKeyframe = 0,
   kNonKeyframe,
 };

 // Tells gtest how to print our Keyframeness enum values.
 std::ostream& operator<<(std::ostream& os, Keyframeness k) {
   return os << (k == Keyframeness::kKeyframe ? "kKeyframe" : "kNonKeyframe");
 }

 }  // namespace

 // Matchers for verifying common media log entry strings.
 MATCHER(SampleEncryptionInfoUnavailableLog, "") {
   return CONTAINS_STRING(arg, "Sample encryption info is not available.");
 }

 MATCHER_P(ErrorLog, error_string, "") {
   return CONTAINS_STRING(arg, error_string) && CONTAINS_STRING(arg, "error");
 }

 MATCHER_P(DebugLog, debug_string, "") {
   return CONTAINS_STRING(arg, debug_string) && CONTAINS_STRING(arg, "debug");
 }

 class MP4StreamParserTest : public testing::Test {
  public:
   MP4StreamParserTest()
       : configs_received_(false),
         lower_bound_(
             DecodeTimestamp::FromPresentationTime(base::TimeDelta::Max())),
         verifying_keyframeness_sequence_(false) {
     std::set<int> audio_object_types;
     audio_object_types.insert(kISO_14496_3);
     parser_.reset(new MP4StreamParser(audio_object_types, false, false));
   }

  protected:
   StrictMock<MockMediaLog> media_log_;
   std::unique_ptr<MP4StreamParser> parser_;
   bool configs_received_;
   std::unique_ptr<MediaTracks> media_tracks_;
   AudioDecoderConfig audio_decoder_config_;
   VideoDecoderConfig video_decoder_config_;
   DecodeTimestamp lower_bound_;
   StreamParser::TrackId audio_track_id_;
   StreamParser::TrackId video_track_id_;
   bool verifying_keyframeness_sequence_;
   StrictMock<base::MockRepeatingCallback<void(Keyframeness)>> keyframeness_cb_;

   bool AppendData(const uint8_t* data, size_t length) {
     return parser_->Parse(data, length);
   }

   bool AppendDataInPieces(const uint8_t* data,
                           size_t length,
                           size_t piece_size) {
     const uint8_t* start = data;
     const uint8_t* end = data + length;
     while (start < end) {
       size_t append_size = std::min(piece_size,
                                     static_cast<size_t>(end - start));
       if (!AppendData(start, append_size))
         return false;
       start += append_size;
     }
     return true;
   }

   void InitF(const StreamParser::InitParameters& expected_params,
              const StreamParser::InitParameters& params) {
     DVLOG(1) << "InitF: dur=" << params.duration.InMicroseconds();
     EXPECT_EQ(expected_params.duration, params.duration);
     EXPECT_EQ(expected_params.timeline_offset, params.timeline_offset);
     EXPECT_EQ(expected_params.liveness, params.liveness);
     EXPECT_EQ(expected_params.detected_audio_track_count,
               params.detected_audio_track_count);
     EXPECT_EQ(expected_params.detected_video_track_count,
               params.detected_video_track_count);
     EXPECT_EQ(expected_params.detected_text_track_count,
               params.detected_text_track_count);
   }

   bool NewConfigF(std::unique_ptr<MediaTracks> tracks,
                   const StreamParser::TextTrackConfigMap& tc) {
     configs_received_ = true;
     CHECK(tracks.get());
     DVLOG(1) << "NewConfigF: got " << tracks->tracks().size() << " tracks";
     for (const auto& track : tracks->tracks()) {
       const auto& track_id = track->bytestream_track_id();
       if (track->type() == MediaTrack::Audio) {
         audio_track_id_ = track_id;
         audio_decoder_config_ = tracks->getAudioConfig(track_id);
         DVLOG(1) << "track_id=" << track_id << " audio config="
                  << (audio_decoder_config_.IsValidConfig()
                          ? audio_decoder_config_.AsHumanReadableString()
                          : "INVALID");
       } else if (track->type() == MediaTrack::Video) {
         video_track_id_ = track_id;
         video_decoder_config_ = tracks->getVideoConfig(track_id);
         DVLOG(1) << "track_id=" << track_id << " video config="
                  << (video_decoder_config_.IsValidConfig()
                          ? video_decoder_config_.AsHumanReadableString()
                          : "INVALID");
       }
     }
     media_tracks_ = std::move(tracks);
     return true;
   }

   bool NewBuffersF(const StreamParser::BufferQueueMap& buffer_queue_map) {
     DecodeTimestamp lowest_end_dts = kNoDecodeTimestamp();
     for (const auto& it : buffer_queue_map) {
       DVLOG(3) << "Buffers for track_id=" << it.first;
       DCHECK(!it.second.empty());

       if (lowest_end_dts == kNoDecodeTimestamp() ||
           lowest_end_dts > it.second.back()->GetDecodeTimestamp())
         lowest_end_dts = it.second.back()->GetDecodeTimestamp();

       for (const auto& buf : it.second) {
         DVLOG(3) << "  track_id=" << buf->track_id()
                  << ", size=" << buf->data_size()
                  << ", pts=" << buf->timestamp().InSecondsF()
                  << ", dts=" << buf->GetDecodeTimestamp().InSecondsF()
                  << ", dur=" << buf->duration().InSecondsF();
         // Ensure that track ids are properly assigned on all emitted buffers.
         EXPECT_EQ(it.first, buf->track_id());

         // Let single-track tests verify the sequence of keyframes/nonkeyframes.
         if (verifying_keyframeness_sequence_) {
           keyframeness_cb_.Run(buf->is_key_frame()
                                    ? Keyframeness::kKeyframe
                                    : Keyframeness::kNonKeyframe);
         }
       }
     }

     EXPECT_NE(lowest_end_dts, kNoDecodeTimestamp());

     if (lower_bound_ != kNoDecodeTimestamp() && lowest_end_dts < lower_bound_) {
       return false;
     }

     lower_bound_ = lowest_end_dts;
     return true;
   }

   void KeyNeededF(EmeInitDataType type, const std::vector<uint8_t>& init_data) {
     DVLOG(1) << "KeyNeededF: " << init_data.size();
     EXPECT_EQ(EmeInitDataType::CENC, type);
     EXPECT_FALSE(init_data.empty());
   }

   void NewSegmentF() {
     DVLOG(1) << "NewSegmentF";
     lower_bound_ = kNoDecodeTimestamp();
   }

   void EndOfSegmentF() {
     DVLOG(1) << "EndOfSegmentF()";
     lower_bound_ =
         DecodeTimestamp::FromPresentationTime(base::TimeDelta::Max());
   }

   void InitializeParserWithInitParametersExpectations(
       StreamParser::InitParameters params) {
     parser_->Init(base::BindOnce(&MP4StreamParserTest::InitF,
                                  base::Unretained(this), params),
                   base::BindRepeating(&MP4StreamParserTest::NewConfigF,
                                       base::Unretained(this)),
                   base::BindRepeating(&MP4StreamParserTest::NewBuffersF,
                                       base::Unretained(this)),
                   true,
                   base::BindRepeating(&MP4StreamParserTest::KeyNeededF,
                                       base::Unretained(this)),
                   base::BindRepeating(&MP4StreamParserTest::NewSegmentF,
                                       base::Unretained(this)),
                   base::BindRepeating(&MP4StreamParserTest::EndOfSegmentF,
                                       base::Unretained(this)),
                   &media_log_);
   }

   StreamParser::InitParameters GetDefaultInitParametersExpectations() {
     // Most unencrypted test mp4 files have zero duration and are treated as
     // live streams.
     StreamParser::InitParameters params(kInfiniteDuration);
     params.liveness = DemuxerStream::LIVENESS_LIVE;
     params.detected_audio_track_count = 1;
     params.detected_video_track_count = 1;
     params.detected_text_track_count = 0;
     return params;
   }

   void InitializeParserAndExpectLiveness(DemuxerStream::Liveness liveness) {
     auto params = GetDefaultInitParametersExpectations();
     params.liveness = liveness;
     InitializeParserWithInitParametersExpectations(params);
   }

   void InitializeParser() {
     InitializeParserWithInitParametersExpectations(
         GetDefaultInitParametersExpectations());
   }

   bool ParseMP4File(const std::string& filename, int append_bytes) {
     scoped_refptr<DecoderBuffer> buffer = ReadTestDataFile(filename);
     EXPECT_TRUE(AppendDataInPieces(buffer->data(),
                                    buffer->data_size(),
                                    append_bytes));
     return true;
   }
 };

 TEST_F(MP4StreamParserTest, UnalignedAppend) {
   // Test small, non-segment-aligned appends (small enough to exercise
   // incremental append system)
   InitializeParser();
   ParseMP4File("bear-1280x720-av_frag.mp4", 512);
 }

 constexpr char kShakaPackagerUMA[] = "Media.MSE.DetectedShakaPackagerInMp4";

 TEST_F(MP4StreamParserTest, DidNotUseShakaPackager) {
   // Encrypted files have non-zero duration and are treated as recorded streams.
   auto params = GetDefaultInitParametersExpectations();
   params.duration = base::Microseconds(2736066);
   params.liveness = DemuxerStream::LIVENESS_RECORDED;
   params.detected_audio_track_count = 0;
   InitializeParserWithInitParametersExpectations(params);

   base::HistogramTester tester;

   // Test file has ID32 box, but no shaka player metadata.
   ParseMP4File("bear-640x360-v_frag-cenc-senc-no-saiz-saio.mp4", 512);
   tester.ExpectUniqueSample(kShakaPackagerUMA, 0, 1);
 }

 TEST_F(MP4StreamParserTest, UsedShakaPackager) {
   auto params = GetDefaultInitParametersExpectations();
   params.duration = base::Microseconds(2736000);
   params.liveness = DemuxerStream::LIVENESS_RECORDED;
   params.detected_audio_track_count = 0;
   InitializeParserWithInitParametersExpectations(params);

   base::HistogramTester tester;
   ParseMP4File("bear-320x240-v_frag-vp9.mp4", 512);
   tester.ExpectUniqueSample(kShakaPackagerUMA, 1, 1);
 }

 TEST_F(MP4StreamParserTest, BytewiseAppend) {
   // Ensure no incremental errors occur when parsing
   InitializeParser();
   ParseMP4File("bear-1280x720-av_frag.mp4", 1);
 }

 TEST_F(MP4StreamParserTest, MultiFragmentAppend) {
   // Large size ensures multiple fragments are appended in one call (size is
   // larger than this particular test file)
   InitializeParser();
   ParseMP4File("bear-1280x720-av_frag.mp4", 768432);
 }

 TEST_F(MP4StreamParserTest, Flush) {
   // Flush while reading sample data, then start a new stream.
   InitializeParser();

   scoped_refptr<DecoderBuffer> buffer =
       ReadTestDataFile("bear-1280x720-av_frag.mp4");
   EXPECT_TRUE(AppendDataInPieces(buffer->data(), 65536, 512));
   parser_->Flush();
   EXPECT_TRUE(AppendDataInPieces(buffer->data(),
                                  buffer->data_size(),
                                  512));
 }

 TEST_F(MP4StreamParserTest, Reinitialization) {
   InitializeParser();

   scoped_refptr<DecoderBuffer> buffer =
       ReadTestDataFile("bear-1280x720-av_frag.mp4");
   EXPECT_TRUE(AppendDataInPieces(buffer->data(),
                                  buffer->data_size(),
                                  512));
   EXPECT_TRUE(AppendDataInPieces(buffer->data(),
                                  buffer->data_size(),
                                  512));
 }

 TEST_F(MP4StreamParserTest, UnknownDuration_V0_AllBitsSet) {
   InitializeParser();
   // 32 bit duration field in mvhd box, all bits set.
   ParseMP4File(
       "bear-1280x720-av_frag-initsegment-mvhd_version_0-mvhd_duration_bits_all_"
       "set.mp4",
       512);
 }

 TEST_F(MP4StreamParserTest, AVC_KeyAndNonKeyframeness_Match_Container) {
   // Both AVC video frames' keyframe-ness metadata matches the MP4:
   // Frame 0: AVC IDR, trun.first_sample_flags: sync sample that doesn't
   //          depend on others.
   // Frame 1: AVC Non-IDR, tfhd.default_sample_flags: not sync sample, depends
   //          on others.
   // This is the base case; see also the "Mismatches" cases, below.
   InSequence s;  // The EXPECT* sequence matters for this test.
   auto params = GetDefaultInitParametersExpectations();
   params.detected_audio_track_count = 0;
   InitializeParserWithInitParametersExpectations(params);
   verifying_keyframeness_sequence_ = true;
   EXPECT_CALL(keyframeness_cb_, Run(Keyframeness::kKeyframe));
   EXPECT_CALL(keyframeness_cb_, Run(Keyframeness::kNonKeyframe));
   ParseMP4File("bear-640x360-v-2frames_frag.mp4", 512);
 }

 TEST_F(MP4StreamParserTest, AVC_Keyframeness_Mismatches_Container) {
   // The first AVC video frame's keyframe-ness metadata mismatches the MP4:
   // Frame 0: AVC IDR, trun.first_sample_flags: NOT sync sample, DEPENDS on
   //          others.
   // Frame 1: AVC Non-IDR, tfhd.default_sample_flags: not sync sample, depends
   //          on others.
   InSequence s;  // The EXPECT* sequence matters for this test.
   auto params = GetDefaultInitParametersExpectations();
   params.detected_audio_track_count = 0;
   InitializeParserWithInitParametersExpectations(params);
   verifying_keyframeness_sequence_ = true;
   EXPECT_MEDIA_LOG(DebugLog(
       "ISO-BMFF container metadata for video frame indicates that the frame is "
       "not a keyframe, but the video frame contents indicate the opposite."));
   EXPECT_CALL(keyframeness_cb_, Run(Keyframeness::kKeyframe));
   EXPECT_CALL(keyframeness_cb_, Run(Keyframeness::kNonKeyframe));
   ParseMP4File("bear-640x360-v-2frames-keyframe-is-non-sync-sample_frag.mp4",
                512);
 }

 TEST_F(MP4StreamParserTest, AVC_NonKeyframeness_Mismatches_Container) {
   // The second AVC video frame's keyframe-ness metadata mismatches the MP4:
   // Frame 0: AVC IDR, trun.first_sample_flags: sync sample that doesn't
   //          depend on others.
   // Frame 1: AVC Non-IDR, tfhd.default_sample_flags: SYNC sample, DOES NOT
   //          depend on others.
   InSequence s;  // The EXPECT* sequence matters for this test.
   auto params = GetDefaultInitParametersExpectations();
   params.detected_audio_track_count = 0;
   InitializeParserWithInitParametersExpectations(params);
   verifying_keyframeness_sequence_ = true;
   EXPECT_CALL(keyframeness_cb_, Run(Keyframeness::kKeyframe));
   EXPECT_MEDIA_LOG(DebugLog(
       "ISO-BMFF container metadata for video frame indicates that the frame is "
       "a keyframe, but the video frame contents indicate the opposite."));
   EXPECT_CALL(keyframeness_cb_, Run(Keyframeness::kNonKeyframe));
   ParseMP4File("bear-640x360-v-2frames-nonkeyframe-is-sync-sample_frag.mp4",
                512);
 }

 TEST_F(MP4StreamParserTest, MPEG2_AAC_LC) {
   InSequence s;
   std::set<int> audio_object_types;
   audio_object_types.insert(kISO_13818_7_AAC_LC);
   parser_.reset(new MP4StreamParser(audio_object_types, false, false));
   auto params = GetDefaultInitParametersExpectations();
   params.detected_video_track_count = 0;
   InitializeParserWithInitParametersExpectations(params);
   ParseMP4File("bear-mpeg2-aac-only_frag.mp4", 512);
   EXPECT_EQ(audio_decoder_config_.profile(), AudioCodecProfile::kUnknown);
 }

 TEST_F(MP4StreamParserTest, MPEG4_XHE_AAC) {
   InSequence s;  // The keyframeness sequence matters for this test.
   std::set<int> audio_object_types;
   audio_object_types.insert(kISO_14496_3);
   parser_.reset(new MP4StreamParser(audio_object_types, false, false));
   auto params = GetDefaultInitParametersExpectations();
   params.detected_video_track_count = 0;

   InitializeParserWithInitParametersExpectations(params);

   // This test file contains a single audio keyframe followed by 23
   // non-keyframes.
   verifying_keyframeness_sequence_ = true;
   EXPECT_CALL(keyframeness_cb_, Run(Keyframeness::kKeyframe));
   EXPECT_CALL(keyframeness_cb_, Run(Keyframeness::kNonKeyframe)).Times(23);

   ParseMP4File("noise-xhe-aac.mp4", 512);
   EXPECT_EQ(audio_decoder_config_.profile(), AudioCodecProfile::kXHE_AAC);
 }

 // Test that a moov box is not always required after Flush() is called.
 TEST_F(MP4StreamParserTest, NoMoovAfterFlush) {
   InitializeParser();

   scoped_refptr<DecoderBuffer> buffer =
       ReadTestDataFile("bear-1280x720-av_frag.mp4");
   EXPECT_TRUE(AppendDataInPieces(buffer->data(),
                                  buffer->data_size(),
                                  512));
   parser_->Flush();

   const int kFirstMoofOffset = 1307;
   EXPECT_TRUE(AppendDataInPieces(buffer->data() + kFirstMoofOffset,
                                  buffer->data_size() - kFirstMoofOffset,
                                  512));
 }

 // Test an invalid file where there are encrypted samples, but
 // SampleEncryptionBox (senc) and SampleAuxiliaryInformation{Sizes|Offsets}Box
 // (saiz|saio) are missing.
 // The parser should fail instead of crash. See http://crbug.com/361347
 TEST_F(MP4StreamParserTest, MissingSampleEncryptionInfo) {
   InSequence s;

   // Encrypted test mp4 files have non-zero duration and are treated as
   // recorded streams.
   auto params = GetDefaultInitParametersExpectations();
   params.duration = base::Microseconds(23219);
   params.liveness = DemuxerStream::LIVENESS_RECORDED;
   params.detected_video_track_count = 0;
   InitializeParserWithInitParametersExpectations(params);

   scoped_refptr<DecoderBuffer> buffer =
       ReadTestDataFile("bear-1280x720-a_frag-cenc_missing-saiz-saio.mp4");
   EXPECT_MEDIA_LOG(SampleEncryptionInfoUnavailableLog());
   EXPECT_FALSE(AppendDataInPieces(buffer->data(), buffer->data_size(), 512));
 }

 // Test a file where all video samples start with an Access Unit
 // Delimiter (AUD) NALU.
 TEST_F(MP4StreamParserTest, VideoSamplesStartWithAUDs) {
   auto params = GetDefaultInitParametersExpectations();
   params.detected_audio_track_count = 0;
   InitializeParserWithInitParametersExpectations(params);
   ParseMP4File("bear-1280x720-av_with-aud-nalus_frag.mp4", 512);
 }

 TEST_F(MP4StreamParserTest, HEVC_in_MP4_container) {
 #if BUILDFLAG(ENABLE_PLATFORM_HEVC)
   bool expect_success = true;
 #else
   bool expect_success = false;
   EXPECT_MEDIA_LOG(ErrorLog("Unsupported VisualSampleEntry type hev1"));
 #endif
   auto params = GetDefaultInitParametersExpectations();
   params.duration = base::Microseconds(1002000);
   params.liveness = DemuxerStream::LIVENESS_RECORDED;
   params.detected_audio_track_count = 0;
   InitializeParserWithInitParametersExpectations(params);

   scoped_refptr<DecoderBuffer> buffer = ReadTestDataFile("bear-hevc-frag.mp4");
   EXPECT_EQ(expect_success,
             AppendDataInPieces(buffer->data(), buffer->data_size(), 512));
 #if BUILDFLAG(ENABLE_PLATFORM_HEVC)
   EXPECT_EQ(VideoCodec::kHEVC, video_decoder_config_.codec());
   EXPECT_EQ(HEVCPROFILE_MAIN, video_decoder_config_.profile());
 #endif
 }

 #if BUILDFLAG(ENABLE_PLATFORM_HEVC)
 TEST_F(MP4StreamParserTest, HEVC_KeyAndNonKeyframeness_Match_Container) {
   // Both HEVC video frames' keyframe-ness metadata matches the MP4:
   // Frame 0: HEVC IDR, trun.first_sample_flags: sync sample that doesn't
   //          depend on others.
   // Frame 1: HEVC Non-IDR, tfhd.default_sample_flags: not sync sample, depends
   //          on others.
   // This is the base case; see also the "Mismatches" cases, below.
   InSequence s;  // The EXPECT* sequence matters for this test.
   auto params = GetDefaultInitParametersExpectations();
   params.detected_audio_track_count = 0;
   InitializeParserWithInitParametersExpectations(params);
   verifying_keyframeness_sequence_ = true;
   EXPECT_CALL(keyframeness_cb_, Run(Keyframeness::kKeyframe));
   EXPECT_CALL(keyframeness_cb_, Run(Keyframeness::kNonKeyframe));
   ParseMP4File("bear-320x240-v-2frames_frag-hevc.mp4", 256);
 }

 TEST_F(MP4StreamParserTest, HEVC_Keyframeness_Mismatches_Container) {
   // The first HEVC video frame's keyframe-ness metadata mismatches the MP4:
   // Frame 0: HEVC IDR, trun.first_sample_flags: NOT sync sample, DEPENDS on
   //          others.
   // Frame 1: HEVC Non-IDR, tfhd.default_sample_flags: not sync sample, depends
   //          on others.
   InSequence s;  // The EXPECT* sequence matters for this test.
   auto params = GetDefaultInitParametersExpectations();
   params.detected_audio_track_count = 0;
   InitializeParserWithInitParametersExpectations(params);
   verifying_keyframeness_sequence_ = true;
   EXPECT_MEDIA_LOG(DebugLog(
       "ISO-BMFF container metadata for video frame indicates that the frame is "
       "not a keyframe, but the video frame contents indicate the opposite."));
   EXPECT_CALL(keyframeness_cb_, Run(Keyframeness::kKeyframe));
   EXPECT_CALL(keyframeness_cb_, Run(Keyframeness::kNonKeyframe));
   ParseMP4File(
       "bear-320x240-v-2frames-keyframe-is-non-sync-sample_frag-hevc.mp4", 256);
 }

 TEST_F(MP4StreamParserTest, HEVC_NonKeyframeness_Mismatches_Container) {
   // The second HEVC video frame's keyframe-ness metadata mismatches the MP4:
   // Frame 0: HEVC IDR, trun.first_sample_flags: sync sample that doesn't
   //          depend on others.
   // Frame 1: HEVC Non-IDR, tfhd.default_sample_flags: SYNC sample, DOES NOT
   //          depend on others.
   InSequence s;  // The EXPECT* sequence matters for this test.
   auto params = GetDefaultInitParametersExpectations();
   params.detected_audio_track_count = 0;
   InitializeParserWithInitParametersExpectations(params);
   verifying_keyframeness_sequence_ = true;
   EXPECT_CALL(keyframeness_cb_, Run(Keyframeness::kKeyframe));
   EXPECT_MEDIA_LOG(DebugLog(
       "ISO-BMFF container metadata for video frame indicates that the frame is "
       "a keyframe, but the video frame contents indicate the opposite."));
   EXPECT_CALL(keyframeness_cb_, Run(Keyframeness::kNonKeyframe));
   ParseMP4File(
       "bear-320x240-v-2frames-nonkeyframe-is-sync-sample_frag-hevc.mp4", 256);
 }
 #endif

 // Sample encryption information is stored as CencSampleAuxiliaryDataFormat
 // (ISO/IEC 23001-7:2015 8) inside 'mdat' box. No SampleEncryption ('senc') box.
 TEST_F(MP4StreamParserTest, CencWithEncryptionInfoStoredAsAuxDataInMdat) {
   // Encrypted test mp4 files have non-zero duration and are treated as
   // recorded streams.
   auto params = GetDefaultInitParametersExpectations();
   params.duration = base::Microseconds(2736066);
   params.liveness = DemuxerStream::LIVENESS_RECORDED;
   params.detected_audio_track_count = 0;
   InitializeParserWithInitParametersExpectations(params);

   scoped_refptr<DecoderBuffer> buffer =
       ReadTestDataFile("bear-1280x720-v_frag-cenc.mp4");
   EXPECT_TRUE(AppendDataInPieces(buffer->data(), buffer->data_size(), 512));
 }

 TEST_F(MP4StreamParserTest, CencWithSampleEncryptionBox) {
   // Encrypted test mp4 files have non-zero duration and are treated as
   // recorded streams.
   auto params = GetDefaultInitParametersExpectations();
   params.duration = base::Microseconds(2736066);
   params.liveness = DemuxerStream::LIVENESS_RECORDED;
   params.detected_audio_track_count = 0;
   InitializeParserWithInitParametersExpectations(params);

   scoped_refptr<DecoderBuffer> buffer =
       ReadTestDataFile("bear-640x360-v_frag-cenc-senc.mp4");
   EXPECT_TRUE(AppendDataInPieces(buffer->data(), buffer->data_size(), 512));
 }

 TEST_F(MP4StreamParserTest, NaturalSizeWithoutPASP) {
   auto params = GetDefaultInitParametersExpectations();
   params.duration = base::Microseconds(1000966);
   params.liveness = DemuxerStream::LIVENESS_RECORDED;
   params.detected_audio_track_count = 0;
   InitializeParserWithInitParametersExpectations(params);

   scoped_refptr<DecoderBuffer> buffer =
       ReadTestDataFile("bear-640x360-non_square_pixel-without_pasp.mp4");

   EXPECT_TRUE(AppendDataInPieces(buffer->data(), buffer->data_size(), 512));
   EXPECT_EQ(gfx::Size(639, 360), video_decoder_config_.natural_size());
 }

 TEST_F(MP4StreamParserTest, NaturalSizeWithPASP) {
   auto params = GetDefaultInitParametersExpectations();
   params.duration = base::Microseconds(1000966);
   params.liveness = DemuxerStream::LIVENESS_RECORDED;
   params.detected_audio_track_count = 0;
   InitializeParserWithInitParametersExpectations(params);

   scoped_refptr<DecoderBuffer> buffer =
       ReadTestDataFile("bear-640x360-non_square_pixel-with_pasp.mp4");

   EXPECT_TRUE(AppendDataInPieces(buffer->data(), buffer->data_size(), 512));
   EXPECT_EQ(gfx::Size(639, 360), video_decoder_config_.natural_size());
 }

 TEST_F(MP4StreamParserTest, DemuxingAC3) {
   std::set<int> audio_object_types;
   audio_object_types.insert(kAC3);
   parser_.reset(new MP4StreamParser(audio_object_types, false, false));

 #if BUILDFLAG(ENABLE_PLATFORM_AC3_EAC3_AUDIO)
   bool expect_success = true;
 #else
   bool expect_success = false;
   EXPECT_MEDIA_LOG(ErrorLog("Unsupported audio format 0x61632d33 in stsd box"));
 #endif

   auto params = GetDefaultInitParametersExpectations();
   params.duration = base::Microseconds(1045000);
   params.liveness = DemuxerStream::LIVENESS_RECORDED;
   params.detected_video_track_count = 0;
   InitializeParserWithInitParametersExpectations(params);

   scoped_refptr<DecoderBuffer> buffer =
       ReadTestDataFile("bear-ac3-only-frag.mp4");
   EXPECT_EQ(expect_success,
             AppendDataInPieces(buffer->data(), buffer->data_size(), 512));
 }

 TEST_F(MP4StreamParserTest, DemuxingEAC3) {
   std::set<int> audio_object_types;
   audio_object_types.insert(kEAC3);
   parser_.reset(new MP4StreamParser(audio_object_types, false, false));

 #if BUILDFLAG(ENABLE_PLATFORM_AC3_EAC3_AUDIO)
   bool expect_success = true;
 #else
   bool expect_success = false;
   EXPECT_MEDIA_LOG(ErrorLog("Unsupported audio format 0x65632d33 in stsd box"));
 #endif

   auto params = GetDefaultInitParametersExpectations();
   params.duration = base::Microseconds(1045000);
   params.liveness = DemuxerStream::LIVENESS_RECORDED;
   params.detected_video_track_count = 0;
   InitializeParserWithInitParametersExpectations(params);

   scoped_refptr<DecoderBuffer> buffer =
       ReadTestDataFile("bear-eac3-only-frag.mp4");
   EXPECT_EQ(expect_success,
             AppendDataInPieces(buffer->data(), buffer->data_size(), 512));
 }

 TEST_F(MP4StreamParserTest, Flac) {
   parser_.reset(new MP4StreamParser(std::set<int>(), false, true));

   auto params = GetDefaultInitParametersExpectations();
   params.detected_video_track_count = 0;
   InitializeParserWithInitParametersExpectations(params);

   scoped_refptr<DecoderBuffer> buffer = ReadTestDataFile("bear-flac_frag.mp4");
   EXPECT_TRUE(AppendDataInPieces(buffer->data(), buffer->data_size(), 512));
 }

 TEST_F(MP4StreamParserTest, Flac192kHz) {
   parser_.reset(new MP4StreamParser(std::set<int>(), false, true));

   auto params = GetDefaultInitParametersExpectations();
   params.detected_video_track_count = 0;

   // 192kHz exceeds the range of AudioSampleEntry samplerate. The correct
   // samplerate should be applied from the dfLa STREAMINFO metadata block.
   EXPECT_MEDIA_LOG(FlacAudioSampleRateOverriddenByStreaminfo("0", "192000"));
   InitializeParserWithInitParametersExpectations(params);

   scoped_refptr<DecoderBuffer> buffer =
       ReadTestDataFile("bear-flac-192kHz_frag.mp4");
   EXPECT_TRUE(AppendDataInPieces(buffer->data(), buffer->data_size(), 512));
 }

 TEST_F(MP4StreamParserTest, Vp9) {
   auto params = GetDefaultInitParametersExpectations();
   params.detected_audio_track_count = 0;
   InitializeParserWithInitParametersExpectations(params);

   auto buffer = ReadTestDataFile("vp9-hdr-init-segment.mp4");
   EXPECT_TRUE(AppendDataInPieces(buffer->data(), buffer->data_size(), 512));

   EXPECT_EQ(video_decoder_config_.profile(), VP9PROFILE_PROFILE2);
   EXPECT_EQ(video_decoder_config_.level(), 31u);
   EXPECT_EQ(video_decoder_config_.color_space_info(),
             VideoColorSpace(VideoColorSpace::PrimaryID::BT2020,
                             VideoColorSpace::TransferID::SMPTEST2084,
                             VideoColorSpace::MatrixID::BT2020_NCL,
                             gfx::ColorSpace::RangeID::LIMITED));

   ASSERT_TRUE(video_decoder_config_.hdr_metadata().has_value());

   const auto& hdr_metadata = *video_decoder_config_.hdr_metadata();
   EXPECT_EQ(hdr_metadata.max_content_light_level, 1000u);
   EXPECT_EQ(hdr_metadata.max_frame_average_light_level, 640u);

   const auto& color_volume_metadata = hdr_metadata.color_volume_metadata;

   constexpr float kColorCoordinateUnit = 1 / 16.0f;
   EXPECT_NEAR(color_volume_metadata.primary_r.x(), 0.68, kColorCoordinateUnit);
   EXPECT_NEAR(color_volume_metadata.primary_r.y(), 0.31998,
               kColorCoordinateUnit);
   EXPECT_NEAR(color_volume_metadata.primary_g.x(), 0.26496,
               kColorCoordinateUnit);
   EXPECT_NEAR(color_volume_metadata.primary_g.y(), 0.68998,
               kColorCoordinateUnit);
   EXPECT_NEAR(color_volume_metadata.primary_b.x(), 0.15, kColorCoordinateUnit);
   EXPECT_NEAR(color_volume_metadata.primary_b.y(), 0.05998,
               kColorCoordinateUnit);
   EXPECT_NEAR(color_volume_metadata.white_point.x(), 0.314,
               kColorCoordinateUnit);
   EXPECT_NEAR(color_volume_metadata.white_point.y(), 0.351,
               kColorCoordinateUnit);

   constexpr float kLuminanceMaxUnit = 1 / 8.0f;
   EXPECT_NEAR(color_volume_metadata.luminance_max, 1000.0f, kLuminanceMaxUnit);

   constexpr float kLuminanceMinUnit = 1 / 14.0;
   EXPECT_NEAR(color_volume_metadata.luminance_min, 0.01f, kLuminanceMinUnit);
 }

 TEST_F(MP4StreamParserTest, FourCCToString) {
   // A real FOURCC should print.
   EXPECT_EQ("mvex", FourCCToString(FOURCC_MVEX));

   // Invalid FOURCC should also print whenever ASCII values are printable.
   EXPECT_EQ("fake", FourCCToString(static_cast<FourCC>(0x66616b65)));

   // Invalid FORCC with non-printable values should not give error message.
   EXPECT_EQ("0x66616b00", FourCCToString(static_cast<FourCC>(0x66616b00)));
 }

 TEST_F(MP4StreamParserTest, MediaTrackInfoSourcing) {
   InitializeParser();
   ParseMP4File("bear-1280x720-av_frag.mp4", 4096);

   EXPECT_EQ(media_tracks_->tracks().size(), 2u);
   const MediaTrack& video_track = *(media_tracks_->tracks()[0]);
   EXPECT_EQ(video_track.type(), MediaTrack::Video);
   EXPECT_EQ(video_track.bytestream_track_id(), 1);
   EXPECT_EQ(video_track.kind().value(), "main");
   EXPECT_EQ(video_track.label().value(), "VideoHandler");
   EXPECT_EQ(video_track.language().value(), "und");

   const MediaTrack& audio_track = *(media_tracks_->tracks()[1]);
   EXPECT_EQ(audio_track.type(), MediaTrack::Audio);
   EXPECT_EQ(audio_track.bytestream_track_id(), 2);
   EXPECT_EQ(audio_track.kind().value(), "main");
   EXPECT_EQ(audio_track.label().value(), "SoundHandler");
   EXPECT_EQ(audio_track.language().value(), "und");
 }

 TEST_F(MP4StreamParserTest, TextTrackDetection) {
   auto params = GetDefaultInitParametersExpectations();
   params.detected_text_track_count = 1;
   InitializeParserWithInitParametersExpectations(params);

   scoped_refptr<DecoderBuffer> buffer =
       ReadTestDataFile("bear-1280x720-avt_subt_frag.mp4");

   EXPECT_TRUE(AppendDataInPieces(buffer->data(), buffer->data_size(), 512));
 }

 TEST_F(MP4StreamParserTest, MultiTrackFile) {
   auto params = GetDefaultInitParametersExpectations();
   params.duration = base::Milliseconds(4248);
   params.liveness = DemuxerStream::LIVENESS_RECORDED;
   params.detected_audio_track_count = 2;
   params.detected_video_track_count = 2;
   InitializeParserWithInitParametersExpectations(params);
   ParseMP4File("bbb-320x240-2video-2audio.mp4", 4096);

   EXPECT_EQ(media_tracks_->tracks().size(), 4u);

   const MediaTrack& video_track1 = *(media_tracks_->tracks()[0]);
   EXPECT_EQ(video_track1.type(), MediaTrack::Video);
   EXPECT_EQ(video_track1.bytestream_track_id(), 1);
   EXPECT_EQ(video_track1.kind().value(), "main");
   EXPECT_EQ(video_track1.label().value(), "VideoHandler");
   EXPECT_EQ(video_track1.language().value(), "und");

   const MediaTrack& audio_track1 = *(media_tracks_->tracks()[1]);
   EXPECT_EQ(audio_track1.type(), MediaTrack::Audio);
   EXPECT_EQ(audio_track1.bytestream_track_id(), 2);
   EXPECT_EQ(audio_track1.kind().value(), "main");
   EXPECT_EQ(audio_track1.label().value(), "SoundHandler");
   EXPECT_EQ(audio_track1.language().value(), "und");

   const MediaTrack& video_track2 = *(media_tracks_->tracks()[2]);
   EXPECT_EQ(video_track2.type(), MediaTrack::Video);
   EXPECT_EQ(video_track2.bytestream_track_id(), 3);
   EXPECT_EQ(video_track2.kind().value(), "");
   EXPECT_EQ(video_track2.label().value(), "VideoHandler");
   EXPECT_EQ(video_track2.language().value(), "und");

   const MediaTrack& audio_track2 = *(media_tracks_->tracks()[3]);
   EXPECT_EQ(audio_track2.type(), MediaTrack::Audio);
   EXPECT_EQ(audio_track2.bytestream_track_id(), 4);
   EXPECT_EQ(audio_track2.kind().value(), "");
   EXPECT_EQ(audio_track2.label().value(), "SoundHandler");
   EXPECT_EQ(audio_track2.language().value(), "und");
 }

 // <cos(θ), sin(θ), θ expressed as a rotation Enum>
 using MatrixRotationTestCaseParam =
     std::tuple<double, double, VideoTransformation>;

 class MP4StreamParserRotationMatrixEvaluatorTest
     : public ::testing::TestWithParam<MatrixRotationTestCaseParam> {
  public:
   MP4StreamParserRotationMatrixEvaluatorTest() {
     std::set<int> audio_object_types;
     audio_object_types.insert(kISO_14496_3);
     parser_.reset(new MP4StreamParser(audio_object_types, false, false));
   }

  protected:
   std::unique_ptr<MP4StreamParser> parser_;
 };

 TEST_P(MP4StreamParserRotationMatrixEvaluatorTest, RotationCalculation) {
   TrackHeader track_header;
   MovieHeader movie_header;

   // Identity matrix, with 16.16 and 2.30 fixed points.
   uint32_t identity_matrix[9] = {1 << 16, 0, 0, 0, 1 << 16, 0, 0, 0, 1 << 30};

   memcpy(movie_header.display_matrix, identity_matrix, sizeof(identity_matrix));
   memcpy(track_header.display_matrix, identity_matrix, sizeof(identity_matrix));

   MatrixRotationTestCaseParam data = GetParam();

   // Insert fixed point decimal data into the rotation matrix.
   track_header.display_matrix[0] = std::get<0>(data) * (1 << 16);
   track_header.display_matrix[4] = std::get<0>(data) * (1 << 16);
   track_header.display_matrix[1] = -(std::get<1>(data) * (1 << 16));
   track_header.display_matrix[3] = std::get<1>(data) * (1 << 16);

   VideoTransformation expected = std::get<2>(data);
   VideoTransformation actual =
       parser_->CalculateRotation(track_header, movie_header);
   EXPECT_EQ(actual.rotation, expected.rotation);
   EXPECT_EQ(actual.mirrored, expected.mirrored);
 }

 MatrixRotationTestCaseParam rotation_test_cases[6] = {
     {1, 0, VideoTransformation(VIDEO_ROTATION_0)},  // cos(0)  = 1, sin(0)  = 0
     {0, -1,
      VideoTransformation(VIDEO_ROTATION_90)},  // cos(90) = 0, sin(90) =-1
     {-1, 0,
      VideoTransformation(VIDEO_ROTATION_180)},  // cos(180)=-1, sin(180)= 0
     {0, 1,
      VideoTransformation(VIDEO_ROTATION_270)},      // cos(270)= 0, sin(270)= 1
     {1, 1, VideoTransformation(VIDEO_ROTATION_0)},  // Error case
     {5, 5, VideoTransformation(VIDEO_ROTATION_0)},  // Error case
 };
 INSTANTIATE_TEST_SUITE_P(CheckMath,
                          MP4StreamParserRotationMatrixEvaluatorTest,
                          testing::ValuesIn(rotation_test_cases));

 }  // namespace mp4
 }  // namespace media