// src/cobalt/media/filters/frame_processor_unittest.cc - cobalt - Git at Google

 // Copyright 2014 The Chromium Authors. All rights reserved.
 // Use of this source code is governed by a BSD-style license that can be
 // found in the LICENSE file.

 #include <map>
 #include <memory>
 #include <string>
 #include <vector>

 #include "base/basictypes.h"
 #include "base/bind.h"
 #include "base/message_loop/message_loop.h"
 #include "base/run_loop.h"
 #include "base/strings/string_number_conversions.h"
 #include "base/strings/string_split.h"
 #include "base/strings/string_util.h"
 #include "base/time/time.h"
 #include "cobalt/media/base/media_log.h"
 #include "cobalt/media/base/media_util.h"
 #include "cobalt/media/base/mock_filters.h"
 #include "cobalt/media/base/test_helpers.h"
 #include "cobalt/media/base/timestamp_constants.h"
 #include "cobalt/media/filters/chunk_demuxer.h"
 #include "cobalt/media/filters/frame_processor.h"
 #include "starboard/types.h"
 #include "testing/gtest/include/gtest/gtest.h"

 using ::testing::InSequence;
 using ::testing::StrictMock;
 using ::testing::Values;

 namespace cobalt {
 namespace media {

 typedef StreamParser::BufferQueue BufferQueue;
 typedef StreamParser::TrackId TrackId;

 // Used for setting expectations on callbacks. Using a StrictMock also lets us
 // test for missing or extra callbacks.
 class FrameProcessorTestCallbackHelper {
  public:
   FrameProcessorTestCallbackHelper() {}
   virtual ~FrameProcessorTestCallbackHelper() {}

   MOCK_METHOD1(PossibleDurationIncrease, void(base::TimeDelta new_duration));

   // Helper that calls the mock method as well as does basic sanity checks on
   // |new_duration|.
   void OnPossibleDurationIncrease(base::TimeDelta new_duration) {
     PossibleDurationIncrease(new_duration);
     ASSERT_NE(kNoTimestamp, new_duration);
     ASSERT_NE(kInfiniteDuration, new_duration);
   }

  private:
   DISALLOW_COPY_AND_ASSIGN(FrameProcessorTestCallbackHelper);
 };

 // Test parameter determines indicates if the TEST_P instance is targeted for
 // sequence mode (if true), or segments mode (if false).
 class FrameProcessorTest : public testing::TestWithParam<bool> {
  protected:
   FrameProcessorTest()
       : frame_processor_(new FrameProcessor(
             base::Bind(
                 &FrameProcessorTestCallbackHelper::OnPossibleDurationIncrease,
                 base::Unretained(&callbacks_)),
             new MediaLog())),
         append_window_end_(kInfiniteDuration),
         frame_duration_(base::TimeDelta::FromMilliseconds(10)),
         audio_id_(1),
         video_id_(2) {}

   enum StreamFlags { HAS_AUDIO = 1 << 0, HAS_VIDEO = 1 << 1 };

   void AddTestTracks(int stream_flags) {
     const bool has_audio = (stream_flags & HAS_AUDIO) != 0;
     const bool has_video = (stream_flags & HAS_VIDEO) != 0;
     ASSERT_TRUE(has_audio || has_video);

     if (has_audio) {
       CreateAndConfigureStream(DemuxerStream::AUDIO);
       ASSERT_TRUE(audio_);
       EXPECT_TRUE(frame_processor_->AddTrack(audio_id_, audio_.get()));
       seek(audio_.get(), base::TimeDelta());
     }
     if (has_video) {
       CreateAndConfigureStream(DemuxerStream::VIDEO);
       ASSERT_TRUE(video_);
       EXPECT_TRUE(frame_processor_->AddTrack(video_id_, video_.get()));
       seek(video_.get(), base::TimeDelta());
     }
   }

   void SetTimestampOffset(base::TimeDelta new_offset) {
     timestamp_offset_ = new_offset;
     frame_processor_->SetGroupStartTimestampIfInSequenceMode(timestamp_offset_);
   }

   BufferQueue StringToBufferQueue(const std::string& buffers_to_append,
                                   const TrackId track_id,
                                   const DemuxerStream::Type type) {
     std::vector<std::string> timestamps = base::SplitString(
         buffers_to_append, " ", base::TRIM_WHITESPACE, base::SPLIT_WANT_ALL);

     BufferQueue buffers;
     for (size_t i = 0; i < timestamps.size(); i++) {
       bool is_keyframe = false;
       if (base::EndsWith(timestamps[i], "K", base::CompareCase::SENSITIVE)) {
         is_keyframe = true;
         // Remove the "K" off of the token.
         timestamps[i] = timestamps[i].substr(0, timestamps[i].length() - 1);
       }

       // Use custom decode timestamp if included.
       std::vector<std::string> buffer_timestamps = base::SplitString(
           timestamps[i], "|", base::TRIM_WHITESPACE, base::SPLIT_WANT_ALL);
       if (buffer_timestamps.size() == 1)
         buffer_timestamps.push_back(buffer_timestamps[0]);
       CHECK_EQ(2u, buffer_timestamps.size());

       double time_in_ms, decode_time_in_ms;
       CHECK(base::StringToDouble(buffer_timestamps[0], &time_in_ms));
       CHECK(base::StringToDouble(buffer_timestamps[1], &decode_time_in_ms));

       // Create buffer. Encode the original time_in_ms as the buffer's data to
       // enable later verification of possible buffer relocation in presentation
       // timeline due to coded frame processing.
       const uint8_t* timestamp_as_data =
           reinterpret_cast<uint8_t*>(&time_in_ms);
       scoped_refptr<StreamParserBuffer> buffer = StreamParserBuffer::CopyFrom(
           timestamp_as_data, sizeof(time_in_ms), is_keyframe, type, track_id);
       ASSERT_TRUE(buffer);
       base::TimeDelta timestamp = base::TimeDelta::FromSecondsD(
           time_in_ms / base::Time::kMillisecondsPerSecond);
       buffer->set_timestamp(timestamp);
       if (time_in_ms != decode_time_in_ms) {
         DecodeTimestamp decode_timestamp = DecodeTimestamp::FromSecondsD(
             decode_time_in_ms / base::Time::kMillisecondsPerSecond);
         buffer->SetDecodeTimestamp(decode_timestamp);
       }

       buffer->set_duration(frame_duration_);
       buffers.push_back(buffer);
     }
     return buffers;
   }

   void ProcessFrames(const std::string& audio_timestamps,
                      const std::string& video_timestamps) {
     StreamParser::BufferQueueMap buffer_queue_map;
     const auto& audio_buffers =
         StringToBufferQueue(audio_timestamps, audio_id_, DemuxerStream::AUDIO);
     if (!audio_buffers.empty())
       buffer_queue_map.insert(std::make_pair(audio_id_, audio_buffers));
     const auto& video_buffers =
         StringToBufferQueue(video_timestamps, video_id_, DemuxerStream::VIDEO);
     if (!video_buffers.empty())
       buffer_queue_map.insert(std::make_pair(video_id_, video_buffers));
     ASSERT_TRUE(frame_processor_->ProcessFrames(
         buffer_queue_map, append_window_start_, append_window_end_,
         &timestamp_offset_));
   }

   void CheckExpectedRangesByTimestamp(ChunkDemuxerStream* stream,
                                       const std::string& expected) {
     // Note, DemuxerStream::TEXT streams return [0,duration (==infinity here))
     Ranges<base::TimeDelta> r = stream->GetBufferedRanges(kInfiniteDuration);

     std::stringstream ss;
     ss << "{ ";
     for (size_t i = 0; i < r.size(); ++i) {
       int64_t start = r.start(i).InMilliseconds();
       int64_t end = r.end(i).InMilliseconds();
       ss << "[" << start << "," << end << ") ";
     }
     ss << "}";
     EXPECT_EQ(expected, ss.str());
   }

   void CheckReadStalls(ChunkDemuxerStream* stream) {
     int loop_count = 0;

     do {
       read_callback_called_ = false;
       stream->Read(base::Bind(&FrameProcessorTest::StoreStatusAndBuffer,
                               base::Unretained(this)));
       base::RunLoop().RunUntilIdle();
     } while (++loop_count < 2 && read_callback_called_ &&
              last_read_status_ == DemuxerStream::kAborted);

     ASSERT_FALSE(read_callback_called_ &&
                  last_read_status_ == DemuxerStream::kAborted)
         << "2 kAborted reads in a row. Giving up.";
     EXPECT_FALSE(read_callback_called_);
   }

   // Format of |expected| is a space-delimited sequence of
   // timestamp_in_ms:original_timestamp_in_ms
   // original_timestamp_in_ms (and the colon) must be omitted if it is the same
   // as timestamp_in_ms.
   void CheckReadsThenReadStalls(ChunkDemuxerStream* stream,
                                 const std::string& expected) {
     std::vector<std::string> timestamps = base::SplitString(
         expected, " ", base::TRIM_WHITESPACE, base::SPLIT_WANT_ALL);
     std::stringstream ss;
     for (size_t i = 0; i < timestamps.size(); ++i) {
       int loop_count = 0;

       do {
         read_callback_called_ = false;
         stream->Read(base::Bind(&FrameProcessorTest::StoreStatusAndBuffer,
                                 base::Unretained(this)));
         base::RunLoop().RunUntilIdle();
         EXPECT_TRUE(read_callback_called_);
       } while (++loop_count < 2 &&
                last_read_status_ == DemuxerStream::kAborted);

       ASSERT_FALSE(last_read_status_ == DemuxerStream::kAborted)
           << "2 kAborted reads in a row. Giving up.";
       EXPECT_EQ(DemuxerStream::kOk, last_read_status_);
       EXPECT_FALSE(last_read_buffer_->end_of_stream());

       if (i > 0) ss << " ";

       int time_in_ms = last_read_buffer_->timestamp().InMilliseconds();
       ss << time_in_ms;

       // Decode the original_time_in_ms from the buffer's data.
       double original_time_in_ms;
       ASSERT_EQ(sizeof(original_time_in_ms), last_read_buffer_->data_size());
       original_time_in_ms =
           *(reinterpret_cast<const double*>(last_read_buffer_->data()));
       if (original_time_in_ms != time_in_ms) ss << ":" << original_time_in_ms;

       // Detect full-discard preroll buffer.
       if (last_read_buffer_->discard_padding().first == kInfiniteDuration &&
           last_read_buffer_->discard_padding().second.is_zero()) {
         ss << "P";
       }
     }

     EXPECT_EQ(expected, ss.str());
     CheckReadStalls(stream);
   }

   // TODO(wolenetz): Refactor to instead verify the expected signalling or lack
   // thereof of new coded frame group by the FrameProcessor. See
   // https://crbug.com/580613.
   bool in_coded_frame_group() {
     return frame_processor_->coded_frame_group_last_dts_ !=
            kNoDecodeTimestamp();
   }

   void seek(ChunkDemuxerStream* stream, base::TimeDelta seek_time) {
     stream->AbortReads();
     stream->Seek(seek_time);
     stream->StartReturningData();
   }

   base::MessageLoop message_loop_;
   StrictMock<FrameProcessorTestCallbackHelper> callbacks_;

   std::unique_ptr<FrameProcessor> frame_processor_;
   base::TimeDelta append_window_start_;
   base::TimeDelta append_window_end_;
   base::TimeDelta timestamp_offset_;
   base::TimeDelta frame_duration_;
   std::unique_ptr<ChunkDemuxerStream> audio_;
   std::unique_ptr<ChunkDemuxerStream> video_;
   const TrackId audio_id_;
   const TrackId video_id_;
   const BufferQueue empty_queue_;

   // StoreStatusAndBuffer's most recent result.
   DemuxerStream::Status last_read_status_;
   scoped_refptr<DecoderBuffer> last_read_buffer_;
   bool read_callback_called_;

  private:
   void StoreStatusAndBuffer(DemuxerStream::Status status,
                             const scoped_refptr<DecoderBuffer>& buffer) {
     if (status == DemuxerStream::kOk && buffer.get()) {
       DVLOG(3) << __FUNCTION__ << "status: " << status
                << " ts: " << buffer->timestamp().InSecondsF();
     } else {
       DVLOG(3) << __FUNCTION__ << "status: " << status << " ts: n/a";
     }

     read_callback_called_ = true;
     last_read_status_ = status;
     last_read_buffer_ = buffer;
   }

   void CreateAndConfigureStream(DemuxerStream::Type type) {
     // TODO(wolenetz/dalecurtis): Also test with splicing disabled?
     switch (type) {
       case DemuxerStream::AUDIO: {
         ASSERT_FALSE(audio_);
         audio_.reset(new ChunkDemuxerStream(DemuxerStream::AUDIO, true, "1"));
         AudioDecoderConfig decoder_config(kCodecVorbis, kSampleFormatPlanarF32,
                                           CHANNEL_LAYOUT_STEREO, 1000,
                                           EmptyExtraData(), Unencrypted());
         frame_processor_->OnPossibleAudioConfigUpdate(decoder_config);
         ASSERT_TRUE(audio_->UpdateAudioConfig(decoder_config, new MediaLog()));
         break;
       }
       case DemuxerStream::VIDEO: {
         ASSERT_FALSE(video_);
         video_.reset(new ChunkDemuxerStream(DemuxerStream::VIDEO, true, "2"));
         ASSERT_TRUE(video_->UpdateVideoConfig(TestVideoConfig::Normal(),
                                               new MediaLog()));
         break;
       }
       // TODO(wolenetz): Test text coded frame processing.
       case DemuxerStream::TEXT:
       case DemuxerStream::UNKNOWN:
       case DemuxerStream::NUM_TYPES: {
         ASSERT_FALSE(true);
       }
     }
   }

   DISALLOW_COPY_AND_ASSIGN(FrameProcessorTest);
 };

 TEST_F(FrameProcessorTest, WrongTypeInAppendedBuffer) {
   // A VIDEO-typed buffer queued under the audio track id is expected to make
   // ProcessFrames() fail and leave the audio stream untouched.
   AddTestTracks(HAS_AUDIO);
   EXPECT_FALSE(in_coded_frame_group());

   const BufferQueue mistyped_buffers =
       StringToBufferQueue("0K", audio_id_, DemuxerStream::VIDEO);
   StreamParser::BufferQueueMap queues_by_track;
   queues_by_track.insert(std::make_pair(audio_id_, mistyped_buffers));

   const bool processed = frame_processor_->ProcessFrames(
       queues_by_track, append_window_start_, append_window_end_,
       &timestamp_offset_);
   ASSERT_FALSE(processed);

   // Nothing was buffered and no coded frame group was started.
   EXPECT_FALSE(in_coded_frame_group());
   EXPECT_EQ(base::TimeDelta(), timestamp_offset_);
   CheckExpectedRangesByTimestamp(audio_.get(), "{ }");
   CheckReadStalls(audio_.get());
 }

 TEST_F(FrameProcessorTest, NonMonotonicallyIncreasingTimestampInOneCall) {
   // A single append whose timestamps go backwards (10ms then 0ms) is expected
   // to be rejected by ProcessFrames().
   AddTestTracks(HAS_AUDIO);

   const BufferQueue out_of_order_buffers =
       StringToBufferQueue("10K 0K", audio_id_, DemuxerStream::AUDIO);
   StreamParser::BufferQueueMap queues_by_track;
   queues_by_track.insert(std::make_pair(audio_id_, out_of_order_buffers));

   const bool processed = frame_processor_->ProcessFrames(
       queues_by_track, append_window_start_, append_window_end_,
       &timestamp_offset_);
   ASSERT_FALSE(processed);

   // Nothing was buffered and no coded frame group is in progress.
   EXPECT_FALSE(in_coded_frame_group());
   EXPECT_EQ(base::TimeDelta(), timestamp_offset_);
   CheckExpectedRangesByTimestamp(audio_.get(), "{ }");
   CheckReadStalls(audio_.get());
 }

 TEST_P(FrameProcessorTest, AudioOnly_SingleFrame) {
   // Scenario (audio only): P(A) -> (a)
   InSequence in_sequence;
   AddTestTracks(HAS_AUDIO);
   const bool sequence_mode = GetParam();
   if (sequence_mode) {
     frame_processor_->SetSequenceMode(true);
   }

   // One 10ms keyframe at time zero.
   EXPECT_CALL(callbacks_, PossibleDurationIncrease(frame_duration_));
   ProcessFrames("0K", "");

   EXPECT_TRUE(in_coded_frame_group());
   EXPECT_EQ(base::TimeDelta(), timestamp_offset_);
   CheckExpectedRangesByTimestamp(audio_.get(), "{ [0,10) }");
   CheckReadsThenReadStalls(audio_.get(), "0");
 }

 TEST_P(FrameProcessorTest, VideoOnly_SingleFrame) {
   // Scenario (video only): P(V) -> (v)
   InSequence in_sequence;
   AddTestTracks(HAS_VIDEO);
   const bool sequence_mode = GetParam();
   if (sequence_mode) {
     frame_processor_->SetSequenceMode(true);
   }

   // One 10ms keyframe at time zero.
   EXPECT_CALL(callbacks_, PossibleDurationIncrease(frame_duration_));
   ProcessFrames("", "0K");

   EXPECT_TRUE(in_coded_frame_group());
   EXPECT_EQ(base::TimeDelta(), timestamp_offset_);
   CheckExpectedRangesByTimestamp(video_.get(), "{ [0,10) }");
   CheckReadsThenReadStalls(video_.get(), "0");
 }

 TEST_P(FrameProcessorTest, AudioOnly_TwoFrames) {
   // Scenario (audio only): P(A0, A10) -> (a0, a10)
   InSequence in_sequence;
   AddTestTracks(HAS_AUDIO);
   const bool sequence_mode = GetParam();
   if (sequence_mode) {
     frame_processor_->SetSequenceMode(true);
   }

   const base::TimeDelta two_frames = frame_duration_ * 2;
   EXPECT_CALL(callbacks_, PossibleDurationIncrease(two_frames));
   ProcessFrames("0K 10K", "");

   EXPECT_TRUE(in_coded_frame_group());
   EXPECT_EQ(base::TimeDelta(), timestamp_offset_);
   CheckExpectedRangesByTimestamp(audio_.get(), "{ [0,20) }");
   CheckReadsThenReadStalls(audio_.get(), "0 10");
 }

 TEST_P(FrameProcessorTest, AudioOnly_SetOffsetThenSingleFrame) {
   // Scenario (audio only): STSO(50)+P(A0) -> TSO==50,(a0@50)
   InSequence in_sequence;
   AddTestTracks(HAS_AUDIO);
   const bool sequence_mode = GetParam();
   if (sequence_mode) {
     frame_processor_->SetSequenceMode(true);
   }

   const base::TimeDelta fifty_ms = base::TimeDelta::FromMilliseconds(50);
   SetTimestampOffset(fifty_ms);

   const base::TimeDelta expected_duration = frame_duration_ + fifty_ms;
   EXPECT_CALL(callbacks_, PossibleDurationIncrease(expected_duration));
   ProcessFrames("0K", "");

   EXPECT_TRUE(in_coded_frame_group());
   EXPECT_EQ(fifty_ms, timestamp_offset_);
   CheckExpectedRangesByTimestamp(audio_.get(), "{ [50,60) }");

   // Thanks to SourceBufferStream::kSeekToStartFudgeRoom(), reading succeeds
   // without first seeking to 50ms.
   CheckReadsThenReadStalls(audio_.get(), "50:0");
 }

 TEST_P(FrameProcessorTest, AudioOnly_SetOffsetThenFrameTimestampBelowOffset) {
   // Scenario (audio only): STSO(50)+P(A20) ->
   //   sequence mode: TSO==30,(a20@50)
   //   segments mode: TSO==50,(a20@70)
   InSequence in_sequence;
   AddTestTracks(HAS_AUDIO);
   const bool sequence_mode = GetParam();
   if (sequence_mode) {
     frame_processor_->SetSequenceMode(true);
   }

   const base::TimeDelta fifty_ms = base::TimeDelta::FromMilliseconds(50);
   const base::TimeDelta twenty_ms = base::TimeDelta::FromMilliseconds(20);
   SetTimestampOffset(fifty_ms);

   // The frame ends at 60ms in sequence mode and at 80ms in segments mode.
   const base::TimeDelta expected_duration =
       sequence_mode ? fifty_ms + frame_duration_
                     : fifty_ms + twenty_ms + frame_duration_;
   EXPECT_CALL(callbacks_, PossibleDurationIncrease(expected_duration));

   ProcessFrames("20K", "");
   EXPECT_TRUE(in_coded_frame_group());

   // Thanks to SourceBufferStream::kSeekToStartFudgeRoom(), reading succeeds
   // without first seeking to 50ms / 70ms.
   if (!sequence_mode) {
     EXPECT_EQ(fifty_ms, timestamp_offset_);
     CheckExpectedRangesByTimestamp(audio_.get(), "{ [70,80) }");
     CheckReadsThenReadStalls(audio_.get(), "70:20");
     return;
   }

   EXPECT_EQ(fifty_ms - twenty_ms, timestamp_offset_);
   CheckExpectedRangesByTimestamp(audio_.get(), "{ [50,60) }");
   CheckReadsThenReadStalls(audio_.get(), "50:20");
 }

 TEST_P(FrameProcessorTest, AudioOnly_SequentialProcessFrames) {
   // Scenario (audio only): P(A0,A10)+P(A20,A30) -> (a0,a10,a20,a30)
   InSequence in_sequence;
   AddTestTracks(HAS_AUDIO);
   const bool sequence_mode = GetParam();
   if (sequence_mode) {
     frame_processor_->SetSequenceMode(true);
   }

   // First append: two frames covering [0,20).
   const base::TimeDelta two_frames = frame_duration_ * 2;
   EXPECT_CALL(callbacks_, PossibleDurationIncrease(two_frames));
   ProcessFrames("0K 10K", "");
   EXPECT_TRUE(in_coded_frame_group());
   EXPECT_EQ(base::TimeDelta(), timestamp_offset_);
   CheckExpectedRangesByTimestamp(audio_.get(), "{ [0,20) }");

   // Second append: two more frames extending the range to [0,40).
   const base::TimeDelta four_frames = frame_duration_ * 4;
   EXPECT_CALL(callbacks_, PossibleDurationIncrease(four_frames));
   ProcessFrames("20K 30K", "");
   EXPECT_TRUE(in_coded_frame_group());
   EXPECT_EQ(base::TimeDelta(), timestamp_offset_);
   CheckExpectedRangesByTimestamp(audio_.get(), "{ [0,40) }");

   CheckReadsThenReadStalls(audio_.get(), "0 10 20 30");
 }

 TEST_P(FrameProcessorTest, AudioOnly_NonSequentialProcessFrames) {
   // Scenario (audio only): P(A20,A30)+P(A0,A10) ->
   //   sequence mode: TSO==-20 after first P(), 20 after second P(), and
   //                  (a20@0,a30@10,a0@20,a10@30)
   //   segments mode: TSO==0,(a0,a10,a20,a30)
   InSequence in_sequence;
   AddTestTracks(HAS_AUDIO);
   const bool sequence_mode = GetParam();
   if (sequence_mode) {
     frame_processor_->SetSequenceMode(true);
   }

   // First append ends at 20ms in sequence mode, 40ms in segments mode.
   EXPECT_CALL(callbacks_, PossibleDurationIncrease(
                               frame_duration_ * (sequence_mode ? 2 : 4)));
   ProcessFrames("20K 30K", "");
   EXPECT_TRUE(in_coded_frame_group());

   if (sequence_mode) {
     CheckExpectedRangesByTimestamp(audio_.get(), "{ [0,20) }");
     EXPECT_EQ(frame_duration_ * -2, timestamp_offset_);
   } else {
     CheckExpectedRangesByTimestamp(audio_.get(), "{ [20,40) }");
     EXPECT_EQ(base::TimeDelta(), timestamp_offset_);
   }

   // Second append ends at 40ms in sequence mode, 20ms in segments mode.
   EXPECT_CALL(callbacks_, PossibleDurationIncrease(
                               frame_duration_ * (sequence_mode ? 4 : 2)));
   ProcessFrames("0K 10K", "");
   EXPECT_TRUE(in_coded_frame_group());

   // Both modes end up with the same buffered range.
   CheckExpectedRangesByTimestamp(audio_.get(), "{ [0,40) }");
   if (sequence_mode) {
     EXPECT_EQ(frame_duration_ * 2, timestamp_offset_);
     CheckReadsThenReadStalls(audio_.get(), "0:20 10:30 20:0 30:10");
   } else {
     EXPECT_EQ(base::TimeDelta(), timestamp_offset_);
     // Data was appended earlier than what satisfied the initial seek to
     // start, so seek back to 0ms before reading.
     seek(audio_.get(), base::TimeDelta());
     CheckReadsThenReadStalls(audio_.get(), "0 10 20 30");
   }
 }

 TEST_P(FrameProcessorTest, AudioVideo_SequentialProcessFrames) {
   // Scenario (audio+video): P(A0,A10;V0k,V10,V20)+P(A20,A30,A40,V30) ->
   //   (a0,a10,a20,a30,a40);(v0,v10,v20,v30)
   InSequence in_sequence;
   AddTestTracks(HAS_AUDIO | HAS_VIDEO);
   const bool sequence_mode = GetParam();
   if (sequence_mode) {
     frame_processor_->SetSequenceMode(true);
   }

   // First append: video reaches furthest, ending at 30ms.
   const base::TimeDelta three_frames = frame_duration_ * 3;
   EXPECT_CALL(callbacks_, PossibleDurationIncrease(three_frames));
   ProcessFrames("0K 10K", "0K 10 20");
   EXPECT_TRUE(in_coded_frame_group());
   EXPECT_EQ(base::TimeDelta(), timestamp_offset_);
   CheckExpectedRangesByTimestamp(audio_.get(), "{ [0,20) }");
   CheckExpectedRangesByTimestamp(video_.get(), "{ [0,30) }");

   // Second append: audio reaches furthest, ending at 50ms.
   const base::TimeDelta five_frames = frame_duration_ * 5;
   EXPECT_CALL(callbacks_, PossibleDurationIncrease(five_frames));
   ProcessFrames("20K 30K 40K", "30");
   EXPECT_TRUE(in_coded_frame_group());
   EXPECT_EQ(base::TimeDelta(), timestamp_offset_);
   CheckExpectedRangesByTimestamp(audio_.get(), "{ [0,50) }");
   CheckExpectedRangesByTimestamp(video_.get(), "{ [0,40) }");

   CheckReadsThenReadStalls(audio_.get(), "0 10 20 30 40");
   CheckReadsThenReadStalls(video_.get(), "0 10 20 30");
 }

 TEST_P(FrameProcessorTest, AudioVideo_Discontinuity) {
   // Scenario (audio+video): P(A0,A10,A30,A40,A50;V0k,V10,V40,V50key) ->
   //   sequence mode: TSO==10,(a0,a10,a30,a40,a50@60);(v0,v10,v50@60)
   //   segments mode: TSO==0,(a0,a10,a30,a40,a50);(v0,v10,v50)
   // This relies on A40K being processed before V40, which currently depends
   // on MergeBufferQueues() behavior.
   InSequence in_sequence;
   AddTestTracks(HAS_AUDIO | HAS_VIDEO);
   const bool sequence_mode = GetParam();
   if (sequence_mode) {
     frame_processor_->SetSequenceMode(true);
   }
   EXPECT_CALL(callbacks_, PossibleDurationIncrease(
                               frame_duration_ * (sequence_mode ? 7 : 6)));

   ProcessFrames("0K 10K 30K 40K 50K", "0K 10 40 50K");
   EXPECT_TRUE(in_coded_frame_group());

   if (!sequence_mode) {
     EXPECT_EQ(base::TimeDelta(), timestamp_offset_);
     CheckExpectedRangesByTimestamp(audio_.get(), "{ [0,60) }");
     CheckExpectedRangesByTimestamp(video_.get(), "{ [0,20) [50,60) }");
     CheckReadsThenReadStalls(audio_.get(), "0 10 30 40 50");
     CheckReadsThenReadStalls(video_.get(), "0 10");
     // The second video range is only readable after seeking to it.
     seek(video_.get(), frame_duration_ * 5);
     CheckReadsThenReadStalls(video_.get(), "50");
     return;
   }

   EXPECT_EQ(frame_duration_, timestamp_offset_);
   CheckExpectedRangesByTimestamp(audio_.get(), "{ [0,70) }");
   CheckExpectedRangesByTimestamp(video_.get(), "{ [0,70) }");
   CheckReadsThenReadStalls(audio_.get(), "0 10 30 40 60:50");
   CheckReadsThenReadStalls(video_.get(), "0 10 60:50");
 }

 TEST_P(FrameProcessorTest, AudioVideo_Discontinuity_TimestampOffset) {
   // In 'sequence' mode a new coded frame group is *only* started when the
   // processed frame sequence outputs something that goes backwards in DTS
   // order. That preserves the intent of 'sequence' mode: it collapses gaps and
   // also lets the app override timeline placement, so it has to cope with
   // overlap-appends as well.
   InSequence in_sequence;
   AddTestTracks(HAS_AUDIO | HAS_VIDEO);
   const bool sequence_mode = GetParam();
   frame_processor_->SetSequenceMode(sequence_mode);

   const base::TimeDelta hundred_ms = frame_duration_ * 10;
   const base::TimeDelta two_hundred_ms = frame_duration_ * 20;
   const base::TimeDelta fifty_five_ms = base::TimeDelta::FromMilliseconds(55);

   // Step 1: start a coded frame group at 100ms. Despite the jagged start, the
   // coded frame group's start time is the range start for both streams.
   EXPECT_CALL(callbacks_, PossibleDurationIncrease(frame_duration_ * 14));
   SetTimestampOffset(hundred_ms);
   ProcessFrames("0K 10K 20K", "10K 20K 30K");
   EXPECT_EQ(frame_duration_ * 10, timestamp_offset_);
   EXPECT_TRUE(in_coded_frame_group());
   CheckExpectedRangesByTimestamp(audio_.get(), "{ [100,130) }");
   CheckExpectedRangesByTimestamp(video_.get(), "{ [100,140) }");

   // Step 2: jump forward past the normal discontinuity threshold; this is
   // where 'sequence' and 'segments' mode results diverge.
   EXPECT_CALL(callbacks_, PossibleDurationIncrease(frame_duration_ * 24));
   SetTimestampOffset(two_hundred_ms);
   ProcessFrames("0K 10K 20K", "10K 20K 30K");
   EXPECT_EQ(frame_duration_ * 20, timestamp_offset_);
   EXPECT_TRUE(in_coded_frame_group());
   if (sequence_mode) {
     CheckExpectedRangesByTimestamp(audio_.get(), "{ [100,230) }");
     CheckExpectedRangesByTimestamp(video_.get(), "{ [100,240) }");
   } else {
     CheckExpectedRangesByTimestamp(audio_.get(), "{ [100,130) [200,230) }");
     CheckExpectedRangesByTimestamp(video_.get(), "{ [100,140) [200,240) }");
   }

   // Step 3: a timestampOffset change that places the next frames in the past
   // relative to the previously processed frame triggers a new coded frame
   // group, even in 'sequence' mode.
   EXPECT_CALL(callbacks_,
               PossibleDurationIncrease(fifty_five_ms + frame_duration_ * 4));
   SetTimestampOffset(fifty_five_ms);
   ProcessFrames("0K 10K 20K", "10K 20K 30K");
   EXPECT_EQ(fifty_five_ms, timestamp_offset_);
   EXPECT_TRUE(in_coded_frame_group());
   // The new audio range falls outside SourceBufferStream's coalescing
   // threshold relative to the next range, while the new video range falls
   // within it.
   if (sequence_mode) {
     // TODO(wolenetz/chcunningham): The large explicit-timestampOffset-induced
     // jump forward (from timestamp 130 to 200) while in a sequence mode coded
     // frame group makes our adjacency threshold in SourceBuffer, based on
     // max-interbuffer-distance-within-coded-frame-group, very lenient.
     // This causes [55,85) to merge with [100,230) here for audio, and similar
     // for video. See also https://crbug.com/620523.
     CheckExpectedRangesByTimestamp(audio_.get(), "{ [55,230) }");
     CheckExpectedRangesByTimestamp(video_.get(), "{ [55,240) }");
   } else {
     CheckExpectedRangesByTimestamp(audio_.get(),
                                    "{ [55,85) [100,130) [200,230) }");
     // The range adjacency logic used here doesn't consider DTS 85 to be close
     // enough to [100,140), because the first DTS in video range [100,140) is
     // actually 110. The muxed data started a coded frame group at time 100,
     // but actual DTS is used for adjacency checks while appending.
     CheckExpectedRangesByTimestamp(video_.get(),
                                    "{ [55,95) [100,140) [200,240) }");
   }

   // Verify the buffers. Data now exists earlier than what satisfied the
   // initial seek to start, so re-seek first.
   seek(audio_.get(), fifty_five_ms);
   seek(video_.get(), fifty_five_ms);
   if (sequence_mode) {
     // Everything is one contiguous range per stream.
     CheckReadsThenReadStalls(
         audio_.get(),
         "55:0 65:10 75:20 100:0 110:10 120:20 200:0 210:10 220:20");
     CheckReadsThenReadStalls(
         video_.get(),
         "65:10 75:20 85:30 110:10 120:20 130:30 210:10 220:20 230:30");
     return;
   }

   // Segments mode: each of the three ranges needs its own seek.
   CheckReadsThenReadStalls(audio_.get(), "55:0 65:10 75:20");
   CheckReadsThenReadStalls(video_.get(), "65:10 75:20 85:30");
   seek(audio_.get(), frame_duration_ * 10);
   seek(video_.get(), frame_duration_ * 10);
   CheckReadsThenReadStalls(audio_.get(), "100:0 110:10 120:20");
   CheckReadsThenReadStalls(video_.get(), "110:10 120:20 130:30");
   seek(audio_.get(), frame_duration_ * 20);
   seek(video_.get(), frame_duration_ * 20);
   CheckReadsThenReadStalls(audio_.get(), "200:0 210:10 220:20");
   CheckReadsThenReadStalls(video_.get(), "210:10 220:20 230:30");
 }

 TEST_P(FrameProcessorTest,
        AppendWindowFilterOfNegativeBufferTimestampsWithPrerollDiscard) {
   // With a -20ms offset, three audio frames at 0/10/20ms are expected to yield
   // a single buffered range [0,10): a full-discard preroll buffer (original
   // timestamp 10) followed by the frame originally at 20ms.
   InSequence in_sequence;
   AddTestTracks(HAS_AUDIO);
   const bool sequence_mode = GetParam();
   if (sequence_mode) {
     frame_processor_->SetSequenceMode(true);
   }

   const base::TimeDelta negative_offset = frame_duration_ * -2;
   SetTimestampOffset(negative_offset);
   EXPECT_CALL(callbacks_, PossibleDurationIncrease(frame_duration_));
   ProcessFrames("0K 10K 20K", "");

   EXPECT_TRUE(in_coded_frame_group());
   EXPECT_EQ(frame_duration_ * -2, timestamp_offset_);
   CheckExpectedRangesByTimestamp(audio_.get(), "{ [0,10) }");
   CheckReadsThenReadStalls(audio_.get(), "0:10P 0:20");
 }

 TEST_P(FrameProcessorTest, AppendWindowFilterWithInexactPreroll) {
   // With a -10ms offset, the second frame starts slightly early (9.75ms
   // instead of 10ms). The first frame is expected to come back as a
   // full-discard preroll buffer.
   InSequence in_sequence;
   AddTestTracks(HAS_AUDIO);
   const bool sequence_mode = GetParam();
   if (sequence_mode) {
     frame_processor_->SetSequenceMode(true);
   }

   SetTimestampOffset(-frame_duration_);
   const base::TimeDelta two_frames = frame_duration_ * 2;
   EXPECT_CALL(callbacks_, PossibleDurationIncrease(two_frames));
   ProcessFrames("0K 9.75K 20K", "");

   CheckExpectedRangesByTimestamp(audio_.get(), "{ [0,20) }");
   CheckReadsThenReadStalls(audio_.get(), "0P 0:9.75 10:20");
 }

 TEST_P(FrameProcessorTest, AppendWindowFilterWithInexactPreroll_2) {
   // With a -10ms offset, the second frame starts slightly late (10.25ms
   // instead of 10ms). The first frame is expected to come back as a
   // full-discard preroll buffer.
   InSequence in_sequence;
   AddTestTracks(HAS_AUDIO);
   const bool sequence_mode = GetParam();
   if (sequence_mode) {
     frame_processor_->SetSequenceMode(true);
   }

   SetTimestampOffset(-frame_duration_);
   const base::TimeDelta two_frames = frame_duration_ * 2;
   EXPECT_CALL(callbacks_, PossibleDurationIncrease(two_frames));
   ProcessFrames("0K 10.25K 20K", "");

   CheckExpectedRangesByTimestamp(audio_.get(), "{ [0,20) }");
   CheckReadsThenReadStalls(audio_.get(), "0P 0:10.25 10:20");
 }

 TEST_P(FrameProcessorTest, AllowNegativeFramePTSAndDTSBeforeOffsetAdjustment) {
   // Frames whose original timestamps start below zero (-5ms) must still be
   // processed; the resulting placement differs between the two modes.
   InSequence in_sequence;
   AddTestTracks(HAS_AUDIO);
   const bool sequence_mode = GetParam();
   if (sequence_mode) {
     frame_processor_->SetSequenceMode(true);
   }

   // Sequence mode ends at 30ms; segments mode ends at 25ms.
   const base::TimeDelta expected_duration =
       sequence_mode ? frame_duration_ * 3 : (frame_duration_ * 5) / 2;
   EXPECT_CALL(callbacks_, PossibleDurationIncrease(expected_duration));

   ProcessFrames("-5K 5K 15K", "");

   if (!sequence_mode) {
     EXPECT_EQ(base::TimeDelta(), timestamp_offset_);
     CheckExpectedRangesByTimestamp(audio_.get(), "{ [0,25) }");
     CheckReadsThenReadStalls(audio_.get(), "0:-5 5 15");
     return;
   }

   EXPECT_EQ(frame_duration_ / 2, timestamp_offset_);
   CheckExpectedRangesByTimestamp(audio_.get(), "{ [0,30) }");
   CheckReadsThenReadStalls(audio_.get(), "0:-5 10:5 20:15");
 }

 TEST_P(FrameProcessorTest, PartialAppendWindowFilterNoDiscontinuity) {
   // A frame that is only partially trimmed by the append window must not
   // introduce a spurious discontinuity.
   InSequence in_sequence;
   AddTestTracks(HAS_AUDIO);
   const bool sequence_mode = GetParam();
   if (sequence_mode) {
     frame_processor_->SetSequenceMode(true);
   }

   const base::TimeDelta expected_duration =
       base::TimeDelta::FromMilliseconds(29);
   EXPECT_CALL(callbacks_, PossibleDurationIncrease(expected_duration));

   // The append window starts inside the first frame, at 7ms.
   append_window_start_ = base::TimeDelta::FromMilliseconds(7);
   ProcessFrames("0K 19K", "");

   EXPECT_EQ(base::TimeDelta(), timestamp_offset_);
   CheckExpectedRangesByTimestamp(audio_.get(), "{ [7,29) }");
   CheckReadsThenReadStalls(audio_.get(), "7:0 19");
 }

 TEST_P(FrameProcessorTest,
        PartialAppendWindowFilterNoDiscontinuity_DtsAfterPts) {
   // A partially trimmed frame that originally had DTS > PTS must not introduce
   // a spurious discontinuity.
   InSequence in_sequence;
   AddTestTracks(HAS_AUDIO);
   const bool sequence_mode = GetParam();
   if (sequence_mode) {
     frame_processor_->SetSequenceMode(true);
   }

   // Sequence mode ends at 20ms; segments mode ends at 13ms.
   const base::TimeDelta expected_duration =
       base::TimeDelta::FromMilliseconds(sequence_mode ? 20 : 13);
   EXPECT_CALL(callbacks_, PossibleDurationIncrease(expected_duration));

   ProcessFrames("-7|10K 3|20K", "");

   if (!sequence_mode) {
     EXPECT_EQ(base::TimeDelta(), timestamp_offset_);

     // TODO(wolenetz): Adjust the following expectation to use PTS instead of
     // DTS once https://crbug.com/398130 is fixed.
     CheckExpectedRangesByTimestamp(audio_.get(), "{ [17,30) }");

     CheckReadsThenReadStalls(audio_.get(), "0:-7 3");
     return;
   }

   EXPECT_EQ(base::TimeDelta::FromMilliseconds(7), timestamp_offset_);

   // TODO(wolenetz): Adjust the following expectation to use PTS instead of
   // DTS once https://crbug.com/398130 is fixed.
   CheckExpectedRangesByTimestamp(audio_.get(), "{ [17,37) }");

   CheckReadsThenReadStalls(audio_.get(), "0:-7 10:3");
 }

 TEST_P(FrameProcessorTest, PartialAppendWindowFilterNoNewMediaSegment) {
   // A partial front trim of an audio frame must not force a new media
   // segment to be signalled. Doing so would incorrectly introduce a
   // discontinuity, and the next frame processed after it could then be a
   // non-keyframe video frame.
   InSequence in_order;
   AddTestTracks(HAS_AUDIO | HAS_VIDEO);
   const bool using_sequence_mode = GetParam();
   frame_processor_->SetSequenceMode(using_sequence_mode);

   // Step 1: a video keyframe at 0.
   EXPECT_CALL(callbacks_, PossibleDurationIncrease(frame_duration_));
   ProcessFrames("", "0K");

   // Step 2: an audio keyframe at -5, which is expected to be front-trimmed.
   EXPECT_CALL(callbacks_, PossibleDurationIncrease(frame_duration_));
   ProcessFrames("-5K", "");

   // Step 3: a video non-keyframe at 10. It must still be accepted, which
   // shows that the audio trim did not start a new coded frame group.
   EXPECT_CALL(callbacks_, PossibleDurationIncrease(frame_duration_ * 2));
   ProcessFrames("", "10");

   EXPECT_EQ(base::TimeDelta(), timestamp_offset_);
   EXPECT_TRUE(in_coded_frame_group());

   // Audio keeps only the untrimmed part of its frame; video has both frames.
   CheckExpectedRangesByTimestamp(audio_.get(), "{ [0,5) }");
   CheckExpectedRangesByTimestamp(video_.get(), "{ [0,20) }");
   CheckReadsThenReadStalls(audio_.get(), "0:-5");
   CheckReadsThenReadStalls(video_.get(), "0 10");
 }

 TEST_F(FrameProcessorTest, AudioOnly_SequenceModeContinuityAcrossReset) {
   // Sequence mode only (no test parameter is consulted): a frame appended
   // after Reset() is expected to be placed directly after the previously
   // buffered frame, regardless of its original timestamp.
   InSequence in_order;
   AddTestTracks(HAS_AUDIO);
   frame_processor_->SetSequenceMode(true);

   // First append: a single keyframe at 0.
   EXPECT_CALL(callbacks_, PossibleDurationIncrease(frame_duration_));
   ProcessFrames("0K", "");

   frame_processor_->Reset();

   // Second append: a keyframe originally at 100, after the reset.
   EXPECT_CALL(callbacks_, PossibleDurationIncrease(frame_duration_ * 2));
   ProcessFrames("100K", "");

   // The offset must have moved back by nine frame durations so that the
   // second frame is buffered contiguously after the first.
   const base::TimeDelta expected_offset = frame_duration_ * -9;
   EXPECT_EQ(expected_offset, timestamp_offset_);
   EXPECT_TRUE(in_coded_frame_group());
   CheckExpectedRangesByTimestamp(audio_.get(), "{ [0,20) }");
   CheckReadsThenReadStalls(audio_.get(), "0 10:100");
 }

 TEST_P(FrameProcessorTest, PartialAppendWindowZeroDurationPreroll) {
   // Verifies that a zero-duration frame falling just before the append
   // window is retained as preroll, and that it is attached (still with zero
   // duration) to the next frame that is partially trimmed by the window.
   InSequence in_order;
   AddTestTracks(HAS_AUDIO);
   const bool sequence_mode = GetParam();
   frame_processor_->SetSequenceMode(sequence_mode);

   append_window_start_ = base::TimeDelta::FromMilliseconds(5);

   // First append: a zero-duration frame at 4ms, just ahead of the window.
   frame_duration_ = base::TimeDelta::FromMilliseconds(0);
   EXPECT_FALSE(in_coded_frame_group());
   EXPECT_CALL(callbacks_, PossibleDurationIncrease(frame_duration_));
   ProcessFrames("4K", "");

   // The frame must not show up in the buffered ranges or be readable; it is
   // expected to be silently held back as preroll for a future append.
   CheckExpectedRangesByTimestamp(audio_.get(), "{ }");
   CheckReadsThenReadStalls(audio_.get(), "");
   EXPECT_FALSE(in_coded_frame_group());

   // Abort the reads left pending by the stall above so that they do not
   // "complete" when more data is appended below. Fresh reads are issued
   // afterwards to confirm what ends up buffered.
   seek(audio_.get(), base::TimeDelta());

   // Second append: a 10ms frame at the same timestamp, which overlaps the
   // append window start and is therefore only partially kept.
   frame_duration_ = base::TimeDelta::FromMilliseconds(10);
   const base::TimeDelta expected_duration =
       base::TimeDelta::FromMilliseconds(sequence_mode ? 10 : 14);
   EXPECT_CALL(callbacks_, PossibleDurationIncrease(expected_duration));
   ProcessFrames("4K", "");
   EXPECT_TRUE(in_coded_frame_group());

   // The range must now reflect the trimmed second append.
   //
   // In sequence mode, append window trimming is applied after the append has
   // been adjusted for timestampOffset: everything is rebased to 0 and the
   // trim then removes 5 milliseconds from the front, giving [5,10). In
   // segments mode the frame keeps its original position, giving [5,14).
   const char* expected_ranges = sequence_mode ? "{ [5,10) }" : "{ [5,14) }";
   CheckExpectedRangesByTimestamp(audio_.get(), expected_ranges);

   // In both modes the saved zero-duration buffer is expected to be attached
   // as preroll to the trimmed frame.
   CheckReadsThenReadStalls(audio_.get(), "5:4P 5:4");

   // Verify the preroll buffer still has zero duration.
   StreamParserBuffer* final_buffer =
       static_cast<StreamParserBuffer*>(last_read_buffer_.get());
   ASSERT_EQ(base::TimeDelta::FromMilliseconds(0),
             final_buffer->preroll_buffer()->duration());
 }

 // Instantiate every TEST_P above twice: once with the test parameter set to
 // true (the tests then put the frame processor in sequence mode) and once
 // with it set to false (segments mode).
 INSTANTIATE_TEST_CASE_P(SequenceMode, FrameProcessorTest, Values(true));
 INSTANTIATE_TEST_CASE_P(SegmentsMode, FrameProcessorTest, Values(false));

 }  // namespace media
 }  // namespace cobalt