media/gpu/test/video_encode_accelerator_tests.cc - cobalt - Git at Google

 // Copyright 2020 The Chromium Authors
 // Use of this source code is governed by a BSD-style license that can be
 // found in the LICENSE file.

 #include <algorithm>
 #include <limits>

 #include "base/command_line.h"
 #include "base/files/file_path.h"
 #include "base/files/file_util.h"
 #include "base/strings/string_number_conversions.h"
 #include "media/base/media_switches.h"
 #include "media/base/media_util.h"
 #include "media/base/test_data_util.h"
 #include "media/base/video_bitrate_allocation.h"
 #include "media/base/video_codecs.h"
 #include "media/base/video_decoder_config.h"
 #include "media/gpu/buildflags.h"
 #include "media/gpu/gpu_video_encode_accelerator_helpers.h"
 #include "media/gpu/test/video.h"
 #include "media/gpu/test/video_encoder/bitstream_file_writer.h"
 #include "media/gpu/test/video_encoder/bitstream_validator.h"
 #include "media/gpu/test/video_encoder/decoder_buffer_validator.h"
 #include "media/gpu/test/video_encoder/video_encoder.h"
 #include "media/gpu/test/video_encoder/video_encoder_client.h"
 #include "media/gpu/test/video_encoder/video_encoder_test_environment.h"
 #include "media/gpu/test/video_frame_file_writer.h"
 #include "media/gpu/test/video_frame_helpers.h"
 #include "media/gpu/test/video_frame_validator.h"
 #include "media/gpu/test/video_test_environment.h"
 #include "media/gpu/test/video_test_helpers.h"
 #include "testing/gtest/include/gtest/gtest.h"
 #include "third_party/abseil-cpp/absl/types/optional.h"

 namespace media {
 namespace test {

 namespace {

 // Video encoder tests usage message. Make sure to also update the documentation
 // under docs/media/gpu/video_encoder_test_usage.md when making changes here.
 constexpr const char* usage_msg =
     R"(usage: video_encode_accelerator_tests
            [--codec=<codec>] [--num_temporal_layers=<number>]
            [--num_spatial_layers=<number>] [--bitrate_mode=(cbr|vbr)]
            [--reverse] [--bitrate=<bitrate>]
            [--disable_validator] [--output_bitstream]
            [--output_images=(all|corrupt)] [--output_format=(png|yuv)]
            [--output_folder=<filepath>] [--output_limit=<number>]
            [--disable_vaapi_lock]
            [-v=<level>] [--vmodule=<config>]
            [--gtest_help] [--help]
            [<video path>] [<video metadata path>]
 )";

 // Video encoder tests help message.
 constexpr const char* help_msg =
     R"""(Run the video encoder accelerator tests on the video specified by
 <video path>. If no <video path> is given the default
 "bear_320x192_40frames.yuv.webm" video will be used.

 The <video metadata path> should specify the location of a json file
 containing the video's metadata, such as frame checksums. By default
 <video path>.json will be used.

 The following arguments are supported:
    -v                   enable verbose mode, e.g. -v=2.
   --vmodule             enable verbose mode for the specified module,
                         e.g. --vmodule=*media/gpu*=2.

   --codec               codec profile to encode, "h264" (baseline),
                         "h264main, "h264high", "vp8", "vp9", "av1".
                         H264 Baseline is selected if unspecified.
   --num_temporal_layers the number of temporal layers of the encoded
                         bitstream. A default value is 1.
   --num_spatial_layers  the number of spatial layers of the encoded
                         bitstream. Only used in --codec=vp9 currently.
                         Spatial SVC encoding is applied only in
                         NV12Dmabuf test cases.
   --bitrate             bitrate (bits in second) of a produced bitstram.
                         If not specified, a proper value for the video
                         resolution is selected by the test.
   --bitrate_mode        The rate control mode for encoding, one of "cbr"
                         (default) or "vbr".
   --reverse             the stream plays backwards if the stream reaches
                         end of stream. So the input stream to be encoded
                         is consecutive. By default this is false.
   --disable_validator   disable validation of encoded bitstream.
   --output_bitstream    save the output bitstream in either H264 AnnexB
                         format (for H264) or IVF format (for vp8 and
                         vp9) to <output_folder>/<testname>.
   --output_images       in addition to saving the full encoded,
                         bitstream it's also possible to dump individual
                         frames to <output_folder>/<testname>, possible
                         values are "all|corrupt"
   --output_format       set the format of images saved to disk,
                         supported formats are "png" (default) and
                         "yuv".
   --output_limit        limit the number of images saved to disk.
   --output_folder       set the basic folder used to store test
                         artifacts. The default is the current directory.
   --disable_vaapi_lock  disable the global VA-API lock if applicable,
                         i.e., only on devices that use the VA-API with a libva
                         backend that's known to be thread-safe and only in
                         portions of the Chrome stack that should be able to
                         deal with the absence of the lock
                         (not the VaapiVideoDecodeAccelerator).

   --gtest_help          display the gtest help and exit.
   --help                display this help and exit.
 )""";

 // Default video to be used if no test video was specified.
 constexpr base::FilePath::CharType kDefaultTestVideoPath[] =
     FILE_PATH_LITERAL("bear_320x192_40frames.yuv.webm");

 // The number of frames to encode for bitrate check test cases.
 // TODO(hiroh): Decrease this values to make the test faster.
 constexpr size_t kNumFramesToEncodeForBitrateCheck = 300;
 // Tolerance factor for how encoded bitrate can differ from requested bitrate.
 constexpr double kBitrateTolerance = 0.1;
 constexpr double kVariableBitrateTolerance = 0.3;
 // The event timeout used in bitrate check tests because encoding 2160p and
 // validating |kNumFramesToEncodeBitrateCheck| frames take much time.
 constexpr base::TimeDelta kBitrateCheckEventTimeout = base::Seconds(180);

 media::test::VideoEncoderTestEnvironment* g_env;

 // Video encode test class. Performs setup and teardown for each single test.
 class VideoEncoderTest : public ::testing::Test {
  public:
   // GetDefaultConfig() creates VideoEncoderClientConfig for SharedMemory input
   // encoding. This function must not be called in spatial SVC encoding.
   VideoEncoderClientConfig GetDefaultConfig() {
     const auto& spatial_layers = g_env->SpatialLayers();
     CHECK_LE(spatial_layers.size(), 1u);

     return VideoEncoderClientConfig(g_env->Video(), g_env->Profile(),
                                     spatial_layers, g_env->BitrateAllocation(),
                                     g_env->Reverse());
   }

   std::unique_ptr<VideoEncoder> CreateVideoEncoder(
       Video* video,
       const VideoEncoderClientConfig& config) {
     LOG_ASSERT(video);

     auto video_encoder =
         VideoEncoder::Create(config, CreateBitstreamProcessors(video, config));
     LOG_ASSERT(video_encoder);

     if (!video_encoder->Initialize(video))
       ADD_FAILURE();

     return video_encoder;
   }

  private:
   std::unique_ptr<BitstreamProcessor> CreateBitstreamValidator(
       const Video* video,
       const VideoDecoderConfig& decoder_config,
       const size_t last_frame_index,
       VideoFrameValidator::GetModelFrameCB get_model_frame_cb,
       absl::optional<size_t> spatial_layer_index_to_decode,
       absl::optional<size_t> temporal_layer_index_to_decode,
       const std::vector<gfx::Size>& spatial_layer_resolutions) {
     std::vector<std::unique_ptr<VideoFrameProcessor>> video_frame_processors;

     // Attach a video frame writer to store individual frames to disk if
     // requested.
     std::unique_ptr<VideoFrameProcessor> image_writer;
     auto frame_output_config = g_env->ImageOutputConfig();
     base::FilePath output_folder = base::FilePath(g_env->OutputFolder())
                                        .Append(g_env->GetTestOutputFilePath());
     if (frame_output_config.output_mode != FrameOutputMode::kNone) {
       base::FilePath::StringType output_file_prefix;
       if (spatial_layer_index_to_decode) {
         output_file_prefix +=
             FILE_PATH_LITERAL("SL") +
             base::NumberToString(*spatial_layer_index_to_decode);
       }
       if (temporal_layer_index_to_decode) {
         output_file_prefix +=
             FILE_PATH_LITERAL("TL") +
             base::NumberToString(*temporal_layer_index_to_decode);
       }

       image_writer = VideoFrameFileWriter::Create(
           output_folder, frame_output_config.output_format,
           frame_output_config.output_limit, output_file_prefix);
       LOG_ASSERT(image_writer);
       if (frame_output_config.output_mode == FrameOutputMode::kAll)
         video_frame_processors.push_back(std::move(image_writer));
     }

     // For a resolution less than 360p, we lower the tolerance. Some platforms
     // couldn't compress a low resolution video efficiently with a low bitrate.
     constexpr gfx::Size k360p(640, 360);
     constexpr double kSSIMToleranceForLowerResolution = 0.65;
     const gfx::Size encode_resolution = decoder_config.visible_rect().size();
     const double ssim_tolerance =
         encode_resolution.GetArea() < k360p.GetArea()
             ? kSSIMToleranceForLowerResolution
             : SSIMVideoFrameValidator::kDefaultTolerance;

     auto ssim_validator = SSIMVideoFrameValidator::Create(
         get_model_frame_cb, std::move(image_writer),
         VideoFrameValidator::ValidationMode::kAverage, ssim_tolerance);
     LOG_ASSERT(ssim_validator);
     video_frame_processors.push_back(std::move(ssim_validator));
     return BitstreamValidator::Create(
         decoder_config, last_frame_index, std::move(video_frame_processors),
         spatial_layer_index_to_decode, temporal_layer_index_to_decode,
         spatial_layer_resolutions);
   }

   std::vector<std::unique_ptr<BitstreamProcessor>> CreateBitstreamProcessors(
       Video* video,
       const VideoEncoderClientConfig& config) {
     std::vector<std::unique_ptr<BitstreamProcessor>> bitstream_processors;
     const gfx::Rect visible_rect(config.output_resolution);
     std::vector<gfx::Size> spatial_layer_resolutions;
     // |config.spatial_layers| is filled only in temporal layer or spatial layer
     // encoding.
     for (const auto& sl : config.spatial_layers)
       spatial_layer_resolutions.emplace_back(sl.width, sl.height);

     const VideoCodec codec =
         VideoCodecProfileToVideoCodec(config.output_profile);
     if (g_env->SaveOutputBitstream()) {
       base::FilePath::StringPieceType extension =
           codec == VideoCodec::kH264 ? FILE_PATH_LITERAL("h264")
                                      : FILE_PATH_LITERAL("ivf");
       auto output_bitstream_filepath =
           g_env->OutputFolder()
               .Append(g_env->GetTestOutputFilePath())
               .Append(video->FilePath().BaseName().ReplaceExtension(extension));
       if (!spatial_layer_resolutions.empty()) {
         CHECK_GE(config.num_spatial_layers, 1u);
         CHECK_GE(config.num_temporal_layers, 1u);
         for (size_t spatial_layer_index_to_write = 0;
              spatial_layer_index_to_write < config.num_spatial_layers;
              ++spatial_layer_index_to_write) {
           const gfx::Size& layer_size =
               spatial_layer_resolutions[spatial_layer_index_to_write];
           for (size_t temporal_layer_index_to_write = 0;
                temporal_layer_index_to_write < config.num_temporal_layers;
                ++temporal_layer_index_to_write) {
             bitstream_processors.emplace_back(BitstreamFileWriter::Create(
                 output_bitstream_filepath.InsertBeforeExtensionASCII(
                     FILE_PATH_LITERAL(".SL") +
                     base::NumberToString(spatial_layer_index_to_write) +
                     FILE_PATH_LITERAL(".TL") +
                     base::NumberToString(temporal_layer_index_to_write)),
                 codec, layer_size, config.framerate,
                 config.num_frames_to_encode, spatial_layer_index_to_write,
                 temporal_layer_index_to_write, spatial_layer_resolutions));
             LOG_ASSERT(bitstream_processors.back());
           }
         }
       } else {
         bitstream_processors.emplace_back(BitstreamFileWriter::Create(
             output_bitstream_filepath, codec, visible_rect.size(),
             config.framerate, config.num_frames_to_encode));
         LOG_ASSERT(bitstream_processors.back());
       }
     }

     if (!g_env->IsBitstreamValidatorEnabled()) {
       return bitstream_processors;
     }

     switch (codec) {
       case VideoCodec::kH264:
         bitstream_processors.emplace_back(new H264Validator(
             config.output_profile, visible_rect, config.num_temporal_layers));
         break;
       case VideoCodec::kVP8:
         bitstream_processors.emplace_back(
             new VP8Validator(visible_rect, config.num_temporal_layers));
         break;
       case VideoCodec::kVP9:
         bitstream_processors.emplace_back(new VP9Validator(
             config.output_profile, visible_rect, config.num_spatial_layers,
             config.num_temporal_layers));
         break;
       case VideoCodec::kAV1:
         bitstream_processors.emplace_back(new AV1Validator(visible_rect));
         break;
       default:
         LOG(ERROR) << "Unsupported profile: "
                    << GetProfileName(config.output_profile);
         break;
     }

     raw_data_helper_ = RawDataHelper::Create(video, g_env->Reverse());
     if (!raw_data_helper_) {
       LOG(ERROR) << "Failed to create raw data helper";
       return bitstream_processors;
     }

     if (!spatial_layer_resolutions.empty()) {
       CHECK_GE(config.num_spatial_layers, 1u);
       CHECK_GE(config.num_temporal_layers, 1u);
       for (size_t spatial_layer_index_to_decode = 0;
            spatial_layer_index_to_decode < config.num_spatial_layers;
            ++spatial_layer_index_to_decode) {
         const gfx::Size& layer_size =
             spatial_layer_resolutions[spatial_layer_index_to_decode];
         VideoDecoderConfig decoder_config(
             codec, config.output_profile,
             VideoDecoderConfig::AlphaMode::kIsOpaque, VideoColorSpace(),
             kNoTransformation, layer_size, gfx::Rect(layer_size), layer_size,
             EmptyExtraData(), EncryptionScheme::kUnencrypted);
         VideoFrameValidator::GetModelFrameCB get_model_frame_cb =
             base::BindRepeating(&VideoEncoderTest::GetModelFrame,
                                 base::Unretained(this), gfx::Rect(layer_size));
         for (size_t temporal_layer_index_to_decode = 0;
              temporal_layer_index_to_decode < config.num_temporal_layers;
              ++temporal_layer_index_to_decode) {
           bitstream_processors.emplace_back(CreateBitstreamValidator(
               video, decoder_config, config.num_frames_to_encode - 1,
               get_model_frame_cb, spatial_layer_index_to_decode,
               temporal_layer_index_to_decode, spatial_layer_resolutions));
           LOG_ASSERT(bitstream_processors.back());
         }
       }
     } else {
       // Attach a bitstream validator to validate all encoded video frames. The
       // bitstream validator uses a software video decoder to validate the
       // encoded buffers by decoding them. Metrics such as the image's SSIM can
       // be calculated for additional quality checks.
       VideoDecoderConfig decoder_config(
           codec, config.output_profile,
           VideoDecoderConfig::AlphaMode::kIsOpaque, VideoColorSpace(),
           kNoTransformation, visible_rect.size(), visible_rect,
           visible_rect.size(), EmptyExtraData(),
           EncryptionScheme::kUnencrypted);
       VideoFrameValidator::GetModelFrameCB get_model_frame_cb =
           base::BindRepeating(&VideoEncoderTest::GetModelFrame,
                               base::Unretained(this), visible_rect);
       bitstream_processors.emplace_back(CreateBitstreamValidator(
           video, decoder_config, config.num_frames_to_encode - 1,
           get_model_frame_cb, absl::nullopt, absl::nullopt,
           /*spatial_layer_resolutions=*/{}));
       LOG_ASSERT(bitstream_processors.back());
     }
     return bitstream_processors;
   }

   scoped_refptr<const VideoFrame> GetModelFrame(const gfx::Rect& visible_rect,
                                                 size_t frame_index) {
     LOG_ASSERT(raw_data_helper_);
     auto frame = raw_data_helper_->GetFrame(frame_index);
     if (!frame)
       return nullptr;
     if (visible_rect.size() == frame->visible_rect().size())
       return frame;
     return ScaleVideoFrame(frame.get(), visible_rect.size());
   }

   std::unique_ptr<RawDataHelper> raw_data_helper_;
 };

 absl::optional<std::string> SupportsDynamicFramerate() {
   return g_env->IsKeplerUsed()
              ? absl::make_optional<std::string>(
                    "The rate controller in the kepler firmware doesn't handle "
                    "frame rate changes correctly.")
              : absl::nullopt;
 }

 absl::optional<std::string> SupportsNV12DmaBufInput() {
   return g_env->IsKeplerUsed() ? absl::make_optional<std::string>(
                                      "Encoding with dmabuf input frames is not "
                                      "supported in kepler.")
                                : absl::nullopt;
 }

 }  // namespace

 // Encode video from start to end. Wait for the kFlushDone event at the end of
 // the stream, that notifies us all frames have been encoded.
 TEST_F(VideoEncoderTest, FlushAtEndOfStream) {
   if (g_env->SpatialLayers().size() > 1)
     GTEST_SKIP() << "Skip SHMEM input test cases in spatial SVC encoding";

   auto encoder = CreateVideoEncoder(g_env->Video(), GetDefaultConfig());

   encoder->Encode();
   EXPECT_TRUE(encoder->WaitForFlushDone());

   EXPECT_EQ(encoder->GetFlushDoneCount(), 1u);
   EXPECT_EQ(encoder->GetFrameReleasedCount(), g_env->Video()->NumFrames());
   EXPECT_TRUE(encoder->WaitForBitstreamProcessors());
 }

 // Test initializing the video encoder. The test will be successful if the video
 // encoder is capable of setting up the encoder for the specified codec and
 // resolution. The test only verifies initialization and doesn't do any
 // encoding.
 TEST_F(VideoEncoderTest, Initialize) {
   if (g_env->SpatialLayers().size() > 1)
     GTEST_SKIP() << "Skip SHMEM input test cases in spatial SVC encoding";

   auto encoder = CreateVideoEncoder(g_env->Video(), GetDefaultConfig());

   EXPECT_EQ(encoder->GetEventCount(VideoEncoder::kInitialized), 1u);
 }

 // Create a video encoder and immediately destroy it without initializing. The
 // video encoder will be automatically destroyed when the video encoder goes out
 // of scope at the end of the test. The test will pass if no asserts or crashes
 // are triggered upon destroying.
 TEST_F(VideoEncoderTest, DestroyBeforeInitialize) {
   if (g_env->SpatialLayers().size() > 1)
     GTEST_SKIP() << "Skip SHMEM input test cases in spatial SVC encoding";

   auto video_encoder = VideoEncoder::Create(GetDefaultConfig());

   EXPECT_NE(video_encoder, nullptr);
 }

 // Test forcing key frames while encoding a video.
 TEST_F(VideoEncoderTest, ForceKeyFrame) {
   if (g_env->SpatialLayers().size() > 1)
     GTEST_SKIP() << "Skip SHMEM input test cases in spatial SVC encoding";

   auto config = GetDefaultConfig();
   const size_t middle_frame = config.num_frames_to_encode;
   config.num_frames_to_encode *= 2;
   auto encoder = CreateVideoEncoder(g_env->Video(), config);

   // It is expected that our hw encoders don't produce key frames in a short
   // time span like a few hundred frames.
   encoder->EncodeUntil(VideoEncoder::kBitstreamReady, 1u);
   EXPECT_TRUE(encoder->WaitUntilIdle());
   EXPECT_EQ(encoder->GetEventCount(VideoEncoder::kKeyFrame), 1u);
   // Encode until the middle of stream and request force_keyframe.
   encoder->EncodeUntil(VideoEncoder::kFrameReleased, middle_frame);
   EXPECT_TRUE(encoder->WaitUntilIdle());
   // Check if there is no keyframe except the first frame.
   EXPECT_EQ(encoder->GetEventCount(VideoEncoder::kKeyFrame), 1u);
   encoder->ForceKeyFrame();

   // Encode until the end of stream.
   encoder->Encode();
   EXPECT_TRUE(encoder->WaitForFlushDone());
   // Check if there are two key frames, first frame and one on ForceKeyFrame().
   EXPECT_EQ(encoder->GetEventCount(VideoEncoder::kKeyFrame), 2u);
   EXPECT_EQ(encoder->GetFlushDoneCount(), 1u);
   EXPECT_EQ(encoder->GetFrameReleasedCount(), config.num_frames_to_encode);
   EXPECT_TRUE(encoder->WaitForBitstreamProcessors());
 }

 // Encode video from start to end. Multiple buffer encodes will be queued in the
 // encoder, without waiting for the result of the previous encode requests.
 TEST_F(VideoEncoderTest, FlushAtEndOfStream_MultipleOutstandingEncodes) {
   if (g_env->SpatialLayers().size() > 1)
     GTEST_SKIP() << "Skip SHMEM input test cases in spatial SVC encoding";

   auto config = GetDefaultConfig();
   config.max_outstanding_encode_requests = 4;
   auto encoder = CreateVideoEncoder(g_env->Video(), config);

   encoder->Encode();
   EXPECT_TRUE(encoder->WaitForFlushDone());

   EXPECT_EQ(encoder->GetFlushDoneCount(), 1u);
   EXPECT_EQ(encoder->GetFrameReleasedCount(), g_env->Video()->NumFrames());
   EXPECT_TRUE(encoder->WaitForBitstreamProcessors());
 }

 // Encode multiple videos simultaneously from start to finish.
 TEST_F(VideoEncoderTest, FlushAtEndOfStream_MultipleConcurrentEncodes) {
   if (g_env->SpatialLayers().size() > 1)
     GTEST_SKIP() << "Skip SHMEM input test cases in spatial SVC encoding";

   // Run two encoders for larger resolutions to avoid creating shared memory
   // buffers during the test on lower end devices.
   constexpr gfx::Size k1080p(1920, 1080);
   const size_t kMinSupportedConcurrentEncoders =
       g_env->Video()->Resolution().GetArea() >= k1080p.GetArea() ? 2 : 3;

   auto config = GetDefaultConfig();
   std::vector<std::unique_ptr<VideoEncoder>> encoders(
       kMinSupportedConcurrentEncoders);
   for (size_t i = 0; i < kMinSupportedConcurrentEncoders; ++i)
     encoders[i] = CreateVideoEncoder(g_env->Video(), config);

   for (size_t i = 0; i < kMinSupportedConcurrentEncoders; ++i)
     encoders[i]->Encode();

   for (size_t i = 0; i < kMinSupportedConcurrentEncoders; ++i) {
     EXPECT_TRUE(encoders[i]->WaitForFlushDone());
     EXPECT_EQ(encoders[i]->GetFlushDoneCount(), 1u);
     EXPECT_EQ(encoders[i]->GetFrameReleasedCount(),
               g_env->Video()->NumFrames());
     EXPECT_TRUE(encoders[i]->WaitForBitstreamProcessors());
   }
 }

 TEST_F(VideoEncoderTest, BitrateCheck) {
   if (g_env->SpatialLayers().size() > 1)
     GTEST_SKIP() << "Skip SHMEM input test cases in spatial SVC encoding";

   auto config = GetDefaultConfig();
   config.num_frames_to_encode = kNumFramesToEncodeForBitrateCheck;
   auto encoder = CreateVideoEncoder(g_env->Video(), config);
   // Set longer event timeout than the default (30 sec) because encoding 2160p
   // and validating the stream take much time.
   encoder->SetEventWaitTimeout(kBitrateCheckEventTimeout);

   encoder->Encode();
   EXPECT_TRUE(encoder->WaitForFlushDone());

   EXPECT_EQ(encoder->GetFlushDoneCount(), 1u);
   EXPECT_EQ(encoder->GetFrameReleasedCount(), config.num_frames_to_encode);
   EXPECT_TRUE(encoder->WaitForBitstreamProcessors());
   // TODO(b/181797390): Reconsider bitrate check for VBR encoding if this fails
   // on some boards.
   const double tolerance =
       config.bitrate_allocation.GetMode() == Bitrate::Mode::kConstant
           ? kBitrateTolerance
           : kVariableBitrateTolerance;
   EXPECT_NEAR(encoder->GetStats().Bitrate(),
               config.bitrate_allocation.GetSumBps(),
               tolerance * config.bitrate_allocation.GetSumBps());
 }

 TEST_F(VideoEncoderTest, BitrateCheck_DynamicBitrate) {
   if (g_env->SpatialLayers().size() > 1)
     GTEST_SKIP() << "Skip SHMEM input test cases in spatial SVC encoding";
   if (g_env->BitrateAllocation().GetMode() != Bitrate::Mode::kConstant) {
     GTEST_SKIP()
         << "Skip Dynamic bitrate change checks for non-CBR bitrate mode";
   }

   auto config = GetDefaultConfig();
   config.num_frames_to_encode = kNumFramesToEncodeForBitrateCheck * 2;
   auto encoder = CreateVideoEncoder(g_env->Video(), config);
   // Set longer event timeout than the default (30 sec) because encoding 2160p
   // and validating the stream take much time.
   encoder->SetEventWaitTimeout(kBitrateCheckEventTimeout);

   // Encode the video with the first bitrate.
   const uint32_t first_bitrate = config.bitrate_allocation.GetSumBps();
   encoder->EncodeUntil(VideoEncoder::kFrameReleased,
                        kNumFramesToEncodeForBitrateCheck);
   EXPECT_TRUE(encoder->WaitUntilIdle());
   EXPECT_NEAR(encoder->GetStats().Bitrate(), first_bitrate,
               kBitrateTolerance * first_bitrate);

   // Encode the video with the second bitrate.
   const uint32_t second_bitrate = first_bitrate * 3 / 2;
   encoder->ResetStats();
   encoder->UpdateBitrate(
       AllocateDefaultBitrateForTesting(
           config.num_spatial_layers, config.num_temporal_layers,
           Bitrate::ConstantBitrate(second_bitrate)),
       config.framerate);
   encoder->Encode();
   EXPECT_TRUE(encoder->WaitForFlushDone());
   EXPECT_NEAR(encoder->GetStats().Bitrate(), second_bitrate,
               kBitrateTolerance * second_bitrate);

   EXPECT_EQ(encoder->GetFlushDoneCount(), 1u);
   EXPECT_EQ(encoder->GetFrameReleasedCount(), config.num_frames_to_encode);
   EXPECT_TRUE(encoder->WaitForBitstreamProcessors());
 }

 TEST_F(VideoEncoderTest, BitrateCheck_DynamicFramerate) {
   if (g_env->SpatialLayers().size() > 1)
     GTEST_SKIP() << "Skip SHMEM input test cases in spatial SVC encoding";
   if (g_env->BitrateAllocation().GetMode() != Bitrate::Mode::kConstant) {
     GTEST_SKIP()
         << "Skip dynamic framerate change checks for non-CBR bitrate mode";
   }

   if (auto skip_reason = SupportsDynamicFramerate())
     GTEST_SKIP() << *skip_reason;
   auto config = GetDefaultConfig();
   config.num_frames_to_encode = kNumFramesToEncodeForBitrateCheck * 2;
   auto encoder = CreateVideoEncoder(g_env->Video(), config);
   // Set longer event timeout than the default (30 sec) because encoding 2160p
   // and validating the stream take much time.
   encoder->SetEventWaitTimeout(kBitrateCheckEventTimeout);

   // Encode the video with the first framerate.
   const uint32_t first_framerate = config.framerate;

   encoder->EncodeUntil(VideoEncoder::kFrameReleased,
                        kNumFramesToEncodeForBitrateCheck);
   EXPECT_TRUE(encoder->WaitUntilIdle());
   EXPECT_NEAR(encoder->GetStats().Bitrate(),
               config.bitrate_allocation.GetSumBps(),
               kBitrateTolerance * config.bitrate_allocation.GetSumBps());

   // Encode the video with the second framerate.
   const uint32_t second_framerate = std::max(first_framerate * 2 / 3, 10u);
   encoder->ResetStats();
   encoder->UpdateBitrate(config.bitrate_allocation, second_framerate);
   encoder->Encode();
   EXPECT_TRUE(encoder->WaitForFlushDone());
   EXPECT_NEAR(encoder->GetStats().Bitrate(),
               config.bitrate_allocation.GetSumBps(),
               kBitrateTolerance * config.bitrate_allocation.GetSumBps());

   EXPECT_EQ(encoder->GetFlushDoneCount(), 1u);
   EXPECT_EQ(encoder->GetFrameReleasedCount(), config.num_frames_to_encode);
   EXPECT_TRUE(encoder->WaitForBitstreamProcessors());
 }

 TEST_F(VideoEncoderTest, FlushAtEndOfStream_NV12Dmabuf) {
   if (auto skip_reason = SupportsNV12DmaBufInput())
     GTEST_SKIP() << *skip_reason;

   Video* nv12_video = g_env->GenerateNV12Video();
   VideoEncoderClientConfig config(nv12_video, g_env->Profile(),
                                   g_env->SpatialLayers(),
                                   g_env->BitrateAllocation(), g_env->Reverse());
   config.input_storage_type =
       VideoEncodeAccelerator::Config::StorageType::kGpuMemoryBuffer;

   auto encoder = CreateVideoEncoder(nv12_video, config);

   encoder->Encode();
   EXPECT_TRUE(encoder->WaitForFlushDone());
   EXPECT_EQ(encoder->GetFlushDoneCount(), 1u);
   EXPECT_EQ(encoder->GetFrameReleasedCount(), nv12_video->NumFrames());
   EXPECT_TRUE(encoder->WaitForBitstreamProcessors());
 }

 // Downscaling is required in VideoEncodeAccelerator when zero-copy video
 // capture is enabled. One example is simulcast, camera produces 360p VideoFrame
 // and there are two VideoEncodeAccelerator for 360p and 180p. VideoEncoder for
 // 180p is fed 360p and thus has to perform the scaling from 360p to 180p.
 TEST_F(VideoEncoderTest, FlushAtEndOfStream_NV12DmabufScaling) {
   if (auto skip_reason = SupportsNV12DmaBufInput())
     GTEST_SKIP() << *skip_reason;
   if (g_env->SpatialLayers().size() > 1)
     GTEST_SKIP() << "Skip simulcast test case for spatial SVC encoding";

   constexpr gfx::Size kMinOutputResolution(240, 180);
   const gfx::Size output_resolution =
       gfx::Size(g_env->Video()->Resolution().width() / 2,
                 g_env->Video()->Resolution().height() / 2);
   if (!gfx::Rect(output_resolution).Contains(gfx::Rect(kMinOutputResolution))) {
     GTEST_SKIP() << "Skip test if video resolution is too small, "
                  << "output_resolution=" << output_resolution.ToString()
                  << ", minimum output resolution="
                  << kMinOutputResolution.ToString();
   }

   auto* nv12_video = g_env->GenerateNV12Video();
   // Set 1/4 of the original bitrate because the area of |output_resolution| is
   // 1/4 of the original resolution.
   uint32_t new_target_bitrate = g_env->BitrateAllocation().GetSumBps() / 4;
   // TODO(b/181797390): Reconsider if this peak bitrate is reasonable.
   const Bitrate new_bitrate =
       g_env->BitrateAllocation().GetMode() == Bitrate::Mode::kConstant
           ? Bitrate::ConstantBitrate(new_target_bitrate)
           : Bitrate::VariableBitrate(new_target_bitrate,
                                      new_target_bitrate * 2);

   auto spatial_layers = g_env->SpatialLayers();
   size_t num_temporal_layers = 1u;
   if (!spatial_layers.empty()) {
     CHECK_EQ(spatial_layers.size(), 1u);
     spatial_layers[0].width = output_resolution.width();
     spatial_layers[0].height = output_resolution.height();
     spatial_layers[0].bitrate_bps /= 4;
     num_temporal_layers = spatial_layers[0].num_of_temporal_layers;
   }
   VideoEncoderClientConfig config(
       nv12_video, g_env->Profile(), spatial_layers,
       AllocateDefaultBitrateForTesting(/*num_spatial_layers=*/1u,
                                        num_temporal_layers, new_bitrate),
       g_env->Reverse());
   config.output_resolution = output_resolution;
   config.input_storage_type =
       VideoEncodeAccelerator::Config::StorageType::kGpuMemoryBuffer;

   auto encoder = CreateVideoEncoder(nv12_video, config);
   encoder->Encode();
   EXPECT_TRUE(encoder->WaitForFlushDone());
   EXPECT_EQ(encoder->GetFlushDoneCount(), 1u);
   EXPECT_EQ(encoder->GetFrameReleasedCount(), nv12_video->NumFrames());
   EXPECT_TRUE(encoder->WaitForBitstreamProcessors());
 }

 // Encode VideoFrames with cropping the rectangle (0, 60, size).
 // Cropping is required in VideoEncodeAccelerator when zero-copy video
 // capture is enabled. One example is when 640x360 capture recording is
 // requested, a camera cannot produce the resolution and instead produces
 // 640x480 frames with visible_rect=0, 60, 640x360.
 TEST_F(VideoEncoderTest, FlushAtEndOfStream_NV12DmabufCroppingTopAndBottom) {
   if (auto skip_reason = SupportsNV12DmaBufInput())
     GTEST_SKIP() << *skip_reason;
   constexpr int kGrowHeight = 120;
   const gfx::Size original_resolution = g_env->Video()->Resolution();
   const gfx::Rect expanded_visible_rect(0, kGrowHeight / 2,
                                         original_resolution.width(),
                                         original_resolution.height());
   const gfx::Size expanded_resolution(
       original_resolution.width(), original_resolution.height() + kGrowHeight);
   constexpr gfx::Size kMaxExpandedResolution(1920, 1080);
   if (!gfx::Rect(kMaxExpandedResolution)
            .Contains(gfx::Rect(expanded_resolution))) {
     GTEST_SKIP() << "Expanded video resolution is too large, "
                  << "expanded_resolution=" << expanded_resolution.ToString()
                  << ", maximum expanded resolution="
                  << kMaxExpandedResolution.ToString();
   }

   auto nv12_expanded_video = g_env->GenerateNV12Video()->Expand(
       expanded_resolution, expanded_visible_rect);
   ASSERT_TRUE(nv12_expanded_video);
   VideoEncoderClientConfig config(nv12_expanded_video.get(), g_env->Profile(),
                                   g_env->SpatialLayers(),
                                   g_env->BitrateAllocation(), g_env->Reverse());
   config.output_resolution = original_resolution;
   config.input_storage_type =
       VideoEncodeAccelerator::Config::StorageType::kGpuMemoryBuffer;

   auto encoder = CreateVideoEncoder(nv12_expanded_video.get(), config);
   encoder->Encode();
   EXPECT_TRUE(encoder->WaitForFlushDone());
   EXPECT_EQ(encoder->GetFlushDoneCount(), 1u);
   EXPECT_EQ(encoder->GetFrameReleasedCount(), nv12_expanded_video->NumFrames());
   EXPECT_TRUE(encoder->WaitForBitstreamProcessors());
 }

 // Encode VideoFrames with cropping the rectangle (60, 0, size).
 // Cropping is required in VideoEncodeAccelerator when zero-copy video
 // capture is enabled. One example is when 640x360 capture recording is
 // requested, a camera cannot produce the resolution and instead produces
 // 760x360 frames with visible_rect=60, 0, 640x360.
 TEST_F(VideoEncoderTest, FlushAtEndOfStream_NV12DmabufCroppingRightAndLeft) {
   if (auto skip_reason = SupportsNV12DmaBufInput())
     GTEST_SKIP() << *skip_reason;
   constexpr int kGrowWidth = 120;
   const gfx::Size original_resolution = g_env->Video()->Resolution();
   const gfx::Rect expanded_visible_rect(kGrowWidth / 2, 0,
                                         original_resolution.width(),
                                         original_resolution.height());
   const gfx::Size expanded_resolution(original_resolution.width() + kGrowWidth,
                                       original_resolution.height());
   constexpr gfx::Size kMaxExpandedResolution(1920, 1080);
   if (!gfx::Rect(kMaxExpandedResolution)
            .Contains(gfx::Rect(expanded_resolution))) {
     GTEST_SKIP() << "Expanded video resolution is too large, "
                  << "expanded_resolution=" << expanded_resolution.ToString()
                  << ", maximum expanded resolution="
                  << kMaxExpandedResolution.ToString();
   }

   auto nv12_expanded_video = g_env->GenerateNV12Video()->Expand(
       expanded_resolution, expanded_visible_rect);
   ASSERT_TRUE(nv12_expanded_video);
   VideoEncoderClientConfig config(nv12_expanded_video.get(), g_env->Profile(),
                                   g_env->SpatialLayers(),
                                   g_env->BitrateAllocation(), g_env->Reverse());
   config.output_resolution = original_resolution;
   config.input_storage_type =
       VideoEncodeAccelerator::Config::StorageType::kGpuMemoryBuffer;

   auto encoder = CreateVideoEncoder(nv12_expanded_video.get(), config);
   encoder->Encode();
   EXPECT_TRUE(encoder->WaitForFlushDone());
   EXPECT_EQ(encoder->GetFlushDoneCount(), 1u);
   EXPECT_EQ(encoder->GetFrameReleasedCount(), nv12_expanded_video->NumFrames());
   EXPECT_TRUE(encoder->WaitForBitstreamProcessors());
 }

 // This tests deactivate and activating spatial layers during encoding.
 TEST_F(VideoEncoderTest, DeactivateAndActivateSpatialLayers) {
   if (auto skip_reason = SupportsNV12DmaBufInput())
     GTEST_SKIP() << *skip_reason;

   const auto& spatial_layers = g_env->SpatialLayers();
   if (spatial_layers.size() <= 1)
     GTEST_SKIP() << "Skip (de)activate spatial layers test for simple encoding";

   Video* nv12_video = g_env->GenerateNV12Video();
   const size_t bottom_spatial_idx = 0;
   const size_t top_spatial_idx = spatial_layers.size() - 1;
   auto deactivate_spatial_layer =
       [](VideoBitrateAllocation bitrate_allocation,
          size_t deactivate_sid) -> VideoBitrateAllocation {
     for (size_t i = 0; i < VideoBitrateAllocation::kMaxTemporalLayers; ++i)
       bitrate_allocation.SetBitrate(deactivate_sid, i, 0u);
     return bitrate_allocation;
   };

   const auto& default_allocation = g_env->BitrateAllocation();
   std::vector<VideoBitrateAllocation> bitrate_allocations;

   // Deactivate the top layer.
   bitrate_allocations.emplace_back(
       deactivate_spatial_layer(default_allocation, top_spatial_idx));

   // Activate the top layer.
   bitrate_allocations.emplace_back(default_allocation);

   // Deactivate the bottom layer (and top layer if there is still a spatial
   // layer).
   auto bitrate_allocation =
       deactivate_spatial_layer(default_allocation, bottom_spatial_idx);
   if (bottom_spatial_idx + 1 < top_spatial_idx) {
     bitrate_allocation =
         deactivate_spatial_layer(bitrate_allocation, top_spatial_idx);
   }
   bitrate_allocations.emplace_back(bitrate_allocation);

   // Deactivate the layers except bottom layer.
   bitrate_allocation = default_allocation;
   for (size_t i = bottom_spatial_idx + 1; i < spatial_layers.size(); ++i)
     bitrate_allocation = deactivate_spatial_layer(bitrate_allocation, i);
   bitrate_allocations.emplace_back(bitrate_allocation);

   VideoEncoderClientConfig config(nv12_video, g_env->Profile(),
                                   g_env->SpatialLayers(),
                                   g_env->BitrateAllocation(), g_env->Reverse());
   config.input_storage_type =
       VideoEncodeAccelerator::Config::StorageType::kGpuMemoryBuffer;
   std::vector<size_t> num_frames_to_encode(bitrate_allocations.size());
   for (size_t i = 0; i < num_frames_to_encode.size(); ++i)
     num_frames_to_encode[i] = config.num_frames_to_encode * (i + 1);
   config.num_frames_to_encode =
       num_frames_to_encode.back() + config.num_frames_to_encode;

   auto encoder = CreateVideoEncoder(nv12_video, config);

   for (size_t i = 0; i < bitrate_allocations.size(); ++i) {
     encoder->EncodeUntil(VideoEncoder::kFrameReleased, num_frames_to_encode[i]);
     EXPECT_TRUE(encoder->WaitUntilIdle());
     encoder->UpdateBitrate(bitrate_allocations[i], config.framerate);
   }

   encoder->Encode();
   EXPECT_TRUE(encoder->WaitForFlushDone());
   EXPECT_EQ(encoder->GetFlushDoneCount(), 1u);
   EXPECT_EQ(encoder->GetFrameReleasedCount(), config.num_frames_to_encode);
   EXPECT_TRUE(encoder->WaitForBitstreamProcessors());
 }

 }  // namespace test
 }  // namespace media

 int main(int argc, char** argv) {
   // Set the default test data path.
   media::test::Video::SetTestDataPath(media::GetTestDataPath());

   // Print the help message if requested. This needs to be done before
   // initializing gtest, to overwrite the default gtest help message.
   base::CommandLine::Init(argc, argv);
   const base::CommandLine* cmd_line = base::CommandLine::ForCurrentProcess();
   LOG_ASSERT(cmd_line);
   if (cmd_line->HasSwitch("help")) {
     std::cout << media::test::usage_msg << "\n" << media::test::help_msg;
     return 0;
   }

   // Check if a video was specified on the command line.
   base::CommandLine::StringVector args = cmd_line->GetArgs();
   base::FilePath video_path =
       (args.size() >= 1) ? base::FilePath(args[0])
                          : base::FilePath(media::test::kDefaultTestVideoPath);
   base::FilePath video_metadata_path =
       (args.size() >= 2) ? base::FilePath(args[1]) : base::FilePath();
   std::string codec = "h264";
   size_t num_temporal_layers = 1u;
   size_t num_spatial_layers = 1u;
   bool output_bitstream = false;
   absl::optional<uint32_t> output_bitrate;
   bool reverse = false;
   media::Bitrate::Mode bitrate_mode = media::Bitrate::Mode::kConstant;
   media::test::FrameOutputConfig frame_output_config;
   base::FilePath output_folder =
       base::FilePath(base::FilePath::kCurrentDirectory);
   std::vector<base::test::FeatureRef> disabled_features;

   // Parse command line arguments.
   bool enable_bitstream_validator = true;
   base::CommandLine::SwitchMap switches = cmd_line->GetSwitches();
   for (base::CommandLine::SwitchMap::const_iterator it = switches.begin();
        it != switches.end(); ++it) {
     if (it->first.find("gtest_") == 0 ||               // Handled by GoogleTest
         it->first == "v" || it->first == "vmodule") {  // Handled by Chrome
       continue;
     }

     if (it->first == "codec") {
       codec = it->second;
     } else if (it->first == "num_temporal_layers") {
       if (!base::StringToSizeT(it->second, &num_temporal_layers)) {
         std::cout << "invalid number of temporal layers: " << it->second
                   << "\n";
         return EXIT_FAILURE;
       }
     } else if (it->first == "num_spatial_layers") {
       if (!base::StringToSizeT(it->second, &num_spatial_layers)) {
         std::cout << "invalid number of spatial layers: " << it->second << "\n";
         return EXIT_FAILURE;
       }
     } else if (it->first == "bitrate_mode") {
       if (it->second == "vbr") {
         bitrate_mode = media::Bitrate::Mode::kVariable;
       } else if (it->second != "cbr") {
         std::cout << "unknown bitrate mode \"" << it->second
                   << "\", possible values are \"cbr|vbr\"\n";
         return EXIT_FAILURE;
       }
     } else if (it->first == "disable_validator") {
       enable_bitstream_validator = false;
     } else if (it->first == "output_bitstream") {
       output_bitstream = true;
     } else if (it->first == "bitrate") {
       unsigned value;
       if (!base::StringToUint(it->second, &value)) {
         std::cout << "invalid bitrate " << it->second << "\n"
                   << media::test::usage_msg;
         return EXIT_FAILURE;
       }
       output_bitrate = base::checked_cast<uint32_t>(value);
     } else if (it->first == "reverse") {
       reverse = true;
     } else if (it->first == "output_images") {
       if (it->second == "all") {
         frame_output_config.output_mode = media::test::FrameOutputMode::kAll;
       } else if (it->second == "corrupt") {
         frame_output_config.output_mode =
             media::test::FrameOutputMode::kCorrupt;
       } else {
         std::cout << "unknown image output mode \"" << it->second
                   << "\", possible values are \"all|corrupt\"\n";
         return EXIT_FAILURE;
       }
     } else if (it->first == "output_format") {
       if (it->second == "png") {
         frame_output_config.output_format =
             media::test::VideoFrameFileWriter::OutputFormat::kPNG;
       } else if (it->second == "yuv") {
         frame_output_config.output_format =
             media::test::VideoFrameFileWriter::OutputFormat::kYUV;
       } else {
         std::cout << "unknown frame output format \"" << it->second
                   << "\", possible values are \"png|yuv\"\n";
         return EXIT_FAILURE;
       }
     } else if (it->first == "output_limit") {
       if (!base::StringToUint64(it->second,
                                 &frame_output_config.output_limit)) {
         std::cout << "invalid number \"" << it->second << "\n";
         return EXIT_FAILURE;
       }
     } else if (it->first == "output_folder") {
       output_folder = base::FilePath(it->second);
     } else if (it->first == "disable_vaapi_lock") {
       disabled_features.push_back(media::kGlobalVaapiLock);
     } else {
       std::cout << "unknown option: --" << it->first << "\n"
                 << media::test::usage_msg;
       return EXIT_FAILURE;
     }
   }

   testing::InitGoogleTest(&argc, argv);

   // Set up our test environment.
   media::test::VideoEncoderTestEnvironment* test_environment =
       media::test::VideoEncoderTestEnvironment::Create(
           video_path, video_metadata_path, enable_bitstream_validator,
           output_folder, codec, num_temporal_layers, num_spatial_layers,
           output_bitstream, output_bitrate, bitrate_mode, reverse,
           frame_output_config,
           /*enabled_features=*/{}, disabled_features);

   if (!test_environment)
     return EXIT_FAILURE;

   media::test::g_env = static_cast<media::test::VideoEncoderTestEnvironment*>(
       testing::AddGlobalTestEnvironment(test_environment));

   return RUN_ALL_TESTS();
 }