media/gpu/windows/media_foundation_video_encode_accelerator_win.h - cobalt - Git at Google

 // Copyright 2016 The Chromium Authors
 // Use of this source code is governed by a BSD-style license that can be
 // found in the LICENSE file.

 #ifndef MEDIA_GPU_WINDOWS_MEDIA_FOUNDATION_VIDEO_ENCODE_ACCELERATOR_WIN_H_
 #define MEDIA_GPU_WINDOWS_MEDIA_FOUNDATION_VIDEO_ENCODE_ACCELERATOR_WIN_H_

 #include <mfapi.h>
 #include <mfidl.h>
 #include <stdint.h>
 #include <strmif.h>
 #include <wrl/client.h>

 #include <memory>

 #include "base/atomic_ref_count.h"
 #include "base/containers/circular_deque.h"
 #include "base/functional/bind.h"
 #include "base/memory/raw_ptr.h"
 #include "base/memory/weak_ptr.h"
 #include "base/synchronization/lock.h"
 #include "base/task/sequenced_task_runner.h"
 #include "base/task/single_thread_task_runner.h"
 #include "base/threading/thread.h"
 #include "base/win/shlwapi.h"
 #include "base/win/windows_types.h"
 #include "gpu/config/gpu_driver_bug_workarounds.h"
 #include "gpu/config/gpu_preferences.h"
 #include "media/base/bitrate.h"
 #include "media/base/video_codecs.h"
 #include "media/base/video_encoder.h"
 #include "media/base/win/dxgi_device_manager.h"
 #include "media/gpu/media_gpu_export.h"
 #include "media/video/h264_parser.h"
 #if BUILDFLAG(ENABLE_PLATFORM_HEVC)
 #include "media/video/h265_nalu_parser.h"
 #endif
 #include "media/video/video_encode_accelerator.h"

 namespace media {

 class VideoRateControlWrapper;

 // Media Foundation implementation of the VideoEncodeAccelerator interface for
 // Windows.
 // This class saves the task runner on which it is constructed and runs client
 // callbacks using that same task runner.
 // This class has DCHECKs to makes sure that methods are called in the
 // correct task runners. It starts an internal encoder thread on which
 // VideoEncodeAccelerator implementation tasks are posted.
 class MEDIA_GPU_EXPORT MediaFoundationVideoEncodeAccelerator
     : public VideoEncodeAccelerator,
       public IMFAsyncCallback {
  public:
   explicit MediaFoundationVideoEncodeAccelerator(
       const gpu::GpuPreferences& gpu_preferences,
       const gpu::GpuDriverBugWorkarounds& gpu_workarounds,
       CHROME_LUID luid);

   MediaFoundationVideoEncodeAccelerator(
       const MediaFoundationVideoEncodeAccelerator&) = delete;
   MediaFoundationVideoEncodeAccelerator& operator=(
       const MediaFoundationVideoEncodeAccelerator&) = delete;

   // VideoEncodeAccelerator implementation.
   VideoEncodeAccelerator::SupportedProfiles GetSupportedProfiles() override;
   bool Initialize(const Config& config,
                   Client* client,
                   std::unique_ptr<MediaLog> media_log) override;
   void Encode(scoped_refptr<VideoFrame> frame, bool force_keyframe) override;
   void UseOutputBitstreamBuffer(BitstreamBuffer buffer) override;
   void RequestEncodingParametersChange(const Bitrate& bitrate,
                                        uint32_t framerate) override;
   void RequestEncodingParametersChange(
       const VideoBitrateAllocation& bitrate_allocation,
       uint32_t framerate) override;
   void Destroy() override;
   void Flush(FlushCallback flush_callback) override;
   bool IsFlushSupported() override;
   bool IsGpuFrameResizeSupported() override;

   // IMFAsyncCallback implementation
   IFACEMETHODIMP GetParameters(DWORD* pdwFlags, DWORD* pdwQueue) override;
   IFACEMETHODIMP Invoke(IMFAsyncResult* pAsyncResult) override;
   IFACEMETHODIMP_(ULONG) AddRef() override;
   IFACEMETHODIMP_(ULONG) Release() override;
   IFACEMETHODIMP QueryInterface(REFIID riid, void** ppv) override;

   enum class DriverVendor { kOther, kNvidia, kIntel, kAMD };

  protected:
   ~MediaFoundationVideoEncodeAccelerator() override;

  private:
   // Holds output buffers coming from the client ready to be filled.
   struct BitstreamBufferRef;

   // Holds output buffers coming from the encoder.
   class EncodeOutput;

   // Pending encode input.
   using PendingInput = VideoEncoder::PendingEncode;

   // Encoder state.
   enum State {
     kUninitialized,
     kInitializing,
     kEncoding,
     // We wait to feed all pending frames from `pending_input_queue_`
     // before telling MF encoder to drain.
     kPreFlushing,
     // We issued a drain message to the MF encoder want wait for the drain
     // to complete.
     kFlushing,
     kError,
   };

   // Get supported profiles for specific codec.
   VideoEncodeAccelerator::SupportedProfiles GetSupportedProfilesForCodec(
       VideoCodec codec);

   // Activates the asynchronous encoder instance |encoder_| according to codec
   // merit.
   bool ActivateAsyncEncoder(IMFActivate** pp_activates,
                             uint32_t activate_count,
                             bool is_constrained_h264);

   // Initializes and allocates memory for input and output parameters.
   bool InitializeInputOutputParameters(VideoCodecProfile output_profile,
                                        bool is_constrained_h264);

   // Initializes encoder parameters for real-time use.
   bool SetEncoderModes();

   // Helper function to notify the client of an error status. This also sets
   // the state to kError.
   void NotifyErrorStatus(EncoderStatus status);

   // Set the encoder state to |state|.
   void SetState(State state);

   // Processes the input video frame for the encoder.
   HRESULT ProcessInput(const PendingInput& input);

   // Feed as many frames from |pending_input_queue_| to ProcessInput()
   // as possible.
   void FeedInputs();

   // Populates input sample buffer with contents of a video frame
   HRESULT PopulateInputSampleBuffer(const PendingInput& input);
   HRESULT PopulateInputSampleBufferGpu(scoped_refptr<VideoFrame> frame);
   HRESULT CopyInputSampleBufferFromGpu(const VideoFrame& frame);

   // Assign TemporalID by bitstream or external state machine(based on SVC
   // Spec).
   bool AssignTemporalId(Microsoft::WRL::ComPtr<IMFMediaBuffer> output_buffer,
                         size_t size,
                         int* temporal_id,
                         bool keyframe);

   int AssignTemporalIdBySvcSpec(bool keyframe);

   bool temporal_scalable_coding() const { return num_temporal_layers_ > 1; }

   // Checks for and copies encoded output.
   void ProcessOutput();

   // Asynchronous event handler
   void MediaEventHandler(MediaEventType event_type, HRESULT status);

   // Sends MFT_MESSAGE_COMMAND_DRAIN to the encoder to make it
   // process all inputs, produce all outputs and tell us when it's done.
   void DrainEncoder();

   // Initialize video processing (for scaling)
   HRESULT InitializeD3DVideoProcessing(ID3D11Texture2D* input_texture);

   // Perform D3D11 scaling operation
   HRESULT PerformD3DScaling(ID3D11Texture2D* input_texture);

   // Used to post tasks from the IMFMediaEvent::Invoke() method.
   scoped_refptr<base::SingleThreadTaskRunner> task_runner_;

   std::unique_ptr<MediaLog> media_log_;

   // Bitstream buffers ready to be used to return encoded output as a FIFO.
   base::circular_deque<std::unique_ptr<BitstreamBufferRef>>
       bitstream_buffer_queue_;

   // Input frame queue for encoding on next METransformNeedInput event.
   base::circular_deque<PendingInput> pending_input_queue_;

   // EncodeOutput needs to be copied into a BitstreamBufferRef as a FIFO.
   base::circular_deque<std::unique_ptr<EncodeOutput>> encoder_output_queue_;

   // Counter of outputs which is used to assign temporal layer indexes
   // according to the corresponding layer pattern. Reset for every key frame.
   uint32_t outputs_since_keyframe_count_ = 0;

   // Encoder state. Encode tasks will only run in kEncoding state.
   State state_ = kUninitialized;

   // This parser is used to assign temporalId.
   H264Parser h264_parser_;
 #if BUILDFLAG(ENABLE_PLATFORM_HEVC)
   H265NaluParser h265_nalu_parser_;
 #endif

   gfx::Size input_visible_size_;
   size_t bitstream_buffer_size_ = 0u;
   uint32_t frame_rate_ = 30;
   // For recording configured frame rate as we don't dynamically change it.
   // The default value here will be overridden during initialization.
   uint32_t configured_frame_rate_ = 30;
   // Bitrate allocation in bps.
   VideoBitrateAllocation bitrate_allocation_{Bitrate::Mode::kConstant};
   bool low_latency_mode_ = false;
   int num_temporal_layers_ = 1;

   // Codec type used for encoding.
   VideoCodec codec_ = VideoCodec::kUnknown;

   // Vendor of the active video encoder.
   DriverVendor vendor_ = DriverVendor::kOther;

   // Group of picture length for encoded output stream, indicates the
   // distance between two key frames.
   uint32_t gop_length_ = 0u;

   // Video encoder info that includes accelerator name, QP validity, etc.
   VideoEncoderInfo encoder_info_;
   bool encoder_info_sent_ = false;

   Microsoft::WRL::ComPtr<IMFActivate> activate_;
   Microsoft::WRL::ComPtr<IMFTransform> encoder_;
   Microsoft::WRL::ComPtr<ICodecAPI> codec_api_;
   Microsoft::WRL::ComPtr<IMFMediaEventGenerator> event_generator_;
   base::AtomicRefCount async_callback_ref_{1};

   DWORD input_stream_id_ = 0u;
   DWORD output_stream_id_ = 0u;

   Microsoft::WRL::ComPtr<IMFMediaType> imf_input_media_type_;
   Microsoft::WRL::ComPtr<IMFMediaType> imf_output_media_type_;

   Microsoft::WRL::ComPtr<IMFSample> input_sample_;
   // True if `input_sample_` has been populated with data/metadata
   // of the next frame to be encoded.
   bool has_prepared_input_sample_ = false;

   Microsoft::WRL::ComPtr<IMFSample> output_sample_;
   Microsoft::WRL::ComPtr<ID3D11VideoProcessor> video_processor_;
   Microsoft::WRL::ComPtr<ID3D11VideoProcessorEnumerator>
       video_processor_enumerator_;
   Microsoft::WRL::ComPtr<ID3D11VideoDevice> video_device_;
   Microsoft::WRL::ComPtr<ID3D11VideoContext> video_context_;
   D3D11_VIDEO_PROCESSOR_CONTENT_DESC vp_desc_ = {};
   Microsoft::WRL::ComPtr<ID3D11Texture2D> scaled_d3d11_texture_;
   Microsoft::WRL::ComPtr<ID3D11VideoProcessorOutputView> vp_output_view_;

   // To expose client callbacks from VideoEncodeAccelerator.
   raw_ptr<Client> client_ = nullptr;
   SEQUENCE_CHECKER(sequence_checker_);

   // DXGI device manager for handling hardware input textures
   scoped_refptr<DXGIDeviceManager> dxgi_device_manager_;
   // Mapping of dxgi resource needed when HMFT rejects setting D3D11 manager.
   bool dxgi_resource_mapping_required_ = false;
   // Staging texture for copying from GPU memory if HMFT does not operate in
   // D3D11 mode.
   Microsoft::WRL::ComPtr<ID3D11Texture2D> staging_texture_;

   // Preferred adapter for DXGIDeviceManager.
   const CHROME_LUID luid_;

   // A buffer used as a scratch space for I420 to NV12 conversion
   std::vector<uint8_t> resize_buffer_;

   FlushCallback flush_callback_;

   // Bitrate controller for CBR encoding.
   std::unique_ptr<VideoRateControlWrapper> rate_ctrl_;

   // Declared last to ensure that all weak pointers are invalidated before
   // other destructors run.
   base::WeakPtr<MediaFoundationVideoEncodeAccelerator> weak_ptr_;
   base::WeakPtrFactory<MediaFoundationVideoEncodeAccelerator> weak_factory_{
       this};
 };

 }  // namespace media

 #endif  // MEDIA_GPU_WINDOWS_MEDIA_FOUNDATION_VIDEO_ENCODE_ACCELERATOR_WIN_H_
	// Copyright 2016 The Chromium Authors
	// Use of this source code is governed by a BSD-style license that can be
	// found in the LICENSE file.

	#ifndef MEDIA_GPU_WINDOWS_MEDIA_FOUNDATION_VIDEO_ENCODE_ACCELERATOR_WIN_H_
	#define MEDIA_GPU_WINDOWS_MEDIA_FOUNDATION_VIDEO_ENCODE_ACCELERATOR_WIN_H_

	#include <mfapi.h>
	#include <mfidl.h>
	#include <stdint.h>
	#include <strmif.h>
	#include <wrl/client.h>

	#include <memory>

	#include "base/atomic_ref_count.h"
	#include "base/containers/circular_deque.h"
	#include "base/functional/bind.h"
	#include "base/memory/raw_ptr.h"
	#include "base/memory/weak_ptr.h"
	#include "base/synchronization/lock.h"
	#include "base/task/sequenced_task_runner.h"
	#include "base/task/single_thread_task_runner.h"
	#include "base/threading/thread.h"
	#include "base/win/shlwapi.h"
	#include "base/win/windows_types.h"
	#include "gpu/config/gpu_driver_bug_workarounds.h"
	#include "gpu/config/gpu_preferences.h"
	#include "media/base/bitrate.h"
	#include "media/base/video_codecs.h"
	#include "media/base/video_encoder.h"
	#include "media/base/win/dxgi_device_manager.h"
	#include "media/gpu/media_gpu_export.h"
	#include "media/video/h264_parser.h"
	#if BUILDFLAG(ENABLE_PLATFORM_HEVC)
	#include "media/video/h265_nalu_parser.h"
	#endif
	#include "media/video/video_encode_accelerator.h"

	namespace media {

	class VideoRateControlWrapper;

	// Media Foundation implementation of the VideoEncodeAccelerator interface for
	// Windows.
	// This class saves the task runner on which it is constructed and runs client
	// callbacks using that same task runner.
	// This class has DCHECKs to makes sure that methods are called in the
	// correct task runners. It starts an internal encoder thread on which
	// VideoEncodeAccelerator implementation tasks are posted.
	class MEDIA_GPU_EXPORT MediaFoundationVideoEncodeAccelerator
	: public VideoEncodeAccelerator,
	public IMFAsyncCallback {
	public:
	explicit MediaFoundationVideoEncodeAccelerator(
	const gpu::GpuPreferences& gpu_preferences,
	const gpu::GpuDriverBugWorkarounds& gpu_workarounds,
	CHROME_LUID luid);

	MediaFoundationVideoEncodeAccelerator(
	const MediaFoundationVideoEncodeAccelerator&) = delete;
	MediaFoundationVideoEncodeAccelerator& operator=(
	const MediaFoundationVideoEncodeAccelerator&) = delete;

	// VideoEncodeAccelerator implementation.
	VideoEncodeAccelerator::SupportedProfiles GetSupportedProfiles() override;
	bool Initialize(const Config& config,
	Client* client,
	std::unique_ptr<MediaLog> media_log) override;
	void Encode(scoped_refptr<VideoFrame> frame, bool force_keyframe) override;
	void UseOutputBitstreamBuffer(BitstreamBuffer buffer) override;
	void RequestEncodingParametersChange(const Bitrate& bitrate,
	uint32_t framerate) override;
	void RequestEncodingParametersChange(
	const VideoBitrateAllocation& bitrate_allocation,
	uint32_t framerate) override;
	void Destroy() override;
	void Flush(FlushCallback flush_callback) override;
	bool IsFlushSupported() override;
	bool IsGpuFrameResizeSupported() override;

	// IMFAsyncCallback implementation
	IFACEMETHODIMP GetParameters(DWORD* pdwFlags, DWORD* pdwQueue) override;
	IFACEMETHODIMP Invoke(IMFAsyncResult* pAsyncResult) override;
	IFACEMETHODIMP_(ULONG) AddRef() override;
	IFACEMETHODIMP_(ULONG) Release() override;
	IFACEMETHODIMP QueryInterface(REFIID riid, void** ppv) override;

	enum class DriverVendor { kOther, kNvidia, kIntel, kAMD };

	protected:
	~MediaFoundationVideoEncodeAccelerator() override;

	private:
	// Holds output buffers coming from the client ready to be filled.
	struct BitstreamBufferRef;

	// Holds output buffers coming from the encoder.
	class EncodeOutput;

	// Pending encode input.
	using PendingInput = VideoEncoder::PendingEncode;

	// Encoder state.
	enum State {
	kUninitialized,
	kInitializing,
	kEncoding,
	// We wait to feed all pending frames from `pending_input_queue_`
	// before telling MF encoder to drain.
	kPreFlushing,
	// We issued a drain message to the MF encoder want wait for the drain
	// to complete.
	kFlushing,
	kError,
	};

	// Get supported profiles for specific codec.
	VideoEncodeAccelerator::SupportedProfiles GetSupportedProfilesForCodec(
	VideoCodec codec);

	// Activates the asynchronous encoder instance \|encoder_\| according to codec
	// merit.
	bool ActivateAsyncEncoder(IMFActivate** pp_activates,
	uint32_t activate_count,
	bool is_constrained_h264);

	// Initializes and allocates memory for input and output parameters.
	bool InitializeInputOutputParameters(VideoCodecProfile output_profile,
	bool is_constrained_h264);

	// Initializes encoder parameters for real-time use.
	bool SetEncoderModes();

	// Helper function to notify the client of an error status. This also sets
	// the state to kError.
	void NotifyErrorStatus(EncoderStatus status);

	// Set the encoder state to \|state\|.
	void SetState(State state);

	// Processes the input video frame for the encoder.
	HRESULT ProcessInput(const PendingInput& input);

	// Feed as many frames from \|pending_input_queue_\| to ProcessInput()
	// as possible.
	void FeedInputs();

	// Populates input sample buffer with contents of a video frame
	HRESULT PopulateInputSampleBuffer(const PendingInput& input);
	HRESULT PopulateInputSampleBufferGpu(scoped_refptr<VideoFrame> frame);
	HRESULT CopyInputSampleBufferFromGpu(const VideoFrame& frame);

	// Assign TemporalID by bitstream or external state machine(based on SVC
	// Spec).
	bool AssignTemporalId(Microsoft::WRL::ComPtr<IMFMediaBuffer> output_buffer,
	size_t size,
	int* temporal_id,
	bool keyframe);

	int AssignTemporalIdBySvcSpec(bool keyframe);

	bool temporal_scalable_coding() const { return num_temporal_layers_ > 1; }

	// Checks for and copies encoded output.
	void ProcessOutput();

	// Asynchronous event handler
	void MediaEventHandler(MediaEventType event_type, HRESULT status);

	// Sends MFT_MESSAGE_COMMAND_DRAIN to the encoder to make it
	// process all inputs, produce all outputs and tell us when it's done.
	void DrainEncoder();

	// Initialize video processing (for scaling)
	HRESULT InitializeD3DVideoProcessing(ID3D11Texture2D* input_texture);

	// Perform D3D11 scaling operation
	HRESULT PerformD3DScaling(ID3D11Texture2D* input_texture);

	// Used to post tasks from the IMFMediaEvent::Invoke() method.
	scoped_refptr<base::SingleThreadTaskRunner> task_runner_;

	std::unique_ptr<MediaLog> media_log_;

	// Bitstream buffers ready to be used to return encoded output as a FIFO.
	base::circular_deque<std::unique_ptr<BitstreamBufferRef>>
	bitstream_buffer_queue_;

	// Input frame queue for encoding on next METransformNeedInput event.
	base::circular_deque<PendingInput> pending_input_queue_;

	// EncodeOutput needs to be copied into a BitstreamBufferRef as a FIFO.
	base::circular_deque<std::unique_ptr<EncodeOutput>> encoder_output_queue_;

	// Counter of outputs which is used to assign temporal layer indexes
	// according to the corresponding layer pattern. Reset for every key frame.
	uint32_t outputs_since_keyframe_count_ = 0;

	// Encoder state. Encode tasks will only run in kEncoding state.
	State state_ = kUninitialized;

	// This parser is used to assign temporalId.
	H264Parser h264_parser_;
	#if BUILDFLAG(ENABLE_PLATFORM_HEVC)
	H265NaluParser h265_nalu_parser_;
	#endif

	gfx::Size input_visible_size_;
	size_t bitstream_buffer_size_ = 0u;
	uint32_t frame_rate_ = 30;
	// For recording configured frame rate as we don't dynamically change it.
	// The default value here will be overridden during initialization.
	uint32_t configured_frame_rate_ = 30;
	// Bitrate allocation in bps.
	VideoBitrateAllocation bitrate_allocation_{Bitrate::Mode::kConstant};
	bool low_latency_mode_ = false;
	int num_temporal_layers_ = 1;

	// Codec type used for encoding.
	VideoCodec codec_ = VideoCodec::kUnknown;

	// Vendor of the active video encoder.
	DriverVendor vendor_ = DriverVendor::kOther;

	// Group of picture length for encoded output stream, indicates the
	// distance between two key frames.
	uint32_t gop_length_ = 0u;

	// Video encoder info that includes accelerator name, QP validity, etc.
	VideoEncoderInfo encoder_info_;
	bool encoder_info_sent_ = false;

	Microsoft::WRL::ComPtr<IMFActivate> activate_;
	Microsoft::WRL::ComPtr<IMFTransform> encoder_;
	Microsoft::WRL::ComPtr<ICodecAPI> codec_api_;
	Microsoft::WRL::ComPtr<IMFMediaEventGenerator> event_generator_;
	base::AtomicRefCount async_callback_ref_{1};

	DWORD input_stream_id_ = 0u;
	DWORD output_stream_id_ = 0u;

	Microsoft::WRL::ComPtr<IMFMediaType> imf_input_media_type_;
	Microsoft::WRL::ComPtr<IMFMediaType> imf_output_media_type_;

	Microsoft::WRL::ComPtr<IMFSample> input_sample_;
	// True if `input_sample_` has been populated with data/metadata
	// of the next frame to be encoded.
	bool has_prepared_input_sample_ = false;

	Microsoft::WRL::ComPtr<IMFSample> output_sample_;
	Microsoft::WRL::ComPtr<ID3D11VideoProcessor> video_processor_;
	Microsoft::WRL::ComPtr<ID3D11VideoProcessorEnumerator>
	video_processor_enumerator_;
	Microsoft::WRL::ComPtr<ID3D11VideoDevice> video_device_;
	Microsoft::WRL::ComPtr<ID3D11VideoContext> video_context_;
	D3D11_VIDEO_PROCESSOR_CONTENT_DESC vp_desc_ = {};
	Microsoft::WRL::ComPtr<ID3D11Texture2D> scaled_d3d11_texture_;
	Microsoft::WRL::ComPtr<ID3D11VideoProcessorOutputView> vp_output_view_;

	// To expose client callbacks from VideoEncodeAccelerator.
	raw_ptr<Client> client_ = nullptr;
	SEQUENCE_CHECKER(sequence_checker_);

	// DXGI device manager for handling hardware input textures
	scoped_refptr<DXGIDeviceManager> dxgi_device_manager_;
	// Mapping of dxgi resource needed when HMFT rejects setting D3D11 manager.
	bool dxgi_resource_mapping_required_ = false;
	// Staging texture for copying from GPU memory if HMFT does not operate in
	// D3D11 mode.
	Microsoft::WRL::ComPtr<ID3D11Texture2D> staging_texture_;

	// Preferred adapter for DXGIDeviceManager.
	const CHROME_LUID luid_;

	// A buffer used as a scratch space for I420 to NV12 conversion
	std::vector<uint8_t> resize_buffer_;

	FlushCallback flush_callback_;

	// Bitrate controller for CBR encoding.
	std::unique_ptr<VideoRateControlWrapper> rate_ctrl_;

	// Declared last to ensure that all weak pointers are invalidated before
	// other destructors run.
	base::WeakPtr<MediaFoundationVideoEncodeAccelerator> weak_ptr_;
	base::WeakPtrFactory<MediaFoundationVideoEncodeAccelerator> weak_factory_{
	this};
	};

	} // namespace media

	#endif // MEDIA_GPU_WINDOWS_MEDIA_FOUNDATION_VIDEO_ENCODE_ACCELERATOR_WIN_H_