| // Copyright 2014 The Chromium Authors. All rights reserved. |
| // Use of this source code is governed by a BSD-style license that can be |
| // found in the LICENSE file. |
| |
| #include "media/gpu/v4l2/v4l2_video_decode_accelerator.h" |
| |
| #include <dlfcn.h> |
| #include <errno.h> |
| #include <fcntl.h> |
| #include <linux/videodev2.h> |
| #include <poll.h> |
| #include <string.h> |
| #include <sys/eventfd.h> |
| #include <sys/ioctl.h> |
| #include <sys/mman.h> |
| |
| #include "base/bind.h" |
| #include "base/callback_helpers.h" |
| #include "base/command_line.h" |
| #include "base/cxx17_backports.h" |
| #include "base/numerics/safe_conversions.h" |
| #include "base/posix/eintr_wrapper.h" |
| #include "base/single_thread_task_runner.h" |
| #include "base/strings/stringprintf.h" |
| #include "base/threading/thread_task_runner_handle.h" |
| #include "base/time/time.h" |
| #include "base/trace_event/memory_dump_manager.h" |
| #include "base/trace_event/trace_event.h" |
| #include "build/build_config.h" |
| #include "media/base/media_switches.h" |
| #include "media/base/scopedfd_helper.h" |
| #include "media/base/unaligned_shared_memory.h" |
| #include "media/base/video_frame_layout.h" |
| #include "media/base/video_types.h" |
| #include "media/gpu/chromeos/fourcc.h" |
| #include "media/gpu/chromeos/platform_video_frame_utils.h" |
| #include "media/gpu/macros.h" |
| #include "media/gpu/v4l2/v4l2_image_processor_backend.h" |
| #include "media/gpu/v4l2/v4l2_stateful_workaround.h" |
| #include "media/gpu/v4l2/v4l2_utils.h" |
| #include "media/gpu/v4l2/v4l2_vda_helpers.h" |
| #include "ui/gfx/geometry/rect.h" |
| #include "ui/gfx/native_pixmap_handle.h" |
| #include "ui/gl/gl_context.h" |
| #include "ui/gl/scoped_binders.h" |
| |
// Logs |x| at verbosity level 1 and then hands it to SetErrorState(). |x| is
// expanded twice, so pass a side-effect-free expression.
#define NOTIFY_ERROR(x)                      \
  do {                                       \
    VLOGF(1) << "Setting error state:" << x; \
    SetErrorState(x);                        \
  } while (0)

// Issues ioctl |type| with |arg| on |device_|. When the call returns non-zero,
// logs |type_str| through PLOG, enters the PLATFORM_FAILURE error state and
// returns |value| from the enclosing function.
#define IOCTL_OR_ERROR_RETURN_VALUE(type, arg, value, type_str) \
  do {                                                          \
    if (device_->Ioctl(type, arg) != 0) {                       \
      PLOG(ERROR) << "ioctl() failed: " << type_str;            \
      NOTIFY_ERROR(PLATFORM_FAILURE);                           \
      return value;                                             \
    }                                                           \
  } while (0)

// Variant of IOCTL_OR_ERROR_RETURN_VALUE for functions returning void.
#define IOCTL_OR_ERROR_RETURN(type, arg) \
  IOCTL_OR_ERROR_RETURN_VALUE(type, arg, ((void)0), #type)

// Variant of IOCTL_OR_ERROR_RETURN_VALUE for functions returning bool; the
// enclosing function returns false on failure.
#define IOCTL_OR_ERROR_RETURN_FALSE(type, arg) \
  IOCTL_OR_ERROR_RETURN_VALUE(type, arg, false, #type)

// Issues ioctl |type| with |arg| on |device_| and only logs a failure; the
// decoder state is left untouched and the enclosing function keeps running.
#define IOCTL_OR_LOG_ERROR(type, arg)           \
  do {                                          \
    if (device_->Ioctl(type, arg) != 0) {       \
      VPLOGF(1) << "ioctl() failed: " << #type; \
    }                                           \
  } while (0)
| |
| namespace media { |
| |
| // static |
| const uint32_t V4L2VideoDecodeAccelerator::supported_input_fourccs_[] = { |
| V4L2_PIX_FMT_H264, V4L2_PIX_FMT_VP8, V4L2_PIX_FMT_VP9, |
| }; |
| |
| // static |
| base::AtomicRefCount V4L2VideoDecodeAccelerator::num_instances_(0); |
| |
| struct V4L2VideoDecodeAccelerator::BitstreamBufferRef { |
| BitstreamBufferRef( |
| base::WeakPtr<Client>& client, |
| scoped_refptr<base::SingleThreadTaskRunner>& client_task_runner, |
| scoped_refptr<DecoderBuffer> buffer, |
| int32_t input_id); |
| ~BitstreamBufferRef(); |
| |
| const base::WeakPtr<Client> client; |
| const scoped_refptr<base::SingleThreadTaskRunner> client_task_runner; |
| scoped_refptr<DecoderBuffer> buffer; |
| size_t bytes_used; |
| const int32_t input_id; |
| }; |
| |
| V4L2VideoDecodeAccelerator::BitstreamBufferRef::BitstreamBufferRef( |
| base::WeakPtr<Client>& client, |
| scoped_refptr<base::SingleThreadTaskRunner>& client_task_runner, |
| scoped_refptr<DecoderBuffer> buffer, |
| int32_t input_id) |
| : client(client), |
| client_task_runner(client_task_runner), |
| buffer(std::move(buffer)), |
| bytes_used(0), |
| input_id(input_id) {} |
| |
| V4L2VideoDecodeAccelerator::BitstreamBufferRef::~BitstreamBufferRef() { |
| if (input_id >= 0) { |
| client_task_runner->PostTask( |
| FROM_HERE, |
| base::BindOnce(&Client::NotifyEndOfBitstreamBuffer, client, input_id)); |
| } |
| } |
| |
| V4L2VideoDecodeAccelerator::OutputRecord::OutputRecord() |
| : egl_image(EGL_NO_IMAGE_KHR), |
| picture_id(-1), |
| texture_id(0), |
| cleared(false) {} |
| |
| V4L2VideoDecodeAccelerator::OutputRecord::OutputRecord(OutputRecord&&) = |
| default; |
| |
| V4L2VideoDecodeAccelerator::OutputRecord::~OutputRecord() {} |
| |
| V4L2VideoDecodeAccelerator::PictureRecord::PictureRecord(bool cleared, |
| const Picture& picture) |
| : cleared(cleared), picture(picture) {} |
| |
| V4L2VideoDecodeAccelerator::PictureRecord::~PictureRecord() {} |
| |
| V4L2VideoDecodeAccelerator::V4L2VideoDecodeAccelerator( |
| EGLDisplay egl_display, |
| const GetGLContextCallback& get_gl_context_cb, |
| const MakeGLContextCurrentCallback& make_context_current_cb, |
| scoped_refptr<V4L2Device> device) |
| : can_use_decoder_(num_instances_.Increment() < kMaxNumOfInstances), |
| child_task_runner_(base::ThreadTaskRunnerHandle::Get()), |
| decoder_thread_("V4L2DecoderThread"), |
| decoder_state_(kUninitialized), |
| output_mode_(Config::OutputMode::ALLOCATE), |
| device_(std::move(device)), |
| decoder_delay_bitstream_buffer_id_(-1), |
| decoder_decode_buffer_tasks_scheduled_(0), |
| decoder_flushing_(false), |
| decoder_cmd_supported_(false), |
| flush_awaiting_last_output_buffer_(false), |
| reset_pending_(false), |
| output_dpb_size_(0), |
| picture_clearing_count_(0), |
| device_poll_thread_("V4L2DevicePollThread"), |
| egl_display_(egl_display), |
| get_gl_context_cb_(get_gl_context_cb), |
| make_context_current_cb_(make_context_current_cb), |
| input_format_fourcc_(0), |
| weak_this_factory_(this) { |
| weak_this_ = weak_this_factory_.GetWeakPtr(); |
| } |
| |
| V4L2VideoDecodeAccelerator::~V4L2VideoDecodeAccelerator() { |
| DCHECK(!decoder_thread_.IsRunning()); |
| DCHECK(!device_poll_thread_.IsRunning()); |
| DVLOGF(2); |
| |
| // These maps have members that should be manually destroyed, e.g. file |
| // descriptors, mmap() segments, etc. |
| DCHECK(output_buffer_map_.empty()); |
| |
| num_instances_.Decrement(); |
| } |
| |
| bool V4L2VideoDecodeAccelerator::Initialize(const Config& config, |
| Client* client) { |
| VLOGF(2) << "profile: " << config.profile |
| << ", output_mode=" << static_cast<int>(config.output_mode); |
| DCHECK(child_task_runner_->BelongsToCurrentThread()); |
| DCHECK_EQ(decoder_state_, kUninitialized); |
| |
| if (!can_use_decoder_) { |
| VLOGF(1) << "Reached the maximum number of decoder instances"; |
| return false; |
| } |
| |
| if (config.is_encrypted()) { |
| NOTREACHED() << "Encrypted streams are not supported for this VDA"; |
| return false; |
| } |
| |
| if (config.output_mode != Config::OutputMode::ALLOCATE && |
| config.output_mode != Config::OutputMode::IMPORT) { |
| NOTREACHED() << "Only ALLOCATE and IMPORT OutputModes are supported"; |
| return false; |
| } |
| |
| client_ptr_factory_.reset(new base::WeakPtrFactory<Client>(client)); |
| client_ = client_ptr_factory_->GetWeakPtr(); |
| // If we haven't been set up to decode on separate thread via |
| // TryToSetupDecodeOnSeparateThread(), use the main thread/client for |
| // decode tasks. |
| if (!decode_task_runner_) { |
| decode_task_runner_ = child_task_runner_; |
| DCHECK(!decode_client_); |
| decode_client_ = client_; |
| } |
| |
| // We need the context to be initialized to query extensions. |
| if (make_context_current_cb_) { |
| if (egl_display_ == EGL_NO_DISPLAY) { |
| VLOGF(1) << "could not get EGLDisplay"; |
| return false; |
| } |
| |
| if (!make_context_current_cb_.Run()) { |
| VLOGF(1) << "could not make context current"; |
| return false; |
| } |
| |
| // TODO(posciak): https://crbug.com/450898. |
| #if defined(ARCH_CPU_ARMEL) |
| if (!gl::g_driver_egl.ext.b_EGL_KHR_fence_sync) { |
| VLOGF(1) << "context does not have EGL_KHR_fence_sync"; |
| return false; |
| } |
| #endif |
| } else { |
| DVLOGF(2) << "No GL callbacks provided, initializing without GL support"; |
| } |
| |
| decoder_state_ = kInitialized; |
| |
| if (!decoder_thread_.Start()) { |
| LOG(ERROR) << "decoder thread failed to start"; |
| return false; |
| } |
| |
| bool result = false; |
| base::WaitableEvent done; |
| decoder_thread_.task_runner()->PostTask( |
| FROM_HERE, |
| base::BindOnce(&V4L2VideoDecodeAccelerator::InitializeTask, |
| base::Unretained(this), config, &result, &done)); |
| done.Wait(); |
| |
| return result; |
| } |
| |
| void V4L2VideoDecodeAccelerator::InitializeTask(const Config& config, |
| bool* result, |
| base::WaitableEvent* done) { |
| DVLOGF(3); |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| DCHECK_NE(result, nullptr); |
| DCHECK_NE(done, nullptr); |
| DCHECK_EQ(decoder_state_, kInitialized); |
| TRACE_EVENT0("media,gpu", "V4L2VDA::InitializeTask"); |
| |
| // The client can keep going as soon as the configuration is checked. |
| // Store the result to the local value to see the result even after |*result| |
| // is released. |
| bool config_result = CheckConfig(config); |
| *result = config_result; |
| done->Signal(); |
| |
| // No need to keep going is configuration is not supported. |
| if (!config_result) |
| return; |
| |
| frame_splitter_ = |
| v4l2_vda_helpers::InputBufferFragmentSplitter::CreateFromProfile( |
| config.profile); |
| if (!frame_splitter_) { |
| NOTIFY_ERROR(INVALID_ARGUMENT); |
| return; |
| } |
| |
| base::trace_event::MemoryDumpManager::GetInstance()->RegisterDumpProvider( |
| this, "media::V4l2VideoDecodeAccelerator", decoder_thread_.task_runner()); |
| |
| // Subscribe to the resolution change event. |
| struct v4l2_event_subscription sub; |
| memset(&sub, 0, sizeof(sub)); |
| sub.type = V4L2_EVENT_SOURCE_CHANGE; |
| IOCTL_OR_ERROR_RETURN(VIDIOC_SUBSCRIBE_EVENT, &sub); |
| |
| if (!CreateInputBuffers()) { |
| LOG(ERROR) << "Failed CreatingInputBuffers()"; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return; |
| } |
| |
| decoder_cmd_supported_ = IsDecoderCmdSupported(); |
| |
| StartDevicePoll(); |
| } |
| |
| bool V4L2VideoDecodeAccelerator::CheckConfig(const Config& config) { |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| |
| input_format_fourcc_ = |
| V4L2Device::VideoCodecProfileToV4L2PixFmt(config.profile, false); |
| |
| if (!input_format_fourcc_ || |
| !device_->Open(V4L2Device::Type::kDecoder, input_format_fourcc_)) { |
| VLOGF(1) << "Failed to open device for profile: " << config.profile |
| << " fourcc: " << FourccToString(input_format_fourcc_); |
| return false; |
| } |
| |
| // Capabilities check. |
| struct v4l2_capability caps; |
| const __u32 kCapsRequired = V4L2_CAP_VIDEO_M2M_MPLANE | V4L2_CAP_STREAMING; |
| IOCTL_OR_ERROR_RETURN_FALSE(VIDIOC_QUERYCAP, &caps); |
| if ((caps.capabilities & kCapsRequired) != kCapsRequired) { |
| VLOGF(1) << "ioctl() failed: VIDIOC_QUERYCAP" |
| << ", caps check failed: 0x" << std::hex << caps.capabilities; |
| return false; |
| } |
| |
| workarounds_ = |
| CreateV4L2StatefulWorkarounds(V4L2Device::Type::kDecoder, config.profile); |
| |
| output_mode_ = config.output_mode; |
| |
| input_queue_ = device_->GetQueue(V4L2_BUF_TYPE_VIDEO_OUTPUT_MPLANE); |
| if (!input_queue_) |
| return false; |
| |
| output_queue_ = device_->GetQueue(V4L2_BUF_TYPE_VIDEO_CAPTURE_MPLANE); |
| if (!output_queue_) |
| return false; |
| |
| if (!SetupFormats()) |
| return false; |
| |
| // We have confirmed that |config| is supported, tell the good news to the |
| // client. |
| return true; |
| } |
| |
| void V4L2VideoDecodeAccelerator::Decode(BitstreamBuffer bitstream_buffer) { |
| Decode(bitstream_buffer.ToDecoderBuffer(), bitstream_buffer.id()); |
| } |
| |
| void V4L2VideoDecodeAccelerator::Decode(scoped_refptr<DecoderBuffer> buffer, |
| int32_t bitstream_id) { |
| DVLOGF(4) << "input_id=" << bitstream_id |
| << ", size=" << (buffer ? buffer->data_size() : 0); |
| DCHECK(decode_task_runner_->BelongsToCurrentThread()); |
| |
| if (bitstream_id < 0) { |
| LOG(ERROR) << "Invalid bitstream buffer, id: " << bitstream_id; |
| NOTIFY_ERROR(INVALID_ARGUMENT); |
| return; |
| } |
| |
| // DecodeTask() will take care of running a DecodeBufferTask(). |
| decoder_thread_.task_runner()->PostTask( |
| FROM_HERE, |
| base::BindOnce(&V4L2VideoDecodeAccelerator::DecodeTask, |
| base::Unretained(this), std::move(buffer), bitstream_id)); |
| } |
| |
| void V4L2VideoDecodeAccelerator::AssignPictureBuffers( |
| const std::vector<PictureBuffer>& buffers) { |
| VLOGF(2) << "buffer_count=" << buffers.size(); |
| DCHECK(child_task_runner_->BelongsToCurrentThread()); |
| |
| decoder_thread_.task_runner()->PostTask( |
| FROM_HERE, |
| base::BindOnce(&V4L2VideoDecodeAccelerator::AssignPictureBuffersTask, |
| base::Unretained(this), buffers)); |
| } |
| |
| void V4L2VideoDecodeAccelerator::AssignPictureBuffersTask( |
| const std::vector<PictureBuffer>& buffers) { |
| VLOGF(2); |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| DCHECK_EQ(decoder_state_, kAwaitingPictureBuffers); |
| DCHECK(output_queue_); |
| TRACE_EVENT1("media,gpu", "V4L2VDA::AssignPictureBuffersTask", "buffers_size", |
| buffers.size()); |
| |
| if (IsDestroyPending()) |
| return; |
| |
| uint32_t req_buffer_count = output_dpb_size_ + kDpbOutputBufferExtraCount; |
| if (image_processor_device_) |
| req_buffer_count += kDpbOutputBufferExtraCountForImageProcessor; |
| |
| if (buffers.size() < req_buffer_count) { |
| LOG(ERROR) << "Failed to provide requested picture buffers. (Got " |
| << buffers.size() << ", requested " << req_buffer_count << ")"; |
| NOTIFY_ERROR(INVALID_ARGUMENT); |
| return; |
| } |
| |
| enum v4l2_memory memory; |
| if (!image_processor_device_ && output_mode_ == Config::OutputMode::IMPORT) |
| memory = V4L2_MEMORY_DMABUF; |
| else |
| memory = V4L2_MEMORY_MMAP; |
| |
| if (output_queue_->AllocateBuffers(buffers.size(), memory) == 0) { |
| LOG(ERROR) << "Failed to request buffers!"; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return; |
| } |
| |
| if (output_queue_->AllocatedBuffersCount() != buffers.size()) { |
| LOG(ERROR) << "Could not allocate requested number of output buffers"; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return; |
| } |
| |
| DCHECK(output_buffer_map_.empty()); |
| DCHECK(output_wait_map_.empty()); |
| output_buffer_map_.resize(buffers.size()); |
| if (image_processor_device_ && output_mode_ == Config::OutputMode::ALLOCATE) { |
| if (!CreateImageProcessor()) |
| return; |
| } |
| |
| // Reserve all buffers until ImportBufferForPictureTask() is called |
| std::vector<V4L2WritableBufferRef> v4l2_buffers; |
| while (auto buffer_opt = output_queue_->GetFreeBuffer()) |
| v4l2_buffers.push_back(std::move(*buffer_opt)); |
| |
| // Now setup the output record for each buffer and import it if needed. |
| for (auto&& buffer : v4l2_buffers) { |
| const int i = buffer.BufferId(); |
| |
| OutputRecord& output_record = output_buffer_map_[i]; |
| DCHECK_EQ(output_record.egl_image, EGL_NO_IMAGE_KHR); |
| DCHECK_EQ(output_record.picture_id, -1); |
| DCHECK(!output_record.cleared); |
| |
| output_record.picture_id = buffers[i].id(); |
| output_record.texture_id = buffers[i].service_texture_ids().empty() |
| ? 0 |
| : buffers[i].service_texture_ids()[0]; |
| |
| // We move the buffer into output_wait_map_, so get a reference to |
| // its video frame if we need it to create the native pixmap for import. |
| scoped_refptr<VideoFrame> video_frame; |
| if (output_mode_ == Config::OutputMode::ALLOCATE && |
| !image_processor_device_) |
| video_frame = buffer.GetVideoFrame(); |
| |
| // The buffer will remain here until ImportBufferForPicture is called, |
| // either by the client, or by ourselves, if we are allocating. |
| DCHECK_EQ(output_wait_map_.count(buffers[i].id()), 0u); |
| output_wait_map_.emplace(buffers[i].id(), std::move(buffer)); |
| |
| if (output_mode_ == Config::OutputMode::ALLOCATE) { |
| gfx::NativePixmapHandle native_pixmap; |
| |
| // If we are using an image processor, the DMABufs that we need to import |
| // are those of the image processor's buffers, not the decoders. So |
| // pass an empty native pixmap in that case. |
| if (!image_processor_device_) |
| native_pixmap = |
| CreateGpuMemoryBufferHandle(video_frame.get()).native_pixmap_handle; |
| |
| ImportBufferForPictureTask(output_record.picture_id, |
| std::move(native_pixmap)); |
| } // else we'll get triggered via ImportBufferForPicture() from client. |
| |
| DVLOGF(3) << "buffer[" << i << "]: picture_id=" << output_record.picture_id; |
| } |
| |
| if (output_mode_ == Config::OutputMode::ALLOCATE) { |
| ScheduleDecodeBufferTaskIfNeeded(); |
| } |
| } |
| |
| void V4L2VideoDecodeAccelerator::CreateEGLImageFor( |
| scoped_refptr<V4L2Device> egl_device, |
| size_t buffer_index, |
| int32_t picture_buffer_id, |
| gfx::NativePixmapHandle handle, |
| GLuint texture_id, |
| const gfx::Size& visible_size, |
| const Fourcc fourcc) { |
| DVLOGF(3) << "index=" << buffer_index; |
| DCHECK(child_task_runner_->BelongsToCurrentThread()); |
| DCHECK_NE(texture_id, 0u); |
| |
| if (!get_gl_context_cb_ || !make_context_current_cb_) { |
| LOG(ERROR) << "GL callbacks required for binding to EGLImages"; |
| NOTIFY_ERROR(INVALID_ARGUMENT); |
| return; |
| } |
| |
| gl::GLContext* gl_context = get_gl_context_cb_.Run(); |
| if (!gl_context || !make_context_current_cb_.Run()) { |
| LOG(ERROR) << "No GL context"; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return; |
| } |
| |
| gl::ScopedTextureBinder bind_restore(GL_TEXTURE_EXTERNAL_OES, 0); |
| |
| EGLImageKHR egl_image = egl_device->CreateEGLImage( |
| egl_display_, gl_context->GetHandle(), texture_id, visible_size, |
| buffer_index, fourcc, std::move(handle)); |
| if (egl_image == EGL_NO_IMAGE_KHR) { |
| LOG(ERROR) << "could not create EGLImageKHR," |
| << " index=" << buffer_index << " texture_id=" << texture_id; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return; |
| } |
| |
| decoder_thread_.task_runner()->PostTask( |
| FROM_HERE, base::BindOnce(&V4L2VideoDecodeAccelerator::AssignEGLImage, |
| base::Unretained(this), buffer_index, |
| picture_buffer_id, egl_image)); |
| } |
| |
| void V4L2VideoDecodeAccelerator::AssignEGLImage(size_t buffer_index, |
| int32_t picture_buffer_id, |
| EGLImageKHR egl_image) { |
| DVLOGF(3) << "index=" << buffer_index << ", picture_id=" << picture_buffer_id; |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| |
| if (IsDestroyPending()) |
| return; |
| |
| // It's possible that while waiting for the EGLImages to be allocated and |
| // assigned, we have already decoded more of the stream and saw another |
| // resolution change. This is a normal situation, in such a case either there |
| // is no output record with this index awaiting an EGLImage to be assigned to |
| // it, or the record is already updated to use a newer PictureBuffer and is |
| // awaiting an EGLImage associated with a different picture_buffer_id. If so, |
| // just discard this image, we will get the one we are waiting for later. |
| if (buffer_index >= output_buffer_map_.size() || |
| output_buffer_map_[buffer_index].picture_id != picture_buffer_id) { |
| DVLOGF(4) << "Picture set already changed, dropping EGLImage"; |
| child_task_runner_->PostTask( |
| FROM_HERE, |
| base::BindOnce(base::IgnoreResult(&V4L2Device::DestroyEGLImage), |
| device_, egl_display_, egl_image)); |
| return; |
| } |
| |
| OutputRecord& output_record = output_buffer_map_[buffer_index]; |
| DCHECK_EQ(output_record.egl_image, EGL_NO_IMAGE_KHR); |
| |
| output_record.egl_image = egl_image; |
| |
| // Make ourselves available if CreateEGLImageFor has been called from |
| // ImportBufferForPictureTask. |
| if (!image_processor_) { |
| DCHECK_EQ(output_wait_map_.count(picture_buffer_id), 1u); |
| output_wait_map_.erase(picture_buffer_id); |
| if (decoder_state_ != kChangingResolution) { |
| Enqueue(); |
| ScheduleDecodeBufferTaskIfNeeded(); |
| } |
| } |
| } |
| |
| void V4L2VideoDecodeAccelerator::ImportBufferForPicture( |
| int32_t picture_buffer_id, |
| VideoPixelFormat pixel_format, |
| gfx::GpuMemoryBufferHandle gpu_memory_buffer_handle) { |
| DVLOGF(3) << "picture_buffer_id=" << picture_buffer_id; |
| DCHECK(child_task_runner_->BelongsToCurrentThread()); |
| if (output_mode_ != Config::OutputMode::IMPORT) { |
| LOG(ERROR) << "Cannot import in non-import mode"; |
| NOTIFY_ERROR(INVALID_ARGUMENT); |
| return; |
| } |
| |
| decoder_thread_.task_runner()->PostTask( |
| FROM_HERE, |
| base::BindOnce( |
| &V4L2VideoDecodeAccelerator::ImportBufferForPictureForImportTask, |
| base::Unretained(this), picture_buffer_id, pixel_format, |
| std::move(gpu_memory_buffer_handle.native_pixmap_handle))); |
| } |
| |
| void V4L2VideoDecodeAccelerator::ImportBufferForPictureForImportTask( |
| int32_t picture_buffer_id, |
| VideoPixelFormat pixel_format, |
| gfx::NativePixmapHandle handle) { |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| // |output_format_fourcc_| is the output format of the decoder. It is not |
| // the final output format from the image processor (if exists). |
| // Use |egl_image_format_fourcc_|, it will be the final output format. |
| if (pixel_format != egl_image_format_fourcc_->ToVideoPixelFormat()) { |
| LOG(ERROR) << "Unsupported import format: " << pixel_format << ", expected " |
| << VideoPixelFormatToString( |
| egl_image_format_fourcc_->ToVideoPixelFormat()); |
| NOTIFY_ERROR(INVALID_ARGUMENT); |
| return; |
| } |
| |
| for (const auto& plane : handle.planes) { |
| DVLOGF(3) << ": offset=" << plane.offset << ", stride=" << plane.stride; |
| } |
| |
| ImportBufferForPictureTask(picture_buffer_id, std::move(handle)); |
| } |
| |
| void V4L2VideoDecodeAccelerator::ImportBufferForPictureTask( |
| int32_t picture_buffer_id, |
| gfx::NativePixmapHandle handle) { |
| DVLOGF(3) << "picture_buffer_id=" << picture_buffer_id |
| << ", handle.planes.size()=" << handle.planes.size(); |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| TRACE_EVENT2("media,gpu", "V4L2VDA::ImportBufferForPictureTask", |
| "picture_buffer_id", picture_buffer_id, "handle.planes", |
| handle.planes.size()); |
| |
| if (IsDestroyPending()) |
| return; |
| |
| const auto iter = |
| std::find_if(output_buffer_map_.begin(), output_buffer_map_.end(), |
| [picture_buffer_id](const OutputRecord& output_record) { |
| return output_record.picture_id == picture_buffer_id; |
| }); |
| if (iter == output_buffer_map_.end()) { |
| // It's possible that we've already posted a DismissPictureBuffer for this |
| // picture, but it has not yet executed when this ImportBufferForPicture was |
| // posted to us by the client. In that case just ignore this (we've already |
| // dismissed it and accounted for that). |
| DVLOGF(3) << "got picture id=" << picture_buffer_id |
| << " not in use (anymore?)."; |
| return; |
| } |
| |
| if (!output_wait_map_.count(iter->picture_id)) { |
| LOG(ERROR) << "Passed buffer is not waiting to be imported"; |
| NOTIFY_ERROR(INVALID_ARGUMENT); |
| return; |
| } |
| |
| // TODO(crbug.com/982172): ARC++ may adjust the size of the buffer due to |
| // allocator constraints, but the VDA API does not provide a way for it to |
| // communicate the actual buffer size. If we are importing, make sure that the |
| // actual buffer size is coherent with what we expect, and adjust our size if |
| // needed. |
| if (output_mode_ == Config::OutputMode::IMPORT) { |
| DCHECK_GT(handle.planes.size(), 0u); |
| const gfx::Size handle_size = v4l2_vda_helpers::NativePixmapSizeFromHandle( |
| handle, *egl_image_format_fourcc_, egl_image_size_); |
| |
| // If this is the first picture, then adjust the EGL width. |
| // Otherwise just check that it remains the same. |
| if (decoder_state_ == kAwaitingPictureBuffers) { |
| DCHECK_GE(handle_size.width(), egl_image_size_.width()); |
| DVLOGF(3) << "Original egl_image_size=" << egl_image_size_.ToString() |
| << ", adjusted buffer size=" << handle_size.ToString(); |
| egl_image_size_ = handle_size; |
| } |
| DCHECK_EQ(egl_image_size_, handle_size); |
| |
| // For allocate mode, the IP will already have been created in |
| // AssignPictureBuffersTask. |
| if (image_processor_device_ && !image_processor_) { |
| DCHECK_EQ(kAwaitingPictureBuffers, decoder_state_); |
| // This is the first buffer import. Create the image processor and change |
| // the decoder state. The client may adjust the coded width. We don't have |
| // the final coded size in AssignPictureBuffers yet. Use the adjusted |
| // coded width to create the image processor. |
| if (!CreateImageProcessor()) |
| return; |
| } |
| } |
| |
| if (reset_pending_) { |
| FinishReset(); |
| } |
| |
| if (decoder_state_ == kAwaitingPictureBuffers) { |
| decoder_state_ = kDecoding; |
| DVLOGF(3) << "Change state to kDecoding"; |
| } |
| |
| // If we are importing, create the output VideoFrame that we will render |
| // into. |
| if (output_mode_ == Config::OutputMode::IMPORT) { |
| DCHECK_GT(handle.planes.size(), 0u); |
| DCHECK(!iter->output_frame); |
| // Duplicate the buffer FDs for the VideoFrame instance. |
| std::vector<base::ScopedFD> duped_fds; |
| std::vector<ColorPlaneLayout> color_planes; |
| for (const gfx::NativePixmapPlane& plane : handle.planes) { |
| duped_fds.emplace_back(HANDLE_EINTR(dup(plane.fd.get()))); |
| if (!duped_fds.back().is_valid()) { |
| PLOG(ERROR) << "Failed to duplicate plane FD!"; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return; |
| } |
| color_planes.push_back( |
| ColorPlaneLayout(base::checked_cast<int32_t>(plane.stride), |
| base::checked_cast<size_t>(plane.offset), |
| base::checked_cast<size_t>(plane.size))); |
| } |
| auto layout = VideoFrameLayout::CreateWithPlanes( |
| egl_image_format_fourcc_->ToVideoPixelFormat(), egl_image_size_, |
| std::move(color_planes)); |
| if (!layout) { |
| LOG(ERROR) << "Cannot create layout!"; |
| NOTIFY_ERROR(INVALID_ARGUMENT); |
| return; |
| } |
| |
| iter->output_frame = VideoFrame::WrapExternalDmabufs( |
| *layout, gfx::Rect(visible_size_), visible_size_, |
| DuplicateFDs(duped_fds), base::TimeDelta()); |
| } |
| |
| if (iter->texture_id != 0) { |
| if (iter->egl_image != EGL_NO_IMAGE_KHR) { |
| child_task_runner_->PostTask( |
| FROM_HERE, |
| base::BindOnce(base::IgnoreResult(&V4L2Device::DestroyEGLImage), |
| device_, egl_display_, iter->egl_image)); |
| } |
| |
| // If we are not using an image processor, create the EGL image ahead of |
| // time since we already have its DMABUF fds. It is guaranteed that |
| // CreateEGLImageFor will run before the picture is passed to the client |
| // because the picture will need to be cleared on the child thread first. |
| if (!image_processor_) { |
| DCHECK_GT(handle.planes.size(), 0u); |
| size_t index = iter - output_buffer_map_.begin(); |
| |
| child_task_runner_->PostTask( |
| FROM_HERE, |
| base::BindOnce(&V4L2VideoDecodeAccelerator::CreateEGLImageFor, |
| weak_this_, device_, index, picture_buffer_id, |
| std::move(handle), iter->texture_id, visible_size_, |
| *egl_image_format_fourcc_)); |
| |
| // Early return, AssignEGLImage will make the buffer available for |
| // decoding once the EGL image is created. |
| return; |
| } |
| } |
| |
| // The buffer can now be used for decoding |
| DCHECK_EQ(output_wait_map_.count(picture_buffer_id), 1u); |
| output_wait_map_.erase(picture_buffer_id); |
| if (decoder_state_ != kChangingResolution) { |
| Enqueue(); |
| ScheduleDecodeBufferTaskIfNeeded(); |
| } |
| } |
| |
| void V4L2VideoDecodeAccelerator::ReusePictureBuffer(int32_t picture_buffer_id) { |
| DVLOGF(4) << "picture_buffer_id=" << picture_buffer_id; |
| // Must be run on child thread, as we'll insert a sync in the EGL context. |
| DCHECK(child_task_runner_->BelongsToCurrentThread()); |
| |
| std::unique_ptr<gl::GLFenceEGL> egl_fence; |
| |
| if (make_context_current_cb_) { |
| if (!make_context_current_cb_.Run()) { |
| LOG(ERROR) << "could not make context current"; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return; |
| } |
| |
| // TODO(posciak): https://crbug.com/450898. |
| #if defined(ARCH_CPU_ARMEL) |
| egl_fence = gl::GLFenceEGL::Create(); |
| if (!egl_fence) { |
| LOG(ERROR) << "gl::GLFenceEGL::Create() failed"; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return; |
| } |
| #endif |
| } |
| |
| decoder_thread_.task_runner()->PostTask( |
| FROM_HERE, |
| base::BindOnce(&V4L2VideoDecodeAccelerator::ReusePictureBufferTask, |
| base::Unretained(this), picture_buffer_id, |
| std::move(egl_fence))); |
| } |
| |
| void V4L2VideoDecodeAccelerator::Flush() { |
| VLOGF(2); |
| DCHECK(child_task_runner_->BelongsToCurrentThread()); |
| decoder_thread_.task_runner()->PostTask( |
| FROM_HERE, base::BindOnce(&V4L2VideoDecodeAccelerator::FlushTask, |
| base::Unretained(this))); |
| } |
| |
| void V4L2VideoDecodeAccelerator::Reset() { |
| VLOGF(2); |
| DCHECK(child_task_runner_->BelongsToCurrentThread()); |
| decoder_thread_.task_runner()->PostTask( |
| FROM_HERE, base::BindOnce(&V4L2VideoDecodeAccelerator::ResetTask, |
| base::Unretained(this))); |
| } |
| |
| void V4L2VideoDecodeAccelerator::Destroy() { |
| VLOGF(2); |
| DCHECK(child_task_runner_->BelongsToCurrentThread()); |
| |
| // Signal any waiting/sleeping tasks to early exit as soon as possible to |
| // avoid waiting too long for the decoder_thread_ to Stop(). |
| destroy_pending_.Signal(); |
| |
| // We're destroying; cancel all callbacks. |
| client_ptr_factory_.reset(); |
| weak_this_factory_.InvalidateWeakPtrs(); |
| |
| // If the decoder thread is running, destroy using posted task. |
| if (decoder_thread_.IsRunning()) { |
| decoder_thread_.task_runner()->PostTask( |
| FROM_HERE, base::BindOnce(&V4L2VideoDecodeAccelerator::DestroyTask, |
| base::Unretained(this))); |
| // DestroyTask() will cause the decoder_thread_ to flush all tasks. |
| decoder_thread_.Stop(); |
| } |
| |
| delete this; |
| VLOGF(2) << "Destroyed."; |
| } |
| |
| bool V4L2VideoDecodeAccelerator::TryToSetupDecodeOnSeparateThread( |
| const base::WeakPtr<Client>& decode_client, |
| const scoped_refptr<base::SingleThreadTaskRunner>& decode_task_runner) { |
| VLOGF(2); |
| decode_client_ = decode_client; |
| decode_task_runner_ = decode_task_runner; |
| return true; |
| } |
| |
| // static |
| VideoDecodeAccelerator::SupportedProfiles |
| V4L2VideoDecodeAccelerator::GetSupportedProfiles() { |
| scoped_refptr<V4L2Device> device = V4L2Device::Create(); |
| if (!device) |
| return SupportedProfiles(); |
| |
| return device->GetSupportedDecodeProfiles( |
| base::size(supported_input_fourccs_), supported_input_fourccs_); |
| } |
| |
| void V4L2VideoDecodeAccelerator::DecodeTask(scoped_refptr<DecoderBuffer> buffer, |
| int32_t bitstream_id) { |
| DVLOGF(4) << "input_id=" << bitstream_id; |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| DCHECK_NE(decoder_state_, kUninitialized); |
| |
| if (IsDestroyPending()) |
| return; |
| |
| std::unique_ptr<BitstreamBufferRef> bitstream_record(new BitstreamBufferRef( |
| decode_client_, decode_task_runner_, std::move(buffer), bitstream_id)); |
| |
| // Skip empty buffer. |
| if (!bitstream_record->buffer) |
| return; |
| |
| if (decoder_state_ == kResetting || decoder_flushing_) { |
| // In the case that we're resetting or flushing, we need to delay decoding |
| // the BitstreamBuffers that come after the Reset() or Flush() call. When |
| // we're here, we know that this DecodeTask() was scheduled by a Decode() |
| // call that came after (in the client thread) the Reset() or Flush() call; |
| // thus set up the delay if necessary. |
| if (decoder_delay_bitstream_buffer_id_ == -1) |
| decoder_delay_bitstream_buffer_id_ = bitstream_record->input_id; |
| } else if (decoder_state_ == kError) { |
| VLOGF(2) << "early out: kError state"; |
| return; |
| } |
| |
| decoder_input_queue_.push_back(std::move(bitstream_record)); |
| decoder_decode_buffer_tasks_scheduled_++; |
| DecodeBufferTask(); |
| } |
| |
| void V4L2VideoDecodeAccelerator::DecodeBufferTask() { |
| DVLOGF(4); |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| DCHECK_NE(decoder_state_, kUninitialized); |
| TRACE_EVENT0("media,gpu", "V4L2VDA::DecodeBufferTask"); |
| |
| if (IsDestroyPending()) |
| return; |
| |
| decoder_decode_buffer_tasks_scheduled_--; |
| |
| if (decoder_state_ != kInitialized && decoder_state_ != kDecoding) { |
| DVLOGF(3) << "early out: state=" << decoder_state_; |
| return; |
| } |
| |
| if (decoder_current_bitstream_buffer_ == NULL) { |
| if (decoder_input_queue_.empty()) { |
| // We're waiting for a new buffer -- exit without scheduling a new task. |
| return; |
| } |
| if (decoder_delay_bitstream_buffer_id_ == |
| decoder_input_queue_.front()->input_id) { |
| // We're asked to delay decoding on this and subsequent buffers. |
| return; |
| } |
| |
| // Setup to use the next buffer. |
| decoder_current_bitstream_buffer_ = std::move(decoder_input_queue_.front()); |
| decoder_input_queue_.pop_front(); |
| const auto& buffer = decoder_current_bitstream_buffer_->buffer; |
| if (buffer) { |
| DVLOGF(4) << "reading input_id=" |
| << decoder_current_bitstream_buffer_->input_id |
| << ", addr=" << buffer->data() |
| << ", size=" << buffer->data_size(); |
| } else { |
| DCHECK_EQ(decoder_current_bitstream_buffer_->input_id, kFlushBufferId); |
| DVLOGF(4) << "reading input_id=kFlushBufferId"; |
| } |
| } |
| bool schedule_task = false; |
| size_t decoded_size = 0; |
| const auto& buffer = decoder_current_bitstream_buffer_->buffer; |
| if (!buffer) { |
| // This is a dummy buffer, queued to flush the pipe. Flush. |
| DCHECK_EQ(decoder_current_bitstream_buffer_->input_id, kFlushBufferId); |
| // Enqueue a buffer guaranteed to be empty. To do that, we flush the |
| // current input, enqueue no data to the next frame, then flush that down. |
| schedule_task = true; |
| if (current_input_buffer_ && |
| current_input_buffer_->GetTimeStamp().tv_sec != kFlushBufferId) |
| schedule_task = FlushInputFrame(); |
| |
| if (schedule_task && AppendToInputFrame(NULL, 0) && FlushInputFrame()) { |
| VLOGF(2) << "enqueued flush buffer"; |
| schedule_task = true; |
| } else { |
| // If we failed to enqueue the empty buffer (due to pipeline |
| // backpressure), don't advance the bitstream buffer queue, and don't |
| // schedule the next task. This bitstream buffer queue entry will get |
| // reprocessed when the pipeline frees up. |
| schedule_task = false; |
| } |
| } else if (buffer->data_size() == 0) { |
| // This is a buffer queued from the client that has zero size. Skip. |
| // TODO(sandersd): This shouldn't be possible, empty buffers are never |
| // enqueued. |
| schedule_task = true; |
| } else { |
| // This is a buffer queued from the client, with actual contents. Decode. |
| const uint8_t* const data = |
| buffer->data() + decoder_current_bitstream_buffer_->bytes_used; |
| const size_t data_size = |
| buffer->data_size() - decoder_current_bitstream_buffer_->bytes_used; |
| |
| for (auto& workaround : workarounds_) { |
| auto result = workaround->Apply(data, data_size); |
| if (result == V4L2StatefulWorkaround::Result::NotifyError) { |
| LOG(ERROR) << "Failed applying a workaround"; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return; |
| } |
| } |
| |
| if (!frame_splitter_->AdvanceFrameFragment(data, data_size, |
| &decoded_size)) { |
| LOG(ERROR) << "Invalid Stream"; |
| NOTIFY_ERROR(UNREADABLE_INPUT); |
| return; |
| } |
| // AdvanceFrameFragment should not return a size larger than the buffer |
| // size, even on invalid data. |
| CHECK_LE(decoded_size, data_size); |
| |
| switch (decoder_state_) { |
| case kInitialized: |
| schedule_task = DecodeBufferInitial(data, decoded_size, &decoded_size); |
| break; |
| case kDecoding: |
| schedule_task = DecodeBufferContinue(data, decoded_size); |
| break; |
| default: |
| LOG(ERROR) << "Illegal State"; |
| NOTIFY_ERROR(ILLEGAL_STATE); |
| return; |
| } |
| } |
| if (decoder_state_ == kError) { |
| // Failed during decode. |
| return; |
| } |
| |
| if (schedule_task) { |
| decoder_current_bitstream_buffer_->bytes_used += decoded_size; |
| if ((buffer ? buffer->data_size() : 0) == |
| decoder_current_bitstream_buffer_->bytes_used) { |
| // Our current bitstream buffer is done; return it. |
| int32_t input_id = decoder_current_bitstream_buffer_->input_id; |
| DVLOGF(4) << "finished input_id=" << input_id; |
| // BitstreamBufferRef destructor calls NotifyEndOfBitstreamBuffer(). |
| decoder_current_bitstream_buffer_.reset(); |
| } |
| ScheduleDecodeBufferTaskIfNeeded(); |
| } |
| } |
| |
| void V4L2VideoDecodeAccelerator::ScheduleDecodeBufferTaskIfNeeded() { |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| |
| // If we're behind on tasks, schedule another one. |
| int buffers_to_decode = decoder_input_queue_.size(); |
| if (decoder_current_bitstream_buffer_ != NULL) |
| buffers_to_decode++; |
| if (decoder_decode_buffer_tasks_scheduled_ < buffers_to_decode) { |
| decoder_decode_buffer_tasks_scheduled_++; |
| decoder_thread_.task_runner()->PostTask( |
| FROM_HERE, base::BindOnce(&V4L2VideoDecodeAccelerator::DecodeBufferTask, |
| base::Unretained(this))); |
| } |
| } |
| |
| bool V4L2VideoDecodeAccelerator::DecodeBufferInitial(const void* data, |
| size_t size, |
| size_t* endpos) { |
| DVLOGF(3) << "data=" << data << ", size=" << size; |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| DCHECK_EQ(decoder_state_, kInitialized); |
| // Initial decode. We haven't been able to get output stream format info yet. |
| // Get it, and start decoding. |
| |
| // Copy in and send to HW. |
| if (!AppendToInputFrame(data, size)) |
| return false; |
| |
| // If we only have a partial frame, don't flush and process yet. |
| if (frame_splitter_->IsPartialFramePending()) |
| return true; |
| |
| if (!FlushInputFrame()) |
| return false; |
| |
| // Recycle buffers. |
| Dequeue(); |
| |
| *endpos = size; |
| |
| // If an initial resolution change event is not done yet, a driver probably |
| // needs more stream to decode format. |
| // Return true and schedule next buffer without changing status to kDecoding. |
| // If the initial resolution change is done and coded size is known, we may |
| // still have to wait for AssignPictureBuffers() and output buffers to be |
| // allocated. |
| if (coded_size_.IsEmpty() || output_buffer_map_.empty()) { |
| return true; |
| } |
| |
| decoder_state_ = kDecoding; |
| ScheduleDecodeBufferTaskIfNeeded(); |
| return true; |
| } |
| |
| bool V4L2VideoDecodeAccelerator::DecodeBufferContinue(const void* data, |
| size_t size) { |
| DVLOGF(4) << "data=" << data << ", size=" << size; |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| DCHECK_EQ(decoder_state_, kDecoding); |
| |
| // Both of these calls will set kError state if they fail. |
| // Only flush the frame if it's complete. |
| return (AppendToInputFrame(data, size) && |
| (frame_splitter_->IsPartialFramePending() || FlushInputFrame())); |
| } |
| |
| bool V4L2VideoDecodeAccelerator::AppendToInputFrame(const void* data, |
| size_t size) { |
| DVLOGF(4); |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| DCHECK_NE(decoder_state_, kUninitialized); |
| DCHECK_NE(decoder_state_, kResetting); |
| DCHECK_NE(decoder_state_, kError); |
| // This routine can handle data == NULL and size == 0, which occurs when |
| // we queue an empty buffer for the purposes of flushing the pipe. |
| |
| // Flush if we're too big |
| if (current_input_buffer_) { |
| size_t plane_size = current_input_buffer_->GetPlaneSize(0); |
| size_t bytes_used = current_input_buffer_->GetPlaneBytesUsed(0); |
| if (bytes_used + size > plane_size) { |
| if (!FlushInputFrame()) |
| return false; |
| } |
| } |
| |
| // Try to get an available input buffer. |
| if (!current_input_buffer_) { |
| DCHECK(decoder_current_bitstream_buffer_ != NULL); |
| DCHECK(input_queue_); |
| |
| // See if we can get more free buffers from HW. |
| if (input_queue_->FreeBuffersCount() == 0) |
| Dequeue(); |
| |
| current_input_buffer_ = input_queue_->GetFreeBuffer(); |
| if (!current_input_buffer_) { |
| // No buffer available yet. |
| DVLOGF(4) << "stalled for input buffers"; |
| return false; |
| } |
| struct timeval timestamp = { |
| .tv_sec = decoder_current_bitstream_buffer_->input_id}; |
| current_input_buffer_->SetTimeStamp(timestamp); |
| } |
| |
| DCHECK(data != NULL || size == 0); |
| if (size == 0) { |
| // If we asked for an empty buffer, return now. We return only after |
| // getting the next input buffer, since we might actually want an empty |
| // input buffer for flushing purposes. |
| return true; |
| } |
| |
| // Copy in to the buffer. |
| size_t plane_size = current_input_buffer_->GetPlaneSize(0); |
| size_t bytes_used = current_input_buffer_->GetPlaneBytesUsed(0); |
| |
| if (size > plane_size - bytes_used) { |
| LOG(ERROR) << "over-size frame, erroring"; |
| NOTIFY_ERROR(UNREADABLE_INPUT); |
| return false; |
| } |
| void* mapping = current_input_buffer_->GetPlaneMapping(0); |
| memcpy(reinterpret_cast<uint8_t*>(mapping) + bytes_used, data, size); |
| current_input_buffer_->SetPlaneBytesUsed(0, bytes_used + size); |
| |
| return true; |
| } |
| |
| bool V4L2VideoDecodeAccelerator::FlushInputFrame() { |
| DVLOGF(4); |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| DCHECK_NE(decoder_state_, kUninitialized); |
| DCHECK_NE(decoder_state_, kResetting); |
| DCHECK_NE(decoder_state_, kError); |
| |
| if (!current_input_buffer_) |
| return true; |
| |
| const int32_t input_buffer_id = current_input_buffer_->GetTimeStamp().tv_sec; |
| |
| DCHECK(input_buffer_id != kFlushBufferId || |
| current_input_buffer_->GetPlaneBytesUsed(0) == 0); |
| // * if input_id >= 0, this input buffer was prompted by a bitstream buffer we |
| // got from the client. We can skip it if it is empty. |
| // * if input_id < 0 (should be kFlushBufferId in this case), this input |
| // buffer was prompted by a flush buffer, and should be queued even when |
| // empty. |
| if (input_buffer_id >= 0 && |
| current_input_buffer_->GetPlaneBytesUsed(0) == 0) { |
| current_input_buffer_.reset(); |
| return true; |
| } |
| |
| // Queue it. |
| DVLOGF(4) << "submitting input_id=" << input_buffer_id; |
| input_ready_queue_.push(std::move(*current_input_buffer_)); |
| current_input_buffer_.reset(); |
| // Enqueue once since there's new available input for it. |
| Enqueue(); |
| |
| TRACE_COUNTER_ID1("media,gpu", "V4L2VDA input ready buffers", this, |
| input_ready_queue_.size()); |
| |
| return (decoder_state_ != kError); |
| } |
| |
| void V4L2VideoDecodeAccelerator::ServiceDeviceTask(bool event_pending) { |
| DVLOGF(4); |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| DCHECK_NE(decoder_state_, kUninitialized); |
| TRACE_EVENT0("media,gpu", "V4L2VDA::ServiceDeviceTask"); |
| |
| if (IsDestroyPending()) |
| return; |
| |
| DCHECK(input_queue_); |
| DCHECK(output_queue_); |
| |
| if (decoder_state_ == kResetting) { |
| DVLOGF(3) << "early out: kResetting state"; |
| return; |
| } else if (decoder_state_ == kError) { |
| DVLOGF(3) << "early out: kError state"; |
| return; |
| } else if (decoder_state_ == kChangingResolution) { |
| DVLOGF(3) << "early out: kChangingResolution state"; |
| return; |
| } |
| |
| bool resolution_change_pending = false; |
| if (event_pending) |
| resolution_change_pending = DequeueResolutionChangeEvent(); |
| |
| if (!resolution_change_pending && coded_size_.IsEmpty()) { |
| // Some platforms do not send an initial resolution change event. |
| // To work around this, we need to keep checking if the initial resolution |
| // is known already by explicitly querying the format after each decode, |
| // regardless of whether we received an event. |
| // This needs to be done on initial resolution change, |
| // i.e. when coded_size_.IsEmpty(). |
| |
| // Try GetFormatInfo to check if an initial resolution change can be done. |
| struct v4l2_format format; |
| gfx::Size visible_size; |
| bool again; |
| if (GetFormatInfo(&format, &visible_size, &again) && !again) { |
| resolution_change_pending = true; |
| DequeueResolutionChangeEvent(); |
| } |
| } |
| |
| Dequeue(); |
| Enqueue(); |
| |
| // Clear the interrupt fd. |
| if (!device_->ClearDevicePollInterrupt()) { |
| LOG(ERROR) << "Failed Clear the interrupt fd"; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return; |
| } |
| |
| bool poll_device = false; |
| // Add fd, if we should poll on it. |
| // Can be polled as soon as either input or output buffers are queued. |
| if (input_queue_->QueuedBuffersCount() + output_queue_->QueuedBuffersCount() > |
| 0) |
| poll_device = true; |
| |
| // ServiceDeviceTask() should only ever be scheduled from DevicePollTask(), |
| // so either: |
| // * device_poll_thread_ is running normally |
| // * device_poll_thread_ scheduled us, but then a ResetTask() or DestroyTask() |
| // shut it down, in which case we're either in kResetting or kError states |
| // respectively, and we should have early-outed already. |
| DCHECK(device_poll_thread_.task_runner()); |
| // Queue the DevicePollTask() now. |
| device_poll_thread_.task_runner()->PostTask( |
| FROM_HERE, base::BindOnce(&V4L2VideoDecodeAccelerator::DevicePollTask, |
| base::Unretained(this), poll_device)); |
| |
| DVLOGF(3) << "ServiceDeviceTask(): buffer counts: DEC[" |
| << decoder_input_queue_.size() << "->" << input_ready_queue_.size() |
| << "] => DEVICE[" << input_queue_->FreeBuffersCount() << "+" |
| << input_queue_->QueuedBuffersCount() << "/" |
| << input_queue_->AllocatedBuffersCount() << "->" |
| << output_queue_->FreeBuffersCount() << "+" |
| << output_queue_->QueuedBuffersCount() << "/" |
| << output_buffer_map_.size() << "] => PROCESSOR[" |
| << buffers_at_ip_.size() << "] => CLIENT[" |
| << buffers_at_client_.size() << "]"; |
| |
| ScheduleDecodeBufferTaskIfNeeded(); |
| if (resolution_change_pending) |
| StartResolutionChange(); |
| } |
| |
| void V4L2VideoDecodeAccelerator::CheckGLFences() { |
| DVLOGF(4); |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| |
| while (!buffers_awaiting_fence_.empty()) { |
| if (buffers_awaiting_fence_.front().first->HasCompleted()) { |
| // Buffer at the front of the queue goes back to V4L2Queue's free list |
| // and can be reused. |
| buffers_awaiting_fence_.pop(); |
| } else { |
| // If we have no free buffers available, then preemptively schedule a |
| // call to Enqueue() in a short time, otherwise we may starve out of |
| // buffers. The delay chosen roughly corresponds to the time a frame is |
| // displayed, which should be optimal in most cases. |
| if (output_queue_->FreeBuffersCount() == 0) { |
| constexpr int64_t resched_delay = 17; |
| |
| decoder_thread_.task_runner()->PostDelayedTask( |
| FROM_HERE, |
| base::BindOnce(&V4L2VideoDecodeAccelerator::Enqueue, |
| base::Unretained(this)), |
| base::Milliseconds(resched_delay)); |
| } |
| break; |
| } |
| } |
| } |
| |
| void V4L2VideoDecodeAccelerator::Enqueue() { |
| DVLOGF(4); |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| DCHECK_NE(decoder_state_, kUninitialized); |
| |
| // Early return if we are running after DestroyTask() or a resolution change. |
| // This can happen due to the PostDelayedTask() in CheckGLFences(). |
| if (IsDestroyPending() || decoder_state_ == kChangingResolution) |
| return; |
| |
| DCHECK(input_queue_); |
| DCHECK(output_queue_); |
| |
| // Drain the pipe of completed decode buffers. |
| const int old_inputs_queued = input_queue_->QueuedBuffersCount(); |
| while (!input_ready_queue_.empty()) { |
| bool flush_handled = false; |
| int32_t input_id = input_ready_queue_.front().GetTimeStamp().tv_sec; |
| if (input_id == kFlushBufferId) { |
| // Send the flush command after all input buffers are dequeued. This makes |
| // sure all previous resolution changes have been handled because the |
| // driver must hold the input buffer that triggers resolution change. The |
| // driver cannot decode data in it without new output buffers. If we send |
| // the flush now and a queued input buffer triggers resolution change |
| // later, the driver will send an output buffer that has |
| // V4L2_BUF_FLAG_LAST. But some queued input buffer have not been decoded |
| // yet. Also, V4L2VDA calls STREAMOFF and STREAMON after resolution |
| // change. They implicitly send a V4L2_DEC_CMD_STOP and V4L2_DEC_CMD_START |
| // to the decoder. |
| if (input_queue_->QueuedBuffersCount() > 0) |
| break; |
| |
| if (coded_size_.IsEmpty() || !input_queue_->IsStreaming()) { |
| // In these situations, we should call NotifyFlushDone() immediately: |
| // (1) If coded_size_.IsEmpty(), no output buffer could have been |
| // allocated and there is nothing to flush. |
| // (2) If input stream is off, we will never get the output buffer |
| // with V4L2_BUF_FLAG_LAST. |
| VLOGF(2) << "Nothing to flush. Notify flush done directly."; |
| NofityFlushDone(); |
| flush_handled = true; |
| } else if (decoder_cmd_supported_) { |
| if (!SendDecoderCmdStop()) |
| return; |
| flush_handled = true; |
| } |
| } |
| if (flush_handled) { |
| // Recycle the buffer directly if we already handled the flush request. |
| input_ready_queue_.pop(); |
| } else { |
| // Enqueue an input buffer, or an empty flush buffer if decoder cmd |
| // is not supported and there may be buffers to be flushed. |
| auto buffer = std::move(input_ready_queue_.front()); |
| input_ready_queue_.pop(); |
| if (!EnqueueInputRecord(std::move(buffer))) |
| return; |
| } |
| } |
| |
| if (old_inputs_queued == 0 && input_queue_->QueuedBuffersCount() != 0) { |
| // We just started up a previously empty queue. |
| // Queue state changed; signal interrupt. |
| if (!device_->SetDevicePollInterrupt()) { |
| PLOG(ERROR) << "SetDevicePollInterrupt failed"; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return; |
| } |
| // Start VIDIOC_STREAMON if we haven't yet. |
| if (!input_queue_->Streamon()) { |
| LOG(ERROR) << "Failed Stream on input queue"; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return; |
| } |
| } |
| |
| // OUTPUT queue must be started before CAPTURE queue as per codec API. |
| if (!input_queue_->IsStreaming()) |
| return; |
| |
| // Enqueue all the outputs we can. |
| const int old_outputs_queued = output_queue_->QueuedBuffersCount(); |
| // Release output buffers which GL fences have been signaled. |
| CheckGLFences(); |
| while (auto buffer_opt = output_queue_->GetFreeBuffer()) { |
| if (!EnqueueOutputRecord(std::move(*buffer_opt))) |
| return; |
| } |
| if (old_outputs_queued == 0 && output_queue_->QueuedBuffersCount() != 0) { |
| // We just started up a previously empty queue. |
| // Queue state changed; signal interrupt. |
| if (!device_->SetDevicePollInterrupt()) { |
| PLOG(ERROR) << "SetDevicePollInterrupt(): failed"; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return; |
| } |
| |
| if (!output_queue_->Streamon()) { |
| PLOG(ERROR) << "Failed Stream on output queue"; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return; |
| } |
| } |
| } |
| |
| bool V4L2VideoDecodeAccelerator::DequeueResolutionChangeEvent() { |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| DCHECK_NE(decoder_state_, kUninitialized); |
| DVLOGF(3); |
| |
| while (absl::optional<struct v4l2_event> event = device_->DequeueEvent()) { |
| if (event->type == V4L2_EVENT_SOURCE_CHANGE) { |
| if (event->u.src_change.changes & V4L2_EVENT_SRC_CH_RESOLUTION) { |
| VLOGF(2) << "got resolution change event."; |
| return true; |
| } |
| } else { |
| VLOGF(1) << "got an event (" << event->type |
| << ") we haven't subscribed to."; |
| } |
| } |
| return false; |
| } |
| |
| void V4L2VideoDecodeAccelerator::Dequeue() { |
| DVLOGF(4); |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| DCHECK_NE(decoder_state_, kUninitialized); |
| DCHECK(input_queue_); |
| DCHECK(output_queue_); |
| |
| while (input_queue_->QueuedBuffersCount() > 0) { |
| if (!DequeueInputBuffer()) |
| break; |
| } |
| while (output_queue_->QueuedBuffersCount() > 0) { |
| if (!DequeueOutputBuffer()) |
| break; |
| } |
| NotifyFlushDoneIfNeeded(); |
| } |
| |
| bool V4L2VideoDecodeAccelerator::DequeueInputBuffer() { |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| DCHECK(input_queue_); |
| DCHECK_GT(input_queue_->QueuedBuffersCount(), 0u); |
| |
| // Dequeue a completed input (VIDEO_OUTPUT) buffer, and recycle to the free |
| // list. |
| auto ret = input_queue_->DequeueBuffer(); |
| |
| if (ret.first == false) { |
| LOG(ERROR) << "Error in Dequeue input buffer"; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return false; |
| } else if (!ret.second) { |
| // we're just out of buffers to dequeue. |
| return false; |
| } |
| |
| return true; |
| } |
| |
| bool V4L2VideoDecodeAccelerator::DequeueOutputBuffer() { |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| DCHECK(output_queue_); |
| DCHECK_GT(output_queue_->QueuedBuffersCount(), 0u); |
| DCHECK(output_queue_->IsStreaming()); |
| |
| // Dequeue a completed output (VIDEO_CAPTURE) buffer, and queue to the |
| // completed queue. |
| auto ret = output_queue_->DequeueBuffer(); |
| if (ret.first == false) { |
| LOG(ERROR) << "Error in Dequeue output buffer"; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return false; |
| } |
| if (!ret.second) { |
| return false; |
| } |
| |
| V4L2ReadableBufferRef buf(std::move(ret.second)); |
| |
| DCHECK_LT(buf->BufferId(), output_buffer_map_.size()); |
| OutputRecord& output_record = output_buffer_map_[buf->BufferId()]; |
| DCHECK_NE(output_record.picture_id, -1); |
| // Zero-bytes buffers are returned as part of a flush and can be dismissed. |
| if (buf->GetPlaneBytesUsed(0) > 0) { |
| int32_t bitstream_buffer_id = buf->GetTimeStamp().tv_sec; |
| DCHECK_GE(bitstream_buffer_id, 0); |
| DVLOGF(4) << "Dequeue output buffer: dqbuf index=" << buf->BufferId() |
| << " bitstream input_id=" << bitstream_buffer_id; |
| if (image_processor_device_) { |
| if (!ProcessFrame(bitstream_buffer_id, buf)) { |
| LOG(ERROR) << "Processing frame failed"; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return false; |
| } |
| } else { |
| SendBufferToClient(buf->BufferId(), bitstream_buffer_id, buf); |
| } |
| } |
| if (buf->IsLast()) { |
| DVLOGF(3) << "Got last output buffer. Waiting last buffer=" |
| << flush_awaiting_last_output_buffer_; |
| if (flush_awaiting_last_output_buffer_) { |
| flush_awaiting_last_output_buffer_ = false; |
| struct v4l2_decoder_cmd cmd; |
| memset(&cmd, 0, sizeof(cmd)); |
| cmd.cmd = V4L2_DEC_CMD_START; |
| IOCTL_OR_ERROR_RETURN_FALSE(VIDIOC_DECODER_CMD, &cmd); |
| } |
| } |
| |
| return true; |
| } |
| |
| bool V4L2VideoDecodeAccelerator::EnqueueInputRecord( |
| V4L2WritableBufferRef buffer) { |
| DVLOGF(4); |
| |
| // Enqueue an input (VIDEO_OUTPUT) buffer. |
| int32_t input_id = buffer.GetTimeStamp().tv_sec; |
| size_t bytes_used = buffer.GetPlaneBytesUsed(0); |
| if (!std::move(buffer).QueueMMap()) { |
| LOG(ERROR) << "Error in Queue input buffer"; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return false; |
| } |
| DVLOGF(4) << "enqueued input_id=" << input_id << " size=" << bytes_used; |
| return true; |
| } |
| |
| bool V4L2VideoDecodeAccelerator::EnqueueOutputRecord( |
| V4L2WritableBufferRef buffer) { |
| OutputRecord& output_record = output_buffer_map_[buffer.BufferId()]; |
| DCHECK_NE(output_record.picture_id, -1); |
| |
| bool ret = false; |
| switch (buffer.Memory()) { |
| case V4L2_MEMORY_MMAP: |
| ret = std::move(buffer).QueueMMap(); |
| break; |
| case V4L2_MEMORY_DMABUF: |
| ret = std::move(buffer).QueueDMABuf(output_record.output_frame); |
| break; |
| default: |
| NOTREACHED(); |
| } |
| |
| if (!ret) { |
| LOG(ERROR) << "Error in Dequeue output buffer"; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return false; |
| } |
| |
| return true; |
| } |
| |
| void V4L2VideoDecodeAccelerator::ReusePictureBufferTask( |
| int32_t picture_buffer_id, |
| std::unique_ptr<gl::GLFenceEGL> egl_fence) { |
| DVLOGF(4) << "picture_buffer_id=" << picture_buffer_id; |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| |
| if (IsDestroyPending()) |
| return; |
| |
| // We run ReusePictureBufferTask even if we're in kResetting. |
| if (decoder_state_ == kError) { |
| DVLOGF(4) << "early out: kError state"; |
| return; |
| } |
| |
| if (decoder_state_ == kChangingResolution) { |
| DVLOGF(4) << "early out: kChangingResolution"; |
| return; |
| } |
| |
| auto iter = buffers_at_client_.find(picture_buffer_id); |
| if (iter == buffers_at_client_.end()) { |
| // It's possible that we've already posted a DismissPictureBuffer for this |
| // picture, but it has not yet executed when this ReusePictureBuffer was |
| // posted to us by the client. In that case just ignore this (we've already |
| // dismissed it and accounted for that) and let the fence object get |
| // destroyed. |
| DVLOGF(3) << "got picture id= " << picture_buffer_id |
| << " not in use (anymore?)."; |
| return; |
| } |
| |
| // Take ownership of the EGL fence and keep the buffer out of the game until |
| // the fence signals. |
| if (egl_fence) |
| buffers_awaiting_fence_.emplace( |
| std::make_pair(std::move(egl_fence), std::move(iter->second))); |
| |
| buffers_at_client_.erase(iter); |
| |
| // We got a buffer back, so enqueue it back. |
| Enqueue(); |
| |
| TRACE_COUNTER_ID2( |
| "media,gpu", "V4L2 output buffers", this, "in client", |
| buffers_at_client_.size(), "in vda", |
| output_buffer_map_.size() - buffers_at_client_.size()); |
| TRACE_COUNTER_ID2( |
| "media,gpu", "V4L2 output buffers in vda", this, "free", |
| output_queue_->FreeBuffersCount(), "in device or IP", |
| output_queue_->QueuedBuffersCount() + buffers_at_ip_.size()); |
| } |
| |
| void V4L2VideoDecodeAccelerator::FlushTask() { |
| VLOGF(2); |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| |
| if (IsDestroyPending()) |
| return; |
| |
| if (decoder_state_ == kError) { |
| VLOGF(2) << "early out: kError state"; |
| return; |
| } |
| |
| TRACE_EVENT_NESTABLE_ASYNC_BEGIN0("media,gpu", "V4L2VDA::FlushTask", |
| TRACE_ID_LOCAL(this)); |
| |
| // We don't support stacked flushing. |
| DCHECK(!decoder_flushing_); |
| |
| // Queue up an empty buffer -- this triggers the flush. |
| decoder_input_queue_.push_back(std::make_unique<BitstreamBufferRef>( |
| decode_client_, decode_task_runner_, nullptr, kFlushBufferId)); |
| decoder_flushing_ = true; |
| SendPictureReady(); // Send all pending PictureReady. |
| |
| ScheduleDecodeBufferTaskIfNeeded(); |
| } |
| |
| void V4L2VideoDecodeAccelerator::NotifyFlushDoneIfNeeded() { |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| DCHECK(input_queue_); |
| if (!decoder_flushing_) |
| return; |
| |
| // Pipeline is empty when: |
| // * Decoder input queue is empty of non-delayed buffers. |
| // * There is no currently filling input buffer. |
| // * Input holding queue is empty. |
| // * All input (VIDEO_OUTPUT) buffers are returned. |
| // * All image processor buffers are returned. |
| if (!decoder_input_queue_.empty()) { |
| if (decoder_input_queue_.front()->input_id != |
| decoder_delay_bitstream_buffer_id_) { |
| DVLOGF(3) << "Some input bitstream buffers are not queued."; |
| return; |
| } |
| } |
| if (current_input_buffer_) { |
| DVLOGF(3) << "Current input buffer != -1"; |
| return; |
| } |
| if ((input_ready_queue_.size() + input_queue_->QueuedBuffersCount()) != 0) { |
| DVLOGF(3) << "Some input buffers are not dequeued."; |
| return; |
| } |
| if (!buffers_at_ip_.empty()) { |
| DVLOGF(3) << "Waiting for image processor to complete."; |
| return; |
| } |
| if (flush_awaiting_last_output_buffer_) { |
| DVLOGF(3) << "Waiting for last output buffer."; |
| return; |
| } |
| |
| // TODO(posciak): https://crbug.com/270039. Exynos requires a |
| // streamoff-streamon sequence after flush to continue, even if we are not |
| // resetting. This would make sense, because we don't really want to resume |
| // from a non-resume point (e.g. not from an IDR) if we are flushed. |
| // MSE player however triggers a Flush() on chunk end, but never Reset(). One |
| // could argue either way, or even say that Flush() is not needed/harmful when |
| // transitioning to next chunk. |
| // For now, do the streamoff-streamon cycle to satisfy Exynos and not freeze |
| // when doing MSE. This should be harmless otherwise. |
| if (!(StopDevicePoll() && StopOutputStream() && StopInputStream())) |
| return; |
| |
| if (!StartDevicePoll()) |
| return; |
| |
| NofityFlushDone(); |
| // While we were flushing, we early-outed DecodeBufferTask()s. |
| ScheduleDecodeBufferTaskIfNeeded(); |
| } |
| |
| void V4L2VideoDecodeAccelerator::NofityFlushDone() { |
| TRACE_EVENT_NESTABLE_ASYNC_END0("media,gpu", "V4L2VDA::FlushTask", |
| TRACE_ID_LOCAL(this)); |
| decoder_delay_bitstream_buffer_id_ = -1; |
| decoder_flushing_ = false; |
| VLOGF(2) << "returning flush"; |
| child_task_runner_->PostTask( |
| FROM_HERE, base::BindOnce(&Client::NotifyFlushDone, client_)); |
| } |
| |
| bool V4L2VideoDecodeAccelerator::IsDecoderCmdSupported() { |
| // CMD_STOP should always succeed. If the decoder is started, the command can |
| // flush it. If the decoder is stopped, the command does nothing. We use this |
| // to know if a driver supports V4L2_DEC_CMD_STOP to flush. |
| struct v4l2_decoder_cmd cmd; |
| memset(&cmd, 0, sizeof(cmd)); |
| cmd.cmd = V4L2_DEC_CMD_STOP; |
| if (device_->Ioctl(VIDIOC_TRY_DECODER_CMD, &cmd) != 0) { |
| VLOGF(2) "V4L2_DEC_CMD_STOP is not supported."; |
| return false; |
| } |
| |
| return true; |
| } |
| |
| bool V4L2VideoDecodeAccelerator::SendDecoderCmdStop() { |
| VLOGF(2); |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| DCHECK(!flush_awaiting_last_output_buffer_); |
| |
| struct v4l2_decoder_cmd cmd; |
| memset(&cmd, 0, sizeof(cmd)); |
| cmd.cmd = V4L2_DEC_CMD_STOP; |
| IOCTL_OR_ERROR_RETURN_FALSE(VIDIOC_DECODER_CMD, &cmd); |
| flush_awaiting_last_output_buffer_ = true; |
| |
| return true; |
| } |
| |
| void V4L2VideoDecodeAccelerator::ResetTask() { |
| VLOGF(2); |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| |
| if (IsDestroyPending()) |
| return; |
| |
| if (decoder_state_ == kError) { |
| VLOGF(2) << "early out: kError state"; |
| return; |
| } |
| |
| TRACE_EVENT_NESTABLE_ASYNC_BEGIN0("media,gpu", "V4L2VDA::ResetTask", |
| TRACE_ID_LOCAL(this)); |
| |
| decoder_current_bitstream_buffer_.reset(); |
| while (!decoder_input_queue_.empty()) |
| decoder_input_queue_.pop_front(); |
| |
| current_input_buffer_.reset(); |
| |
| // If we are in the middle of switching resolutions or awaiting picture |
| // buffers, postpone reset until it's done. We don't have to worry about |
| // timing of this wrt to decoding, because output pipe is already |
| // stopped if we are changing resolution. We will come back here after |
| // we are done. |
| DCHECK(!reset_pending_); |
| if (decoder_state_ == kChangingResolution || |
| decoder_state_ == kAwaitingPictureBuffers) { |
| reset_pending_ = true; |
| return; |
| } |
| FinishReset(); |
| } |
| |
| void V4L2VideoDecodeAccelerator::FinishReset() { |
| VLOGF(2); |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| |
| reset_pending_ = false; |
| // After the output stream is stopped, the codec should not post any |
| // resolution change events. So we dequeue the resolution change event |
| // afterwards. The event could be posted before or while stopping the output |
| // stream. The codec will expect the buffer of new size after the seek, so |
| // we need to handle the resolution change event first. |
| if (!(StopDevicePoll() && StopOutputStream())) |
| return; |
| |
| if (DequeueResolutionChangeEvent()) { |
| reset_pending_ = true; |
| StartResolutionChange(); |
| return; |
| } |
| |
| if (!StopInputStream()) |
| return; |
| |
| // Drop all buffers in image processor. |
| if (image_processor_ && !ResetImageProcessor()) { |
| LOG(ERROR) << "Fail to reset image processor"; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return; |
| } |
| |
| // If we were flushing, we'll never return any more BitstreamBuffers or |
| // PictureBuffers; they have all been dropped and returned by now. |
| NotifyFlushDoneIfNeeded(); |
| |
| // Mark that we're resetting, then enqueue a ResetDoneTask(). All intervening |
| // jobs will early-out in the kResetting state. |
| decoder_state_ = kResetting; |
| SendPictureReady(); // Send all pending PictureReady. |
| decoder_thread_.task_runner()->PostTask( |
| FROM_HERE, base::BindOnce(&V4L2VideoDecodeAccelerator::ResetDoneTask, |
| base::Unretained(this))); |
| } |
| |
| void V4L2VideoDecodeAccelerator::ResetDoneTask() { |
| VLOGF(2); |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| |
| if (IsDestroyPending()) |
| return; |
| |
| if (decoder_state_ == kError) { |
| VLOGF(2) << "early out: kError state"; |
| return; |
| } |
| |
| TRACE_EVENT_NESTABLE_ASYNC_END0("media,gpu", "V4L2VDA::ResetTask", |
| TRACE_ID_LOCAL(this)); |
| |
| // Start poll thread if NotifyFlushDoneIfNeeded has not already. |
| if (!device_poll_thread_.IsRunning()) { |
| if (!StartDevicePoll()) |
| return; |
| } |
| |
| frame_splitter_->Reset(); |
| |
| // Jobs drained, we're finished resetting. |
| DCHECK_EQ(decoder_state_, kResetting); |
| decoder_state_ = kInitialized; |
| |
| decoder_delay_bitstream_buffer_id_ = -1; |
| child_task_runner_->PostTask( |
| FROM_HERE, base::BindOnce(&Client::NotifyResetDone, client_)); |
| |
| // While we were resetting, we early-outed DecodeBufferTask()s. |
| ScheduleDecodeBufferTaskIfNeeded(); |
| } |
| |
| void V4L2VideoDecodeAccelerator::DestroyTask() { |
| VLOGF(2); |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| TRACE_EVENT0("media,gpu", "V4L2VDA::DestroyTask"); |
| |
| // DestroyTask() should run regardless of decoder_state_. |
| |
| decoder_state_ = kDestroying; |
| |
| StopDevicePoll(); |
| StopOutputStream(); |
| StopInputStream(); |
| |
| decoder_current_bitstream_buffer_.reset(); |
| current_input_buffer_.reset(); |
| decoder_decode_buffer_tasks_scheduled_ = 0; |
| while (!decoder_input_queue_.empty()) |
| decoder_input_queue_.pop_front(); |
| decoder_flushing_ = false; |
| |
| // First liberate all the frames held by the client. |
| buffers_at_client_.clear(); |
| |
| // The image processor's thread was the user of the image processor device, |
| // so let it keep the last reference and destroy it in its own thread. |
| image_processor_device_ = nullptr; |
| image_processor_ = nullptr; |
| while (!buffers_at_ip_.empty()) |
| buffers_at_ip_.pop(); |
| |
| DestroyInputBuffers(); |
| DestroyOutputBuffers(); |
| |
| input_queue_ = nullptr; |
| output_queue_ = nullptr; |
| |
| frame_splitter_ = nullptr; |
| workarounds_.clear(); |
| |
| // Clear the V4L2 devices in the decoder thread so the V4L2Device's |
| // destructor is called from the thread that used it. |
| device_ = nullptr; |
| |
| base::trace_event::MemoryDumpManager::GetInstance()->UnregisterDumpProvider( |
| this); |
| } |
| |
| bool V4L2VideoDecodeAccelerator::StartDevicePoll() { |
| DVLOGF(3); |
| DCHECK(!device_poll_thread_.IsRunning()); |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| |
| // Start up the device poll thread and schedule its first DevicePollTask(). |
| if (!device_poll_thread_.Start()) { |
| LOG(ERROR) << "Device thread failed to start"; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return false; |
| } |
| cancelable_service_device_task_.Reset(base::BindRepeating( |
| &V4L2VideoDecodeAccelerator::ServiceDeviceTask, base::Unretained(this))); |
| cancelable_service_device_task_callback_ = |
| cancelable_service_device_task_.callback(); |
| device_poll_thread_.task_runner()->PostTask( |
| FROM_HERE, base::BindOnce(&V4L2VideoDecodeAccelerator::DevicePollTask, |
| base::Unretained(this), 0)); |
| |
| return true; |
| } |
| |
| bool V4L2VideoDecodeAccelerator::StopDevicePoll() { |
| DVLOGF(3); |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| |
| if (!device_poll_thread_.IsRunning()) |
| return true; |
| |
| // Signal the DevicePollTask() to stop, and stop the device poll thread. |
| if (!device_->SetDevicePollInterrupt()) { |
| PLOG(ERROR) << "SetDevicePollInterrupt(): failed"; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return false; |
| } |
| device_poll_thread_.Stop(); |
| // Must be done after the Stop() above to ensure |
| // |cancelable_service_device_task_callback_| is not copied. |
| cancelable_service_device_task_.Cancel(); |
| cancelable_service_device_task_callback_ = base::NullCallback(); |
| // Clear the interrupt now, to be sure. |
| if (!device_->ClearDevicePollInterrupt()) { |
| PLOG(ERROR) << "ClearDevicePollInterrupt: failed"; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return false; |
| } |
| DVLOGF(3) << "device poll stopped"; |
| return true; |
| } |
| |
| bool V4L2VideoDecodeAccelerator::StopOutputStream() { |
| VLOGF(2); |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| |
| if (!output_queue_ || !output_queue_->IsStreaming()) |
| return true; |
| |
| if (!output_queue_->Streamoff()) { |
| LOG(ERROR) << "Failed streaming off output queue"; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return false; |
| } |
| |
| // Output stream is stopped. No need to wait for the buffer anymore. |
| flush_awaiting_last_output_buffer_ = false; |
| |
| return true; |
| } |
| |
| bool V4L2VideoDecodeAccelerator::StopInputStream() { |
| VLOGF(2); |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| |
| if (!input_queue_ || !input_queue_->IsStreaming()) |
| return true; |
| |
| if (!input_queue_->Streamoff()) { |
| LOG(ERROR) << "Failed streaming off input queue"; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return false; |
| } |
| |
| // Reset accounting info for input. |
| while (!input_ready_queue_.empty()) |
| input_ready_queue_.pop(); |
| |
| return true; |
| } |
| |
| void V4L2VideoDecodeAccelerator::StartResolutionChange() { |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| DCHECK_NE(decoder_state_, kUninitialized); |
| DCHECK_NE(decoder_state_, kResetting); |
| |
| VLOGF(2) << "Initiate resolution change"; |
| |
| if (!(StopDevicePoll() && StopOutputStream())) |
| return; |
| |
| decoder_state_ = kChangingResolution; |
| SendPictureReady(); // Send all pending PictureReady. |
| |
| if (!buffers_at_ip_.empty()) { |
| VLOGF(2) << "Wait image processor to finish before destroying buffers."; |
| return; |
| } |
| |
| buffers_at_client_.clear(); |
| |
| image_processor_ = nullptr; |
| |
| if (!DestroyOutputBuffers()) { |
| LOG(ERROR) << "Failed destroying output buffers."; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return; |
| } |
| |
| FinishResolutionChange(); |
| } |
| |
| void V4L2VideoDecodeAccelerator::FinishResolutionChange() { |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| DCHECK_EQ(decoder_state_, kChangingResolution); |
| VLOGF(2); |
| |
| if (decoder_state_ == kError) { |
| VLOGF(2) << "early out: kError state"; |
| return; |
| } |
| |
| struct v4l2_format format; |
| bool again; |
| gfx::Size visible_size; |
| bool ret = GetFormatInfo(&format, &visible_size, &again); |
| if (!ret || again) { |
| LOG(ERROR) << "Couldn't get format information after resolution change"; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return; |
| } |
| |
| if (!CreateBuffersForFormat(format, visible_size)) { |
| LOG(ERROR) << "Couldn't reallocate buffers after resolution change"; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return; |
| } |
| |
| if (!StartDevicePoll()) |
| return; |
| } |
| |
| void V4L2VideoDecodeAccelerator::DevicePollTask(bool poll_device) { |
| DVLOGF(4); |
| DCHECK(device_poll_thread_.task_runner()->BelongsToCurrentThread()); |
| TRACE_EVENT0("media,gpu", "V4L2VDA::DevicePollTask"); |
| |
| bool event_pending = false; |
| |
| if (!device_->Poll(poll_device, &event_pending)) { |
| LOG(ERROR) << "Failed during poll"; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return; |
| } |
| |
| // All processing should happen on ServiceDeviceTask(), since we shouldn't |
| // touch decoder state from this thread. |
| decoder_thread_.task_runner()->PostTask( |
| FROM_HERE, |
| base::BindOnce(cancelable_service_device_task_callback_, event_pending)); |
| } |
| |
| bool V4L2VideoDecodeAccelerator::IsDestroyPending() { |
| return destroy_pending_.IsSignaled(); |
| } |
| |
| void V4L2VideoDecodeAccelerator::NotifyError(Error error) { |
| VLOGF(1); |
| |
| // Notifying the client should only happen from the client's thread. |
| if (!child_task_runner_->BelongsToCurrentThread()) { |
| child_task_runner_->PostTask( |
| FROM_HERE, base::BindOnce(&V4L2VideoDecodeAccelerator::NotifyError, |
| weak_this_, error)); |
| return; |
| } |
| |
| // Notify the decoder's client an error has occurred. |
| if (client_) { |
| client_->NotifyError(error); |
| client_ptr_factory_.reset(); |
| } |
| } |
| |
| void V4L2VideoDecodeAccelerator::SetErrorState(Error error) { |
| // We can touch decoder_state_ only if this is the decoder thread or the |
| // decoder thread isn't running. |
| if (decoder_thread_.task_runner() && |
| !decoder_thread_.task_runner()->BelongsToCurrentThread()) { |
| decoder_thread_.task_runner()->PostTask( |
| FROM_HERE, base::BindOnce(&V4L2VideoDecodeAccelerator::SetErrorState, |
| base::Unretained(this), error)); |
| return; |
| } |
| |
| // Notifying the client of an error will only happen if we are already |
| // initialized, as the API does not allow doing so before that. Subsequent |
| // errors and errors while destroying will be suppressed. |
| if (decoder_state_ != kError && decoder_state_ != kUninitialized && |
| decoder_state_ != kDestroying) |
| NotifyError(error); |
| |
| decoder_state_ = kError; |
| } |
| |
| bool V4L2VideoDecodeAccelerator::GetFormatInfo(struct v4l2_format* format, |
| gfx::Size* visible_size, |
| bool* again) { |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| |
| *again = false; |
| |
| auto ret = output_queue_->GetFormat(); |
| switch (ret.second) { |
| case 0: |
| *format = *ret.first; |
| break; |
| case EINVAL: |
| // EINVAL means we haven't seen sufficient stream to decode the format. |
| *again = true; |
| return true; |
| default: |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return false; |
| } |
| |
| // Make sure we are still getting the format we set on initialization. |
| if (format->fmt.pix_mp.pixelformat != output_format_fourcc_->ToV4L2PixFmt()) { |
| VLOGF(1) << "Unexpected format from G_FMT on output"; |
| return false; |
| } |
| |
| gfx::Size coded_size(format->fmt.pix_mp.width, format->fmt.pix_mp.height); |
| if (visible_size != nullptr) |
| *visible_size = GetVisibleSize(coded_size); |
| |
| return true; |
| } |
| |
| bool V4L2VideoDecodeAccelerator::CreateBuffersForFormat( |
| const struct v4l2_format& format, |
| const gfx::Size& visible_size) { |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| size_t egl_image_planes_count; |
| |
| coded_size_.SetSize(format.fmt.pix_mp.width, format.fmt.pix_mp.height); |
| visible_size_ = visible_size; |
| if (image_processor_device_) { |
| egl_image_size_ = visible_size_; |
| egl_image_planes_count = 0; |
| if (!V4L2ImageProcessorBackend::TryOutputFormat( |
| output_format_fourcc_->ToV4L2PixFmt(), |
| egl_image_format_fourcc_->ToV4L2PixFmt(), coded_size_, |
| &egl_image_size_, &egl_image_planes_count)) { |
| VLOGF(1) << "Fail to get output size and plane count of processor"; |
| return false; |
| } |
| } else { |
| egl_image_size_ = coded_size_; |
| egl_image_planes_count = format.fmt.pix_mp.num_planes; |
| } |
| VLOGF(2) << "new resolution: " << coded_size_.ToString() |
| << ", visible size: " << visible_size_.ToString() |
| << ", decoder output planes count: " << format.fmt.pix_mp.num_planes |
| << ", EGLImage size: " << egl_image_size_.ToString() |
| << ", EGLImage plane count: " << egl_image_planes_count; |
| |
| return CreateOutputBuffers(); |
| } |
| |
| gfx::Size V4L2VideoDecodeAccelerator::GetVisibleSize( |
| const gfx::Size& coded_size) { |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| |
| auto ret = output_queue_->GetVisibleRect(); |
| if (!ret) { |
| return coded_size; |
| } |
| gfx::Rect rect = std::move(*ret); |
| DVLOGF(3) << "visible rectangle is " << rect.ToString(); |
| if (!gfx::Rect(coded_size).Contains(rect)) { |
| DVLOGF(3) << "visible rectangle " << rect.ToString() |
| << " is not inside coded size " << coded_size.ToString(); |
| return coded_size; |
| } |
| if (rect.IsEmpty()) { |
| VLOGF(1) << "visible size is empty"; |
| return coded_size; |
| } |
| |
| // Chrome assume picture frame is coded at (0, 0). |
| if (!rect.origin().IsOrigin()) { |
| VLOGF(1) << "Unexpected visible rectangle " << rect.ToString() |
| << ", top-left is not origin"; |
| return coded_size; |
| } |
| |
| return rect.size(); |
| } |
| |
| bool V4L2VideoDecodeAccelerator::CreateInputBuffers() { |
| VLOGF(2); |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| // We always run this as we prepare to initialize. |
| DCHECK_EQ(decoder_state_, kInitialized); |
| DCHECK(input_queue_); |
| |
| if (input_queue_->AllocateBuffers(kInputBufferCount, V4L2_MEMORY_MMAP) == 0) { |
| LOG(ERROR) << "Failed allocating input buffers"; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return false; |
| } |
| |
| return true; |
| } |
| |
| bool V4L2VideoDecodeAccelerator::SetupFormats() { |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| DCHECK_EQ(decoder_state_, kInitialized); |
| DCHECK(!input_queue_->IsStreaming()); |
| DCHECK(!output_queue_->IsStreaming()); |
| |
| size_t input_size; |
| gfx::Size max_resolution, min_resolution; |
| device_->GetSupportedResolution(input_format_fourcc_, &min_resolution, |
| &max_resolution); |
| if (max_resolution.width() > 1920 && max_resolution.height() > 1088) |
| input_size = kInputBufferMaxSizeFor4k; |
| else |
| input_size = kInputBufferMaxSizeFor1080p; |
| |
| struct v4l2_fmtdesc fmtdesc; |
| memset(&fmtdesc, 0, sizeof(fmtdesc)); |
| fmtdesc.type = V4L2_BUF_TYPE_VIDEO_OUTPUT_MPLANE; |
| bool is_format_supported = false; |
| while (device_->Ioctl(VIDIOC_ENUM_FMT, &fmtdesc) == 0) { |
| if (fmtdesc.pixelformat == input_format_fourcc_) { |
| is_format_supported = true; |
| break; |
| } |
| ++fmtdesc.index; |
| } |
| |
| if (!is_format_supported) { |
| VLOGF(1) << "Input fourcc " << input_format_fourcc_ |
| << " not supported by device."; |
| return false; |
| } |
| |
| struct v4l2_format format; |
| memset(&format, 0, sizeof(format)); |
| format.type = V4L2_BUF_TYPE_VIDEO_OUTPUT_MPLANE; |
| format.fmt.pix_mp.pixelformat = input_format_fourcc_; |
| format.fmt.pix_mp.plane_fmt[0].sizeimage = input_size; |
| format.fmt.pix_mp.num_planes = 1; |
| IOCTL_OR_ERROR_RETURN_FALSE(VIDIOC_S_FMT, &format); |
| DCHECK_EQ(format.fmt.pix_mp.pixelformat, input_format_fourcc_); |
| |
| // We have to set up the format for output, because the driver may not allow |
| // changing it once we start streaming; whether it can support our chosen |
| // output format or not may depend on the input format. |
| memset(&fmtdesc, 0, sizeof(fmtdesc)); |
| fmtdesc.type = V4L2_BUF_TYPE_VIDEO_CAPTURE_MPLANE; |
| while (device_->Ioctl(VIDIOC_ENUM_FMT, &fmtdesc) == 0) { |
| auto fourcc = Fourcc::FromV4L2PixFmt(fmtdesc.pixelformat); |
| if (fourcc && device_->CanCreateEGLImageFrom(*fourcc)) { |
| output_format_fourcc_ = *fourcc; |
| break; |
| } |
| ++fmtdesc.index; |
| } |
| |
| DCHECK(!image_processor_device_); |
| if (!output_format_fourcc_) { |
| VLOGF(2) << "Could not find a usable output format. Try image processor"; |
| if (!V4L2ImageProcessorBackend::IsSupported()) { |
| VLOGF(1) << "Image processor not available"; |
| return false; |
| } |
| output_format_fourcc_ = |
| v4l2_vda_helpers::FindImageProcessorInputFormat(device_.get()); |
| if (!output_format_fourcc_) { |
| VLOGF(1) << "Can't find a usable input format from image processor"; |
| return false; |
| } |
| egl_image_format_fourcc_ = |
| v4l2_vda_helpers::FindImageProcessorOutputFormat(device_.get()); |
| if (!egl_image_format_fourcc_) { |
| VLOGF(1) << "Can't find a usable output format from image processor"; |
| return false; |
| } |
| image_processor_device_ = V4L2Device::Create(); |
| if (!image_processor_device_) { |
| VLOGF(1) << "Could not create a V4L2Device for image processor"; |
| return false; |
| } |
| } else { |
| egl_image_format_fourcc_ = output_format_fourcc_; |
| } |
| VLOGF(2) << "Output format=" << output_format_fourcc_->ToString(); |
| |
| // Just set the fourcc for output; resolution, etc., will come from the |
| // driver once it extracts it from the stream. |
| memset(&format, 0, sizeof(format)); |
| format.type = V4L2_BUF_TYPE_VIDEO_CAPTURE_MPLANE; |
| format.fmt.pix_mp.pixelformat = output_format_fourcc_->ToV4L2PixFmt(); |
| IOCTL_OR_ERROR_RETURN_FALSE(VIDIOC_S_FMT, &format); |
| DCHECK_EQ(format.fmt.pix_mp.pixelformat, |
| output_format_fourcc_->ToV4L2PixFmt()); |
| |
| return true; |
| } |
| |
| bool V4L2VideoDecodeAccelerator::ResetImageProcessor() { |
| VLOGF(2); |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| |
| if (!image_processor_->Reset()) |
| return false; |
| |
| while (!buffers_at_ip_.empty()) |
| buffers_at_ip_.pop(); |
| |
| return true; |
| } |
| |
| bool V4L2VideoDecodeAccelerator::CreateImageProcessor() { |
| VLOGF(2); |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| DCHECK(!image_processor_); |
| const ImageProcessor::OutputMode image_processor_output_mode = |
| (output_mode_ == Config::OutputMode::ALLOCATE |
| ? ImageProcessor::OutputMode::ALLOCATE |
| : ImageProcessor::OutputMode::IMPORT); |
| |
| // Start with a brand new image processor device, since the old one was |
| // already opened and attempting to open it again is not supported. |
| image_processor_device_ = V4L2Device::Create(); |
| if (!image_processor_device_) { |
| VLOGF(1) << "Could not create a V4L2Device for image processor"; |
| return false; |
| } |
| |
| image_processor_ = v4l2_vda_helpers::CreateImageProcessor( |
| *output_format_fourcc_, *egl_image_format_fourcc_, coded_size_, |
| egl_image_size_, visible_size_, VideoFrame::StorageType::STORAGE_DMABUFS, |
| output_buffer_map_.size(), image_processor_device_, |
| image_processor_output_mode, decoder_thread_.task_runner(), |
| // Unretained(this) is safe for ErrorCB because |decoder_thread_| is owned |
| // by this V4L2VideoDecodeAccelerator and |this| must be valid when |
| // ErrorCB is executed. |
| base::BindRepeating(&V4L2VideoDecodeAccelerator::ImageProcessorError, |
| base::Unretained(this))); |
| |
| if (!image_processor_) { |
| VLOGF(1) << "Error creating image processor"; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| return false; |
| } |
| |
| return true; |
| } |
| |
| bool V4L2VideoDecodeAccelerator::ProcessFrame(int32_t bitstream_buffer_id, |
| V4L2ReadableBufferRef buf) { |
| DVLOGF(4); |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| |
| OutputRecord& output_record = output_buffer_map_[buf->BufferId()]; |
| |
| scoped_refptr<VideoFrame> input_frame = buf->GetVideoFrame(); |
| if (!input_frame) { |
| VLOGF(1) << "Could not get the input frame for the image processor!"; |
| return false; |
| } |
| |
| // The |input_frame| has a potentially incorrect visible rectangle and natural |
| // size: that frame gets created by V4L2Buffer::CreateVideoFrame() which uses |
| // v4l2_format::fmt.pix_mp.width and v4l2_format::fmt.pix_mp.height as the |
| // visible rectangle and natural size. However, those dimensions actually |
| // correspond to the coded size. Therefore, we should wrap |input_frame| into |
| // another frame with the right visible rectangle and natural size. |
| DCHECK(input_frame->visible_rect().origin().IsOrigin()); |
| const gfx::Rect visible_rect = image_processor_->input_config().visible_rect; |
| const gfx::Size natural_size = visible_rect.size(); |
| if (!gfx::Rect(input_frame->coded_size()).Contains(visible_rect) || |
| !input_frame->visible_rect().Contains(visible_rect)) { |
| VLOGF(1) << "The visible size is too large!"; |
| return false; |
| } |
| if (!gfx::Rect(input_frame->natural_size()) |
| .Contains(gfx::Rect(natural_size))) { |
| VLOGF(1) << "The natural size is too large!"; |
| return false; |
| } |
| scoped_refptr<VideoFrame> cropped_input_frame = VideoFrame::WrapVideoFrame( |
| input_frame, input_frame->format(), visible_rect, natural_size); |
| if (!cropped_input_frame) { |
| VLOGF(1) << "Could not wrap the input frame for the image processor!"; |
| return false; |
| } |
| |
| // Keep reference to the IP input until the frame is processed |
| buffers_at_ip_.push(std::make_pair(bitstream_buffer_id, buf)); |
| |
| // Unretained(this) is safe for FrameReadyCB because |decoder_thread_| is |
| // owned by this V4L2VideoDecodeAccelerator and |this| must be valid when |
| // FrameReadyCB is executed. |
| if (image_processor_->output_mode() == ImageProcessor::OutputMode::IMPORT) { |
| image_processor_->Process( |
| cropped_input_frame, output_record.output_frame, |
| base::BindOnce(&V4L2VideoDecodeAccelerator::FrameProcessed, |
| base::Unretained(this), bitstream_buffer_id, |
| buf->BufferId())); |
| } else { |
| image_processor_->Process( |
| cropped_input_frame, |
| base::BindOnce(&V4L2VideoDecodeAccelerator::FrameProcessed, |
| base::Unretained(this), bitstream_buffer_id)); |
| } |
| return true; |
| } |
| |
| bool V4L2VideoDecodeAccelerator::CreateOutputBuffers() { |
| VLOGF(2); |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| DCHECK(decoder_state_ == kInitialized || |
| decoder_state_ == kChangingResolution); |
| DCHECK(output_queue_); |
| DCHECK(!output_queue_->IsStreaming()); |
| DCHECK(output_buffer_map_.empty()); |
| |
| // Number of output buffers we need. |
| auto ctrl = device_->GetCtrl(V4L2_CID_MIN_BUFFERS_FOR_CAPTURE); |
| if (!ctrl) |
| return false; |
| output_dpb_size_ = ctrl->value; |
| |
| // Output format setup in Initialize(). |
| |
| uint32_t buffer_count = output_dpb_size_ + kDpbOutputBufferExtraCount; |
| if (image_processor_device_) |
| buffer_count += kDpbOutputBufferExtraCountForImageProcessor; |
| |
| DVLOGF(3) << "buffer_count=" << buffer_count |
| << ", coded_size=" << egl_image_size_.ToString(); |
| |
| // With ALLOCATE mode the client can sample it as RGB and doesn't need to |
| // know the precise format. |
| VideoPixelFormat pixel_format = |
| (output_mode_ == Config::OutputMode::IMPORT) |
| ? egl_image_format_fourcc_->ToVideoPixelFormat() |
| : PIXEL_FORMAT_UNKNOWN; |
| |
| child_task_runner_->PostTask( |
| FROM_HERE, |
| base::BindOnce(&Client::ProvidePictureBuffersWithVisibleRect, client_, |
| buffer_count, pixel_format, 1, egl_image_size_, |
| gfx::Rect(visible_size_), device_->GetTextureTarget())); |
| |
| // Go into kAwaitingPictureBuffers to prevent us from doing any more decoding |
| // or event handling while we are waiting for AssignPictureBuffers(). Not |
| // having Pictures available would not have prevented us from making decoding |
| // progress entirely e.g. in the case of H.264 where we could further decode |
| // non-slice NALUs and could even get another resolution change before we were |
| // done with this one. After we get the buffers, we'll go back into kIdle and |
| // kick off further event processing, and eventually go back into kDecoding |
| // once no more events are pending (if any). |
| decoder_state_ = kAwaitingPictureBuffers; |
| |
| return true; |
| } |
| |
| void V4L2VideoDecodeAccelerator::DestroyInputBuffers() { |
| VLOGF(2); |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| |
| if (!input_queue_) |
| return; |
| |
| input_queue_->DeallocateBuffers(); |
| } |
| |
| bool V4L2VideoDecodeAccelerator::DestroyOutputBuffers() { |
| VLOGF(2); |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| DCHECK(!output_queue_ || !output_queue_->IsStreaming()); |
| bool success = true; |
| |
| if (!output_queue_ || output_buffer_map_.empty()) |
| return true; |
| |
| // Release all buffers waiting for an import buffer event |
| output_wait_map_.clear(); |
| |
| for (size_t i = 0; i < output_buffer_map_.size(); ++i) { |
| OutputRecord& output_record = output_buffer_map_[i]; |
| |
| if (output_record.egl_image != EGL_NO_IMAGE_KHR) { |
| child_task_runner_->PostTask( |
| FROM_HERE, |
| base::BindOnce(base::IgnoreResult(&V4L2Device::DestroyEGLImage), |
| device_, egl_display_, output_record.egl_image)); |
| } |
| |
| DVLOGF(3) << "dismissing PictureBuffer id=" << output_record.picture_id; |
| child_task_runner_->PostTask( |
| FROM_HERE, base::BindOnce(&Client::DismissPictureBuffer, client_, |
| output_record.picture_id)); |
| } |
| |
| while (!buffers_awaiting_fence_.empty()) |
| buffers_awaiting_fence_.pop(); |
| |
| if (!output_queue_->DeallocateBuffers()) { |
| LOG(ERROR) << "Failed deallocating output buffers"; |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| success = false; |
| } |
| |
| output_buffer_map_.clear(); |
| |
| return success; |
| } |
| |
| void V4L2VideoDecodeAccelerator::SendBufferToClient( |
| size_t output_buffer_index, |
| int32_t bitstream_buffer_id, |
| V4L2ReadableBufferRef vda_buffer, |
| scoped_refptr<VideoFrame> frame) { |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| DCHECK_GE(bitstream_buffer_id, 0); |
| OutputRecord& output_record = output_buffer_map_[output_buffer_index]; |
| |
| DCHECK_EQ(buffers_at_client_.count(output_record.picture_id), 0u); |
| // We need to keep the VDA buffer for now, as the IP still needs to be told |
| // which buffer to use so we cannot use this buffer index before the client |
| // has returned the corresponding IP buffer. |
| buffers_at_client_.emplace( |
| output_record.picture_id, |
| std::make_pair(std::move(vda_buffer), std::move(frame))); |
| // TODO(hubbe): Insert correct color space. http://crbug.com/647725 |
| const Picture picture(output_record.picture_id, bitstream_buffer_id, |
| gfx::Rect(visible_size_), gfx::ColorSpace(), false); |
| pending_picture_ready_.emplace(output_record.cleared, picture); |
| SendPictureReady(); |
| // This picture will be cleared next time we see it. |
| output_record.cleared = true; |
| } |
| |
| void V4L2VideoDecodeAccelerator::SendPictureReady() { |
| DVLOGF(4); |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| bool send_now = (decoder_state_ == kChangingResolution || |
| decoder_state_ == kResetting || decoder_flushing_); |
| while (pending_picture_ready_.size() > 0) { |
| bool cleared = pending_picture_ready_.front().cleared; |
| const Picture& picture = pending_picture_ready_.front().picture; |
| if (cleared && picture_clearing_count_ == 0) { |
| // This picture is cleared. It can be posted to a thread different than |
| // the main GPU thread to reduce latency. This should be the case after |
| // all pictures are cleared at the beginning. |
| decode_task_runner_->PostTask( |
| FROM_HERE, |
| base::BindOnce(&Client::PictureReady, decode_client_, picture)); |
| pending_picture_ready_.pop(); |
| } else if (!cleared || send_now) { |
| DVLOGF(4) << "cleared=" << pending_picture_ready_.front().cleared |
| << ", decoder_state_=" << decoder_state_ |
| << ", decoder_flushing_=" << decoder_flushing_ |
| << ", picture_clearing_count_=" << picture_clearing_count_; |
| // If the picture is not cleared, post it to the child thread because it |
| // has to be cleared in the child thread. A picture only needs to be |
| // cleared once. If the decoder is changing resolution, resetting or |
| // flushing, send all pictures to ensure PictureReady arrive before |
| // ProvidePictureBuffers, NotifyResetDone, or NotifyFlushDone. |
| child_task_runner_->PostTaskAndReply( |
| FROM_HERE, base::BindOnce(&Client::PictureReady, client_, picture), |
| // Unretained is safe. If Client::PictureReady gets to run, |this| is |
| // alive. Destroy() will wait the decode thread to finish. |
| base::BindOnce(&V4L2VideoDecodeAccelerator::PictureCleared, |
| base::Unretained(this))); |
| picture_clearing_count_++; |
| pending_picture_ready_.pop(); |
| } else { |
| // This picture is cleared. But some pictures are about to be cleared on |
| // the child thread. To preserve the order, do not send this until those |
| // pictures are cleared. |
| break; |
| } |
| } |
| } |
| |
| void V4L2VideoDecodeAccelerator::PictureCleared() { |
| DVLOGF(4) << "clearing count=" << picture_clearing_count_; |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| DCHECK_GT(picture_clearing_count_, 0); |
| picture_clearing_count_--; |
| SendPictureReady(); |
| } |
| |
| void V4L2VideoDecodeAccelerator::FrameProcessed( |
| int32_t bitstream_buffer_id, |
| size_t ip_buffer_index, |
| scoped_refptr<VideoFrame> frame) { |
| DVLOGF(4) << "ip_buffer_index=" << ip_buffer_index |
| << ", bitstream_buffer_id=" << bitstream_buffer_id; |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| // TODO(crbug.com/921825): Remove this workaround once reset callback is |
| // implemented. |
| if (buffers_at_ip_.empty() || |
| buffers_at_ip_.front().first != bitstream_buffer_id || |
| output_buffer_map_.empty()) { |
| // This can happen if image processor is reset. |
| // V4L2VideoDecodeAccelerator::Reset() makes |
| // |buffers_at_ip_| empty. |
| // During ImageProcessor::Reset(), some FrameProcessed() can have been |
| // posted to |decoder_thread|. |bitsream_buffer_id| is pushed to |
| // |buffers_at_ip_| in ProcessFrame(). Although we |
| // are not sure a new bitstream buffer id is pushed after Reset() and before |
| // FrameProcessed(), We should skip the case of mismatch of bitstream buffer |
| // id for safety. |
| // For |output_buffer_map_|, it is cleared in Destroy(). Destroy() destroys |
| // ImageProcessor which may call FrameProcessed() in parallel similar to |
| // Reset() case. |
| DVLOGF(4) << "Ignore processed frame for bitstream_buffer_id=" |
| << bitstream_buffer_id; |
| return; |
| } |
| DCHECK_GE(ip_buffer_index, 0u); |
| DCHECK_LT(ip_buffer_index, output_buffer_map_.size()); |
| |
| // This is the output record for the buffer received from the IP, which index |
| // may differ from the buffer used by the VDA. |
| OutputRecord& ip_output_record = output_buffer_map_[ip_buffer_index]; |
| DVLOGF(4) << "picture_id=" << ip_output_record.picture_id; |
| DCHECK_NE(ip_output_record.picture_id, -1); |
| |
| // If the picture has not been cleared yet, this means it is the first time |
| // we are seeing this buffer from the image processor. Schedule a call to |
| // CreateEGLImageFor before the picture is sent to the client. It is |
| // guaranteed that CreateEGLImageFor will complete before the picture is sent |
| // to the client as both events happen on the child thread due to the picture |
| // uncleared status. |
| if (ip_output_record.texture_id != 0 && !ip_output_record.cleared) { |
| DCHECK(frame->HasDmaBufs()); |
| |
| child_task_runner_->PostTask( |
| FROM_HERE, |
| base::BindOnce( |
| &V4L2VideoDecodeAccelerator::CreateEGLImageFor, weak_this_, |
| image_processor_device_, ip_buffer_index, |
| ip_output_record.picture_id, |
| CreateGpuMemoryBufferHandle(frame.get()).native_pixmap_handle, |
| ip_output_record.texture_id, visible_size_, |
| *egl_image_format_fourcc_)); |
| } |
| |
| // Remove our job from the IP jobs queue |
| DCHECK_GT(buffers_at_ip_.size(), 0u); |
| DCHECK(buffers_at_ip_.front().first == bitstream_buffer_id); |
| // This is the VDA buffer used as input of the IP. |
| V4L2ReadableBufferRef vda_buffer = std::move(buffers_at_ip_.front().second); |
| buffers_at_ip_.pop(); |
| |
| SendBufferToClient(ip_buffer_index, bitstream_buffer_id, |
| std::move(vda_buffer), std::move(frame)); |
| // Flush or resolution change may be waiting image processor to finish. |
| if (buffers_at_ip_.empty()) { |
| NotifyFlushDoneIfNeeded(); |
| if (decoder_state_ == kChangingResolution) |
| StartResolutionChange(); |
| } |
| } |
| |
| // Error handler for the image processor (the caller is not visible in this |
| // part of the file; presumably it is installed as the image processor's |
| // error callback -- TODO confirm). Logs the failure and moves the decoder |
| // into the PLATFORM_FAILURE error state. |
| void V4L2VideoDecodeAccelerator::ImageProcessorError() { |
| // This method is expected to run on |decoder_thread_| only. |
| DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| VLOGF(1) << "Image processor error"; |
| // NOTIFY_ERROR logs the error code and then calls SetErrorState() with it. |
| NOTIFY_ERROR(PLATFORM_FAILURE); |
| } |
| |
| // Reports the state of the V4L2 input and output queues into |pmd|. |
| // |
| // A single allocator dump named "gpu/v4l2/decoder/0x<address of this>" is |
| // created. For each queue it records the number of allocated buffers, the |
| // V4L2 memory type as a string, and the memory usage in bytes. The dump's |
| // overall size is the sum of both queues' memory usage. A queue that does |
| // not exist contributes zero counts and an empty memory type string. |
| // |
| // |args| is not used. Always returns true. |
| bool V4L2VideoDecodeAccelerator::OnMemoryDump( |
|     const base::trace_event::MemoryDumpArgs& args, |
|     base::trace_event::ProcessMemoryDump* pmd) { |
|   // OnMemoryDump() must be performed on |decoder_thread_|. |
|   DCHECK(decoder_thread_.task_runner()->BelongsToCurrentThread()); |
| |
|   // |input_queue_| and |output_queue_| are owned by |decoder_thread_|. |
|   size_t input_queue_buffers_count = 0; |
|   size_t input_queue_memory_usage = 0; |
|   std::string input_queue_buffers_memory_type; |
|   if (input_queue_) { |
|     input_queue_buffers_count = input_queue_->AllocatedBuffersCount(); |
|     input_queue_buffers_memory_type = |
|         V4L2MemoryToString(input_queue_->GetMemoryType()); |
|     // Memory usage is only reported for MMAP queues. The check must be made |
|     // against the input queue itself: consulting |output_queue_| here would |
|     // dereference it without a null check and would gate the input queue's |
|     // accounting on the wrong queue's memory type. |
|     if (input_queue_->GetMemoryType() == V4L2_MEMORY_MMAP) |
|       input_queue_memory_usage = input_queue_->GetMemoryUsage(); |
|   } |
| |
|   size_t output_queue_buffers_count = 0; |
|   size_t output_queue_memory_usage = 0; |
|   std::string output_queue_buffers_memory_type; |
|   if (output_queue_) { |
|     output_queue_buffers_count = output_queue_->AllocatedBuffersCount(); |
|     output_queue_buffers_memory_type = |
|         V4L2MemoryToString(output_queue_->GetMemoryType()); |
|     // As for the input queue, only MMAP memory is reported. |
|     if (output_queue_->GetMemoryType() == V4L2_MEMORY_MMAP) |
|       output_queue_memory_usage = output_queue_->GetMemoryUsage(); |
|   } |
| |
|   const size_t total_usage = |
|       input_queue_memory_usage + output_queue_memory_usage; |
| |
|   using ::base::trace_event::MemoryAllocatorDump; |
| |
|   // The dump name embeds the address of this object, so each decoder |
|   // instance gets its own dump entry. |
|   auto dump_name = base::StringPrintf("gpu/v4l2/decoder/0x%" PRIxPTR, |
|                                       reinterpret_cast<uintptr_t>(this)); |
|   MemoryAllocatorDump* dump = pmd->CreateAllocatorDump(dump_name); |
|   dump->AddScalar(MemoryAllocatorDump::kNameSize, |
|                   MemoryAllocatorDump::kUnitsBytes, |
|                   static_cast<uint64_t>(total_usage)); |
|   dump->AddScalar("input_queue_memory_usage", MemoryAllocatorDump::kUnitsBytes, |
|                   static_cast<uint64_t>(input_queue_memory_usage)); |
|   dump->AddScalar("input_queue_buffers_count", |
|                   MemoryAllocatorDump::kUnitsObjects, |
|                   static_cast<uint64_t>(input_queue_buffers_count)); |
|   dump->AddString("input_queue_buffers_memory_type", "", |
|                   input_queue_buffers_memory_type); |
|   dump->AddScalar("output_queue_memory_usage", MemoryAllocatorDump::kUnitsBytes, |
|                   static_cast<uint64_t>(output_queue_memory_usage)); |
|   dump->AddScalar("output_queue_buffers_count", |
|                   MemoryAllocatorDump::kUnitsObjects, |
|                   static_cast<uint64_t>(output_queue_buffers_count)); |
|   dump->AddString("output_queue_buffers_memory_type", "", |
|                   output_queue_buffers_memory_type); |
| |
|   return true; |
| } |
| |
| } // namespace media |