| // Copyright (c) 2012 The Chromium Authors. All rights reserved. |
| // Use of this source code is governed by a BSD-style license that can be |
| // found in the LICENSE file. |
| |
| #ifndef MEDIA_BASE_AUDIO_PARAMETERS_H_ |
| #define MEDIA_BASE_AUDIO_PARAMETERS_H_ |
| |
| #include <stdint.h> |
| #include <string> |
| #include <vector> |
| |
| #include "base/compiler_specific.h" |
| #include "base/numerics/checked_math.h" |
| #include "base/time/time.h" |
| #include "build/build_config.h" |
| #include "media/base/audio_bus.h" |
| #include "media/base/audio_latency.h" |
| #include "media/base/audio_point.h" |
| #include "media/base/channel_layout.h" |
| #include "media/base/media_shmem_export.h" |
| #include "media/base/sample_format.h" |
| #include "third_party/abseil-cpp/absl/types/optional.h" |
| |
| namespace media { |
| |
| // Use a struct-in-struct approach to ensure that we can calculate the required |
| // size as sizeof(Audio{Input,Output}BufferParameters) + #(bytes in audio |
| // buffer) without using packing. Also align Audio{Input,Output}BufferParameters |
| // instead of in Audio{Input,Output}Buffer to be able to calculate size like so. |
| // Use a macro for the alignment value that's the same as |
| // AudioBus::kChannelAlignment, since MSVC doesn't accept the latter to be used. |
| #if defined(OS_WIN) |
| #pragma warning(push) |
| #pragma warning(disable : 4324) // Disable warning for added padding. |
| #endif |
| #define PARAMETERS_ALIGNMENT 16 |
| static_assert(AudioBus::kChannelAlignment == PARAMETERS_ALIGNMENT, |
| "Audio buffer parameters struct alignment not same as AudioBus"); |
| // ****WARNING****: Do not change the field types or ordering of these fields |
| // without checking that alignment is correct. The structs may be concurrently |
| // accessed by both 32bit and 64bit process in shmem. http://crbug.com/781095. |
| struct MEDIA_SHMEM_EXPORT ALIGNAS(PARAMETERS_ALIGNMENT) |
| AudioInputBufferParameters { |
| double volume; |
| int64_t capture_time_us; // base::TimeTicks in microseconds. |
| uint32_t size; |
| uint32_t id; |
| bool key_pressed; |
| }; |
| struct MEDIA_SHMEM_EXPORT ALIGNAS(PARAMETERS_ALIGNMENT) |
| AudioOutputBufferParameters { |
| int64_t delay_us; // base::TimeDelta in microseconds. |
| int64_t delay_timestamp_us; // base::TimeTicks in microseconds. |
| uint32_t frames_skipped; |
| uint32_t bitstream_data_size; |
| uint32_t bitstream_frames; |
| }; |
| #undef PARAMETERS_ALIGNMENT |
| #if defined(OS_WIN) |
| #pragma warning(pop) |
| #endif |
| |
| static_assert(sizeof(AudioInputBufferParameters) % |
| AudioBus::kChannelAlignment == |
| 0, |
| "AudioInputBufferParameters not aligned"); |
| static_assert(sizeof(AudioOutputBufferParameters) % |
| AudioBus::kChannelAlignment == |
| 0, |
| "AudioOutputBufferParameters not aligned"); |
| |
| struct MEDIA_SHMEM_EXPORT AudioInputBuffer { |
| AudioInputBufferParameters params; |
| int8_t audio[1]; |
| }; |
| struct MEDIA_SHMEM_EXPORT AudioOutputBuffer { |
| AudioOutputBufferParameters params; |
| int8_t audio[1]; |
| }; |
| |
| struct MEDIA_SHMEM_EXPORT AudioRendererAlgorithmParameters { |
| // The maximum size for the audio buffer. |
| base::TimeDelta max_capacity; |
| |
| // The minimum size for the audio buffer. |
| base::TimeDelta starting_capacity; |
| |
| // The minimum size for the audio buffer for encrypted streams. |
| // Set this to be larger than |max_capacity| because the |
| // performance of encrypted playback is always worse than clear playback, due |
| // to decryption and potentially IPC overhead. For the context, see |
| // https://crbug.com/403462, https://crbug.com/718161 and |
| // https://crbug.com/879970. |
| base::TimeDelta starting_capacity_for_encrypted; |
| }; |
| |
| // These convenience function safely computes the size required for |
| // |shared_memory_count| AudioInputBuffers, with enough memory for AudioBus |
| // data, using |paremeters| (or alternatively |channels| and |frames|). The |
| // functions not returning a CheckedNumeric will CHECK on overflow. |
| MEDIA_SHMEM_EXPORT base::CheckedNumeric<uint32_t> |
| ComputeAudioInputBufferSizeChecked(const AudioParameters& parameters, |
| uint32_t audio_bus_count); |
| |
| MEDIA_SHMEM_EXPORT uint32_t |
| ComputeAudioInputBufferSize(const AudioParameters& parameters, |
| uint32_t audio_bus_count); |
| |
| MEDIA_SHMEM_EXPORT uint32_t |
| ComputeAudioInputBufferSize(int channels, int frames, uint32_t audio_bus_count); |
| |
| // These convenience functions safely computes the size required for an |
| // AudioOutputBuffer with enough memory for AudioBus data using |parameters| (or |
| // alternatively |channels| and |frames|). The functions not returning a |
| // CheckedNumeric will CHECK on overflow. |
| MEDIA_SHMEM_EXPORT base::CheckedNumeric<uint32_t> |
| ComputeAudioOutputBufferSizeChecked(const AudioParameters& parameters); |
| |
| MEDIA_SHMEM_EXPORT uint32_t |
| ComputeAudioOutputBufferSize(const AudioParameters& parameters); |
| |
| MEDIA_SHMEM_EXPORT uint32_t ComputeAudioOutputBufferSize(int channels, |
| int frames); |
| |
| class MEDIA_SHMEM_EXPORT AudioParameters { |
| public: |
| // TODO(miu): Rename this enum to something that correctly reflects its |
| // semantics, such as "TransportScheme." |
| enum Format { |
| AUDIO_PCM_LINEAR = 0, // PCM is 'raw' amplitude samples. |
| AUDIO_PCM_LOW_LATENCY, // Linear PCM, low latency requested. |
| AUDIO_BITSTREAM_AC3, // Compressed AC3 bitstream. |
| AUDIO_BITSTREAM_EAC3, // Compressed E-AC3 bitstream. |
| AUDIO_FAKE, // Creates a fake AudioOutputStream object. |
| AUDIO_FORMAT_LAST = AUDIO_FAKE, // Only used for validation of format. |
| }; |
| |
| enum { |
| // Telephone quality sample rate, mostly for speech-only audio. |
| kTelephoneSampleRate = 8000, |
| // CD sampling rate is 44.1 KHz or conveniently 2x2x3x3x5x5x7x7. |
| kAudioCDSampleRate = 44100, |
| }; |
| |
| enum { |
| // The maxmium number of PCM frames can be decoded out of a compressed |
| // audio frame, e.g. MP3, AAC, AC-3. |
| kMaxFramesPerCompressedAudioBuffer = 4096, |
| }; |
| |
| // Bitmasks to determine whether certain platform (typically hardware) audio |
| // effects should be enabled. |
| enum PlatformEffectsMask { |
| NO_EFFECTS = 0x0, |
| ECHO_CANCELLER = 1 << 0, |
| DUCKING = 1 << 1, // Enables ducking if the OS supports it. |
| KEYBOARD_MIC = 1 << 2, |
| HOTWORD = 1 << 3, |
| NOISE_SUPPRESSION = 1 << 4, |
| AUTOMATIC_GAIN_CONTROL = 1 << 5, |
| EXPERIMENTAL_ECHO_CANCELLER = 1 << 6, // Indicates an echo canceller is |
| // available that should only |
| // experimentally be enabled. |
| MULTIZONE = 1 << 7, |
| AUDIO_PREFETCH = 1 << 8, |
| }; |
| |
| struct HardwareCapabilities { |
| HardwareCapabilities(int min_frames_per_buffer, int max_frames_per_buffer) |
| : min_frames_per_buffer(min_frames_per_buffer), |
| max_frames_per_buffer(max_frames_per_buffer) {} |
| HardwareCapabilities() |
| : min_frames_per_buffer(0), max_frames_per_buffer(0) {} |
| |
| // Minimum and maximum buffer sizes supported by the audio hardware. Opening |
| // a device with frames_per_buffer set to a value between min and max should |
| // result in the audio hardware running close to this buffer size, values |
| // above or below will be clamped to the min or max by the audio system. |
| // Either value can be 0 and means that the min or max is not known. |
| int min_frames_per_buffer; |
| int max_frames_per_buffer; |
| }; |
| |
| AudioParameters(); |
| AudioParameters(Format format, |
| ChannelLayout channel_layout, |
| int sample_rate, |
| int frames_per_buffer); |
| AudioParameters(Format format, |
| ChannelLayout channel_layout, |
| int sample_rate, |
| int frames_per_buffer, |
| const HardwareCapabilities& hardware_capabilities); |
| |
| ~AudioParameters(); |
| |
| // Re-initializes all members except for |hardware_capabilities_|. |
| void Reset(Format format, |
| ChannelLayout channel_layout, |
| int sample_rate, |
| int frames_per_buffer); |
| |
| // Checks that all values are in the expected range. All limits are specified |
| // in media::Limits. |
| bool IsValid() const; |
| |
| // Returns a human-readable string describing |*this|. For debugging & test |
| // output only. |
| std::string AsHumanReadableString() const; |
| |
| // Returns size of audio buffer in bytes when using |fmt| for samples. |
| int GetBytesPerBuffer(SampleFormat fmt) const; |
| |
| // Returns the number of bytes representing a frame of audio when using |fmt| |
| // for samples. |
| int GetBytesPerFrame(SampleFormat fmt) const; |
| |
| // Returns the number of microseconds per frame of audio. Intentionally |
| // reported as a double to surface of partial microseconds per frame, which |
| // is common for many sample rates. Failing to account for these nanoseconds |
| // can lead to audio/video sync drift. |
| double GetMicrosecondsPerFrame() const; |
| |
| // Returns the duration of this buffer as calculated from frames_per_buffer() |
| // and sample_rate(). |
| base::TimeDelta GetBufferDuration() const; |
| |
| // Comparison with other AudioParams. |
| bool Equals(const AudioParameters& other) const; |
| |
| // Return true if |format_| is compressed bitstream. |
| bool IsBitstreamFormat() const; |
| |
| void set_format(Format format) { format_ = format; } |
| Format format() const { return format_; } |
| |
| // A setter for channel_layout_ is intentionally excluded. |
| ChannelLayout channel_layout() const { return channel_layout_; } |
| |
| // The number of channels is usually computed from channel_layout_. Setting |
| // this explicitly is only required with CHANNEL_LAYOUT_DISCRETE. |
| void set_channels_for_discrete(int channels) { |
| DCHECK(channel_layout_ == CHANNEL_LAYOUT_DISCRETE || |
| channels == ChannelLayoutToChannelCount(channel_layout_)); |
| channels_ = channels; |
| } |
| int channels() const { return channels_; } |
| |
| void set_sample_rate(int sample_rate) { sample_rate_ = sample_rate; } |
| int sample_rate() const { return sample_rate_; } |
| |
| void set_frames_per_buffer(int frames_per_buffer) { |
| frames_per_buffer_ = frames_per_buffer; |
| } |
| int frames_per_buffer() const { return frames_per_buffer_; } |
| |
| absl::optional<HardwareCapabilities> hardware_capabilities() const { |
| return hardware_capabilities_; |
| } |
| |
| void set_effects(int effects) { effects_ = effects; } |
| int effects() const { return effects_; } |
| |
| void set_mic_positions(const std::vector<Point>& mic_positions) { |
| mic_positions_ = mic_positions; |
| } |
| const std::vector<Point>& mic_positions() const { return mic_positions_; } |
| |
| void set_latency_tag(AudioLatency::LatencyType latency_tag) { |
| latency_tag_ = latency_tag; |
| } |
| AudioLatency::LatencyType latency_tag() const { return latency_tag_; } |
| |
| AudioParameters(const AudioParameters&); |
| AudioParameters& operator=(const AudioParameters&); |
| |
| // Creates reasonable dummy parameters in case no device is available. |
| static AudioParameters UnavailableDeviceParams(); |
| |
| private: |
| Format format_; // Format of the stream. |
| ChannelLayout channel_layout_; // Order of surround sound channels. |
| int channels_; // Number of channels. Value set based on |
| // |channel_layout|. |
| int sample_rate_; // Sampling frequency/rate. |
| int frames_per_buffer_; // Number of frames in a buffer. |
| int effects_; // Bitmask using PlatformEffectsMask. |
| |
| // Microphone positions using Cartesian coordinates: |
| // x: the horizontal dimension, with positive to the right from the camera's |
| // perspective. |
| // y: the depth dimension, with positive forward from the camera's |
| // perspective. |
| // z: the vertical dimension, with positive upwards. |
| // |
| // Usually, the center of the microphone array will be treated as the origin |
| // (often the position of the camera). |
| // |
| // An empty vector indicates unknown positions. |
| std::vector<Point> mic_positions_; |
| |
| // Optional tag to pass latency info from renderer to browser. Set to |
| // AudioLatency::LATENCY_COUNT by default, which means "not specified". |
| AudioLatency::LatencyType latency_tag_; |
| |
| // Audio hardware specific parameters, these are treated as read-only and |
| // changing them has no effect. |
| absl::optional<HardwareCapabilities> hardware_capabilities_; |
| }; |
| |
| // Comparison is useful when AudioParameters is used with std structures. |
| inline bool operator<(const AudioParameters& a, const AudioParameters& b) { |
| if (a.format() != b.format()) |
| return a.format() < b.format(); |
| if (a.channels() != b.channels()) |
| return a.channels() < b.channels(); |
| if (a.sample_rate() != b.sample_rate()) |
| return a.sample_rate() < b.sample_rate(); |
| return a.frames_per_buffer() < b.frames_per_buffer(); |
| } |
| |
| } // namespace media |
| |
| #endif // MEDIA_BASE_AUDIO_PARAMETERS_H_ |