// Copyright (c) 2012 The Chromium Authors. All rights reserved. // Use of this source code is governed by a BSD-style license that can be // found in the LICENSE file. #ifndef MEDIA_BASE_AUDIO_PARAMETERS_H_ #define MEDIA_BASE_AUDIO_PARAMETERS_H_ #include #include #include #include "base/compiler_specific.h" #include "base/numerics/checked_math.h" #include "base/time/time.h" #include "build/build_config.h" #include "media/base/audio_bus.h" #include "media/base/audio_latency.h" #include "media/base/audio_point.h" #include "media/base/channel_layout.h" #include "media/base/media_shmem_export.h" #include "media/base/sample_format.h" #include "third_party/abseil-cpp/absl/types/optional.h" namespace media { // Use a struct-in-struct approach to ensure that we can calculate the required // size as sizeof(Audio{Input,Output}BufferParameters) + #(bytes in audio // buffer) without using packing. Also align Audio{Input,Output}BufferParameters // instead of in Audio{Input,Output}Buffer to be able to calculate size like so. // Use a macro for the alignment value that's the same as // AudioBus::kChannelAlignment, since MSVC doesn't accept the latter to be used. #if defined(OS_WIN) #pragma warning(push) #pragma warning(disable : 4324) // Disable warning for added padding. #endif #define PARAMETERS_ALIGNMENT 16 static_assert(AudioBus::kChannelAlignment == PARAMETERS_ALIGNMENT, "Audio buffer parameters struct alignment not same as AudioBus"); // ****WARNING****: Do not change the field types or ordering of these fields // without checking that alignment is correct. The structs may be concurrently // accessed by both 32bit and 64bit process in shmem. http://crbug.com/781095. struct MEDIA_SHMEM_EXPORT ALIGNAS(PARAMETERS_ALIGNMENT) AudioInputBufferParameters { double volume; int64_t capture_time_us; // base::TimeTicks in microseconds. uint32_t size; uint32_t id; bool key_pressed; }; struct MEDIA_SHMEM_EXPORT ALIGNAS(PARAMETERS_ALIGNMENT) AudioOutputBufferParameters { int64_t delay_us; // base::TimeDelta in microseconds. int64_t delay_timestamp_us; // base::TimeTicks in microseconds. uint32_t frames_skipped; uint32_t bitstream_data_size; uint32_t bitstream_frames; }; #undef PARAMETERS_ALIGNMENT #if defined(OS_WIN) #pragma warning(pop) #endif static_assert(sizeof(AudioInputBufferParameters) % AudioBus::kChannelAlignment == 0, "AudioInputBufferParameters not aligned"); static_assert(sizeof(AudioOutputBufferParameters) % AudioBus::kChannelAlignment == 0, "AudioOutputBufferParameters not aligned"); struct MEDIA_SHMEM_EXPORT AudioInputBuffer { AudioInputBufferParameters params; int8_t audio[1]; }; struct MEDIA_SHMEM_EXPORT AudioOutputBuffer { AudioOutputBufferParameters params; int8_t audio[1]; }; struct MEDIA_SHMEM_EXPORT AudioRendererAlgorithmParameters { // The maximum size for the audio buffer. base::TimeDelta max_capacity; // The minimum size for the audio buffer. base::TimeDelta starting_capacity; // The minimum size for the audio buffer for encrypted streams. // Set this to be larger than |max_capacity| because the // performance of encrypted playback is always worse than clear playback, due // to decryption and potentially IPC overhead. For the context, see // https://crbug.com/403462, https://crbug.com/718161 and // https://crbug.com/879970. base::TimeDelta starting_capacity_for_encrypted; }; // These convenience function safely computes the size required for // |shared_memory_count| AudioInputBuffers, with enough memory for AudioBus // data, using |paremeters| (or alternatively |channels| and |frames|). The // functions not returning a CheckedNumeric will CHECK on overflow. MEDIA_SHMEM_EXPORT base::CheckedNumeric ComputeAudioInputBufferSizeChecked(const AudioParameters& parameters, uint32_t audio_bus_count); MEDIA_SHMEM_EXPORT uint32_t ComputeAudioInputBufferSize(const AudioParameters& parameters, uint32_t audio_bus_count); MEDIA_SHMEM_EXPORT uint32_t ComputeAudioInputBufferSize(int channels, int frames, uint32_t audio_bus_count); // These convenience functions safely computes the size required for an // AudioOutputBuffer with enough memory for AudioBus data using |parameters| (or // alternatively |channels| and |frames|). The functions not returning a // CheckedNumeric will CHECK on overflow. MEDIA_SHMEM_EXPORT base::CheckedNumeric ComputeAudioOutputBufferSizeChecked(const AudioParameters& parameters); MEDIA_SHMEM_EXPORT uint32_t ComputeAudioOutputBufferSize(const AudioParameters& parameters); MEDIA_SHMEM_EXPORT uint32_t ComputeAudioOutputBufferSize(int channels, int frames); class MEDIA_SHMEM_EXPORT AudioParameters { public: // TODO(miu): Rename this enum to something that correctly reflects its // semantics, such as "TransportScheme." enum Format { AUDIO_PCM_LINEAR = 0, // PCM is 'raw' amplitude samples. AUDIO_PCM_LOW_LATENCY, // Linear PCM, low latency requested. AUDIO_BITSTREAM_AC3, // Compressed AC3 bitstream. AUDIO_BITSTREAM_EAC3, // Compressed E-AC3 bitstream. AUDIO_FAKE, // Creates a fake AudioOutputStream object. AUDIO_FORMAT_LAST = AUDIO_FAKE, // Only used for validation of format. }; enum { // Telephone quality sample rate, mostly for speech-only audio. kTelephoneSampleRate = 8000, // CD sampling rate is 44.1 KHz or conveniently 2x2x3x3x5x5x7x7. kAudioCDSampleRate = 44100, }; enum { // The maxmium number of PCM frames can be decoded out of a compressed // audio frame, e.g. MP3, AAC, AC-3. kMaxFramesPerCompressedAudioBuffer = 4096, }; // Bitmasks to determine whether certain platform (typically hardware) audio // effects should be enabled. enum PlatformEffectsMask { NO_EFFECTS = 0x0, ECHO_CANCELLER = 1 << 0, DUCKING = 1 << 1, // Enables ducking if the OS supports it. KEYBOARD_MIC = 1 << 2, HOTWORD = 1 << 3, NOISE_SUPPRESSION = 1 << 4, AUTOMATIC_GAIN_CONTROL = 1 << 5, EXPERIMENTAL_ECHO_CANCELLER = 1 << 6, // Indicates an echo canceller is // available that should only // experimentally be enabled. MULTIZONE = 1 << 7, AUDIO_PREFETCH = 1 << 8, }; struct HardwareCapabilities { HardwareCapabilities(int min_frames_per_buffer, int max_frames_per_buffer) : min_frames_per_buffer(min_frames_per_buffer), max_frames_per_buffer(max_frames_per_buffer) {} HardwareCapabilities() : min_frames_per_buffer(0), max_frames_per_buffer(0) {} // Minimum and maximum buffer sizes supported by the audio hardware. Opening // a device with frames_per_buffer set to a value between min and max should // result in the audio hardware running close to this buffer size, values // above or below will be clamped to the min or max by the audio system. // Either value can be 0 and means that the min or max is not known. int min_frames_per_buffer; int max_frames_per_buffer; }; AudioParameters(); AudioParameters(Format format, ChannelLayout channel_layout, int sample_rate, int frames_per_buffer); AudioParameters(Format format, ChannelLayout channel_layout, int sample_rate, int frames_per_buffer, const HardwareCapabilities& hardware_capabilities); ~AudioParameters(); // Re-initializes all members except for |hardware_capabilities_|. void Reset(Format format, ChannelLayout channel_layout, int sample_rate, int frames_per_buffer); // Checks that all values are in the expected range. All limits are specified // in media::Limits. bool IsValid() const; // Returns a human-readable string describing |*this|. For debugging & test // output only. std::string AsHumanReadableString() const; // Returns size of audio buffer in bytes when using |fmt| for samples. int GetBytesPerBuffer(SampleFormat fmt) const; // Returns the number of bytes representing a frame of audio when using |fmt| // for samples. int GetBytesPerFrame(SampleFormat fmt) const; // Returns the number of microseconds per frame of audio. Intentionally // reported as a double to surface of partial microseconds per frame, which // is common for many sample rates. Failing to account for these nanoseconds // can lead to audio/video sync drift. double GetMicrosecondsPerFrame() const; // Returns the duration of this buffer as calculated from frames_per_buffer() // and sample_rate(). base::TimeDelta GetBufferDuration() const; // Comparison with other AudioParams. bool Equals(const AudioParameters& other) const; // Return true if |format_| is compressed bitstream. bool IsBitstreamFormat() const; void set_format(Format format) { format_ = format; } Format format() const { return format_; } // A setter for channel_layout_ is intentionally excluded. ChannelLayout channel_layout() const { return channel_layout_; } // The number of channels is usually computed from channel_layout_. Setting // this explicitly is only required with CHANNEL_LAYOUT_DISCRETE. void set_channels_for_discrete(int channels) { DCHECK(channel_layout_ == CHANNEL_LAYOUT_DISCRETE || channels == ChannelLayoutToChannelCount(channel_layout_)); channels_ = channels; } int channels() const { return channels_; } void set_sample_rate(int sample_rate) { sample_rate_ = sample_rate; } int sample_rate() const { return sample_rate_; } void set_frames_per_buffer(int frames_per_buffer) { frames_per_buffer_ = frames_per_buffer; } int frames_per_buffer() const { return frames_per_buffer_; } absl::optional hardware_capabilities() const { return hardware_capabilities_; } void set_effects(int effects) { effects_ = effects; } int effects() const { return effects_; } void set_mic_positions(const std::vector& mic_positions) { mic_positions_ = mic_positions; } const std::vector& mic_positions() const { return mic_positions_; } void set_latency_tag(AudioLatency::LatencyType latency_tag) { latency_tag_ = latency_tag; } AudioLatency::LatencyType latency_tag() const { return latency_tag_; } AudioParameters(const AudioParameters&); AudioParameters& operator=(const AudioParameters&); // Creates reasonable dummy parameters in case no device is available. static AudioParameters UnavailableDeviceParams(); private: Format format_; // Format of the stream. ChannelLayout channel_layout_; // Order of surround sound channels. int channels_; // Number of channels. Value set based on // |channel_layout|. int sample_rate_; // Sampling frequency/rate. int frames_per_buffer_; // Number of frames in a buffer. int effects_; // Bitmask using PlatformEffectsMask. // Microphone positions using Cartesian coordinates: // x: the horizontal dimension, with positive to the right from the camera's // perspective. // y: the depth dimension, with positive forward from the camera's // perspective. // z: the vertical dimension, with positive upwards. // // Usually, the center of the microphone array will be treated as the origin // (often the position of the camera). // // An empty vector indicates unknown positions. std::vector mic_positions_; // Optional tag to pass latency info from renderer to browser. Set to // AudioLatency::LATENCY_COUNT by default, which means "not specified". AudioLatency::LatencyType latency_tag_; // Audio hardware specific parameters, these are treated as read-only and // changing them has no effect. absl::optional hardware_capabilities_; }; // Comparison is useful when AudioParameters is used with std structures. inline bool operator<(const AudioParameters& a, const AudioParameters& b) { if (a.format() != b.format()) return a.format() < b.format(); if (a.channels() != b.channels()) return a.channels() < b.channels(); if (a.sample_rate() != b.sample_rate()) return a.sample_rate() < b.sample_rate(); return a.frames_per_buffer() < b.frames_per_buffer(); } } // namespace media #endif // MEDIA_BASE_AUDIO_PARAMETERS_H_