// audio_buffer.h revision 3551c9c881056c480085172ff9840cab31610854
17d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles)// Copyright 2013 The Chromium Authors. All rights reserved. 27d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles)// Use of this source code is governed by a BSD-style license that can be 37d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles)// found in the LICENSE file. 47d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) 57d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles)#ifndef MEDIA_BASE_AUDIO_BUFFER_H_ 67d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles)#define MEDIA_BASE_AUDIO_BUFFER_H_ 77d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) 87d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles)#include <vector> 97d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) 107d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles)#include "base/memory/aligned_memory.h" 117d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles)#include "base/memory/ref_counted.h" 127d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles)#include "base/memory/scoped_ptr.h" 13eb525c5499e34cc9c4b825d6d9e75bb07cc06aceBen Murdoch#include "base/time/time.h" 147d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles)#include "media/base/media_export.h" 157d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles)#include "media/base/sample_format.h" 167d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) 177d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles)namespace media { 187d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles)class AudioBus; 197d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) 207d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles)// An audio buffer that takes a copy of the data passed to it, holds it, and 217d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles)// copies it into an AudioBus when needed. 
Also supports an end of stream 227d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles)// marker. 237d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles)class MEDIA_EXPORT AudioBuffer 247d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) : public base::RefCountedThreadSafe<AudioBuffer> { 257d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) public: 263551c9c881056c480085172ff9840cab31610854Torne (Richard Coles) // Alignment of each channel's data; this must match what ffmpeg expects 273551c9c881056c480085172ff9840cab31610854Torne (Richard Coles) // (which may be 0, 16, or 32, depending on the processor). Selecting 32 in 283551c9c881056c480085172ff9840cab31610854Torne (Richard Coles) // order to work on all processors. 293551c9c881056c480085172ff9840cab31610854Torne (Richard Coles) enum { kChannelAlignment = 32 }; 303551c9c881056c480085172ff9840cab31610854Torne (Richard Coles) 317d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) // Create an AudioBuffer whose channel data is copied from |data|. For 327d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) // interleaved data, only the first buffer is used. For planar data, the 337d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) // number of buffers must be equal to |channel_count|. |frame_count| is the 347d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) // number of frames in each buffer. |data| must not be null and |frame_count| 357d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) // must be >= 0. 367d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) // 377d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) // TODO(jrummell): Compute duration rather than pass it in. 
387d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) static scoped_refptr<AudioBuffer> CopyFrom(SampleFormat sample_format, 397d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) int channel_count, 407d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) int frame_count, 417d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) const uint8* const* data, 427d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) const base::TimeDelta timestamp, 437d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) const base::TimeDelta duration); 447d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) 45a36e5920737c6adbddd3e43b760e5de8431db6e0Torne (Richard Coles) // Create an AudioBuffer with |frame_count| frames. Buffer is allocated, but 46a36e5920737c6adbddd3e43b760e5de8431db6e0Torne (Richard Coles) // not initialized. Timestamp and duration are set to kNoTimestamp(). 47a36e5920737c6adbddd3e43b760e5de8431db6e0Torne (Richard Coles) static scoped_refptr<AudioBuffer> CreateBuffer(SampleFormat sample_format, 48a36e5920737c6adbddd3e43b760e5de8431db6e0Torne (Richard Coles) int channel_count, 49a36e5920737c6adbddd3e43b760e5de8431db6e0Torne (Richard Coles) int frame_count); 50a36e5920737c6adbddd3e43b760e5de8431db6e0Torne (Richard Coles) 517dbb3d5cf0c15f500944d211057644d6a2f37371Ben Murdoch // Create an empty AudioBuffer with |frame_count| frames. 
527dbb3d5cf0c15f500944d211057644d6a2f37371Ben Murdoch static scoped_refptr<AudioBuffer> CreateEmptyBuffer( 537dbb3d5cf0c15f500944d211057644d6a2f37371Ben Murdoch int channel_count, 547dbb3d5cf0c15f500944d211057644d6a2f37371Ben Murdoch int frame_count, 557dbb3d5cf0c15f500944d211057644d6a2f37371Ben Murdoch const base::TimeDelta timestamp, 567dbb3d5cf0c15f500944d211057644d6a2f37371Ben Murdoch const base::TimeDelta duration); 577dbb3d5cf0c15f500944d211057644d6a2f37371Ben Murdoch 587d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) // Create a AudioBuffer indicating we've reached end of stream. 597d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) // Calling any method other than end_of_stream() on the resulting buffer 607d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) // is disallowed. 617d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) static scoped_refptr<AudioBuffer> CreateEOSBuffer(); 627d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) 637d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) // Copy frames into |dest|. |frames_to_copy| is the number of frames to copy. 647dbb3d5cf0c15f500944d211057644d6a2f37371Ben Murdoch // |source_frame_offset| specifies how many frames in the buffer to skip 657d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) // first. |dest_frame_offset| is the frame offset in |dest|. The frames are 667d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) // converted from their source format into planar float32 data (which is all 677d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) // that AudioBus handles). 
687d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) void ReadFrames(int frames_to_copy, 697d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) int source_frame_offset, 707d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) int dest_frame_offset, 717d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) AudioBus* dest); 727d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) 737dbb3d5cf0c15f500944d211057644d6a2f37371Ben Murdoch // Trim an AudioBuffer by removing |frames_to_trim| frames from the start. 74a36e5920737c6adbddd3e43b760e5de8431db6e0Torne (Richard Coles) // Timestamp and duration are adjusted to reflect the fewer frames. 757dbb3d5cf0c15f500944d211057644d6a2f37371Ben Murdoch // Note that repeated calls to TrimStart() may result in timestamp() and 767dbb3d5cf0c15f500944d211057644d6a2f37371Ben Murdoch // duration() being off by a few microseconds due to rounding issues. 777dbb3d5cf0c15f500944d211057644d6a2f37371Ben Murdoch void TrimStart(int frames_to_trim); 787dbb3d5cf0c15f500944d211057644d6a2f37371Ben Murdoch 79a36e5920737c6adbddd3e43b760e5de8431db6e0Torne (Richard Coles) // Trim an AudioBuffer by removing |frames_to_trim| frames from the end. 80a36e5920737c6adbddd3e43b760e5de8431db6e0Torne (Richard Coles) // Duration is adjusted to reflect the fewer frames. 81a36e5920737c6adbddd3e43b760e5de8431db6e0Torne (Richard Coles) void TrimEnd(int frames_to_trim); 82a36e5920737c6adbddd3e43b760e5de8431db6e0Torne (Richard Coles) 837dbb3d5cf0c15f500944d211057644d6a2f37371Ben Murdoch // Return the number of channels. 847dbb3d5cf0c15f500944d211057644d6a2f37371Ben Murdoch int channel_count() const { return channel_count_; } 857dbb3d5cf0c15f500944d211057644d6a2f37371Ben Murdoch 867d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) // Return the number of frames held. 
877dbb3d5cf0c15f500944d211057644d6a2f37371Ben Murdoch int frame_count() const { return adjusted_frame_count_; } 887d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) 897d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) // Access to constructor parameters. 907d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) base::TimeDelta timestamp() const { return timestamp_; } 917d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) base::TimeDelta duration() const { return duration_; } 927d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) 937dbb3d5cf0c15f500944d211057644d6a2f37371Ben Murdoch // TODO(jrummell): Remove set_timestamp() and set_duration() once 947dbb3d5cf0c15f500944d211057644d6a2f37371Ben Murdoch // DecryptingAudioDecoder::EnqueueFrames() is changed to set them when 957dbb3d5cf0c15f500944d211057644d6a2f37371Ben Murdoch // creating the buffer. See http://crbug.com/255261. 967dbb3d5cf0c15f500944d211057644d6a2f37371Ben Murdoch void set_timestamp(base::TimeDelta timestamp) { timestamp_ = timestamp; } 977dbb3d5cf0c15f500944d211057644d6a2f37371Ben Murdoch void set_duration(base::TimeDelta duration) { duration_ = duration; } 987dbb3d5cf0c15f500944d211057644d6a2f37371Ben Murdoch 997d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) // If there's no data in this buffer, it represents end of stream. 1007dbb3d5cf0c15f500944d211057644d6a2f37371Ben Murdoch bool end_of_stream() const { return end_of_stream_; } 1017d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) 102a36e5920737c6adbddd3e43b760e5de8431db6e0Torne (Richard Coles) // Access to the raw buffer for ffmpeg to write directly to. Data for planar 1033551c9c881056c480085172ff9840cab31610854Torne (Richard Coles) // data is grouped by channel. There is only 1 entry for interleaved formats. 
1043551c9c881056c480085172ff9840cab31610854Torne (Richard Coles) const std::vector<uint8*>& channel_data() const { return channel_data_; } 105a36e5920737c6adbddd3e43b760e5de8431db6e0Torne (Richard Coles) 1067d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) private: 1077d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) friend class base::RefCountedThreadSafe<AudioBuffer>; 1087d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) 1097d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) // Allocates aligned contiguous buffer to hold all channel data (1 block for 1107d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) // interleaved data, |channel_count| blocks for planar data), copies 111a36e5920737c6adbddd3e43b760e5de8431db6e0Torne (Richard Coles) // [data,data+data_size) to the allocated buffer(s). If |data| is null, no 112a36e5920737c6adbddd3e43b760e5de8431db6e0Torne (Richard Coles) // data is copied. If |create_buffer| is false, no data buffer is created (or 113a36e5920737c6adbddd3e43b760e5de8431db6e0Torne (Richard Coles) // copied to). 
1147d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) AudioBuffer(SampleFormat sample_format, 1157d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) int channel_count, 1167d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) int frame_count, 117a36e5920737c6adbddd3e43b760e5de8431db6e0Torne (Richard Coles) bool create_buffer, 1187d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) const uint8* const* data, 1197d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) const base::TimeDelta timestamp, 1207d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) const base::TimeDelta duration); 1217d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) 1227d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) virtual ~AudioBuffer(); 1237d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) 1247dbb3d5cf0c15f500944d211057644d6a2f37371Ben Murdoch const SampleFormat sample_format_; 1257dbb3d5cf0c15f500944d211057644d6a2f37371Ben Murdoch const int channel_count_; 1267dbb3d5cf0c15f500944d211057644d6a2f37371Ben Murdoch int adjusted_frame_count_; 1277dbb3d5cf0c15f500944d211057644d6a2f37371Ben Murdoch int trim_start_; 1287dbb3d5cf0c15f500944d211057644d6a2f37371Ben Murdoch const bool end_of_stream_; 1297d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) base::TimeDelta timestamp_; 1307d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) base::TimeDelta duration_; 1317d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) 1327d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) // Contiguous block of channel data. 1337d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) scoped_ptr_malloc<uint8, base::ScopedPtrAlignedFree> data_; 1347d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) 1357d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) // For planar data, points to each channels data. 
1367d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) std::vector<uint8*> channel_data_; 1377d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) 1387d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) DISALLOW_IMPLICIT_CONSTRUCTORS(AudioBuffer); 1397d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles)}; 1407d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) 1417d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles)} // namespace media 1427d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles) 1437d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles)#endif // MEDIA_BASE_AUDIO_BUFFER_H_ 144