Skip to content

Commit

Permalink
Raw Int16 data for toAVAudioPCMBuffer (#497)
Browse files Browse the repository at this point in the history
  • Loading branch information
hiroshihorie authored Oct 8, 2024
1 parent 3af61d4 commit 4a74cf4
Show file tree
Hide file tree
Showing 4 changed files with 77 additions and 17 deletions.
2 changes: 1 addition & 1 deletion Package.swift
Original file line number Diff line number Diff line change
Expand Up @@ -18,7 +18,7 @@ let package = Package(
],
dependencies: [
// LK-Prefixed Dynamic WebRTC XCFramework
.package(url: "https://github.com/livekit/webrtc-xcframework.git", exact: "125.6422.08"),
.package(url: "https://github.com/livekit/webrtc-xcframework.git", exact: "125.6422.09"),
.package(url: "https://github.com/apple/swift-protobuf.git", from: "1.26.0"),
.package(url: "https://github.com/apple/swift-log.git", from: "1.5.4"),
// Only used for DocC generation
Expand Down
2 changes: 1 addition & 1 deletion [email protected]
Original file line number Diff line number Diff line change
Expand Up @@ -20,7 +20,7 @@ let package = Package(
],
dependencies: [
// LK-Prefixed Dynamic WebRTC XCFramework
.package(url: "https://github.com/livekit/webrtc-xcframework.git", exact: "125.6422.08"),
.package(url: "https://github.com/livekit/webrtc-xcframework.git", exact: "125.6422.09"),
.package(url: "https://github.com/apple/swift-protobuf.git", from: "1.26.0"),
.package(url: "https://github.com/apple/swift-log.git", from: "1.5.4"),
// Only used for DocC generation
Expand Down
28 changes: 13 additions & 15 deletions Sources/LiveKit/Convenience/AudioProcessing.swift
Original file line number Diff line number Diff line change
Expand Up @@ -25,33 +25,31 @@ public struct AudioLevel {
}

public extension LKAudioBuffer {
/// Convert to AVAudioPCMBuffer float buffer will be normalized to 32 bit.
/// Convert to AVAudioPCMBuffer Int16 format.
@objc
func toAVAudioPCMBuffer() -> AVAudioPCMBuffer? {
guard let audioFormat = AVAudioFormat(commonFormat: .pcmFormatFloat32,
guard let audioFormat = AVAudioFormat(commonFormat: .pcmFormatInt16,
sampleRate: Double(frames * 100),
channels: AVAudioChannelCount(channels),
interleaved: false),
let pcmBuffer = AVAudioPCMBuffer(pcmFormat: audioFormat,
frameCapacity: AVAudioFrameCount(frames))
else {
return nil
}
else { return nil }

pcmBuffer.frameLength = AVAudioFrameCount(frames)

guard let targetBufferPointer = pcmBuffer.floatChannelData else { return nil }

// Optimized version
var normalizationFactor: Float = 1.0 / 32768.0
guard let targetBufferPointer = pcmBuffer.int16ChannelData else { return nil }

for i in 0 ..< channels {
vDSP_vsmul(rawBuffer(forChannel: i),
1,
&normalizationFactor,
targetBufferPointer[i],
1,
vDSP_Length(frames))
let sourceBuffer = rawBuffer(forChannel: i)
let targetBuffer = targetBufferPointer[i]
// sourceBuffer is in the format of [Int16] but is stored in 32-bit alignment, we need to pack the Int16 data correctly.

for frame in 0 ..< frames {
// Cast and pack the source 32-bit Int16 data into the target 16-bit buffer
let clampedValue = max(Float(Int16.min), min(Float(Int16.max), sourceBuffer[frame]))
targetBuffer[frame] = Int16(clampedValue)
}
}

return pcmBuffer
Expand Down
62 changes: 62 additions & 0 deletions Sources/LiveKit/Extensions/AVAudioPCMBuffer.swift
Original file line number Diff line number Diff line change
Expand Up @@ -14,6 +14,7 @@
* limitations under the License.
*/

import Accelerate
import AVFoundation

public extension AVAudioPCMBuffer {
Expand Down Expand Up @@ -71,4 +72,65 @@ public extension AVAudioPCMBuffer {

return convertedBuffer
}

/// Convert PCM buffer to specified common format.
/// Currently supports conversion from Int16 to Float32.
func convert(toCommonFormat commonFormat: AVAudioCommonFormat) -> AVAudioPCMBuffer? {
// Check if conversion is needed
guard format.commonFormat != commonFormat else {
return self
}

// Check if the conversion is supported
guard format.commonFormat == .pcmFormatInt16, commonFormat == .pcmFormatFloat32 else {
print("Unsupported conversion: only Int16 to Float32 is supported")
return nil
}

// Create output format
guard let outputFormat = AVAudioFormat(commonFormat: commonFormat,
sampleRate: format.sampleRate,
channels: format.channelCount,
interleaved: false)
else {
print("Failed to create output audio format")
return nil
}

// Create output buffer
guard let outputBuffer = AVAudioPCMBuffer(pcmFormat: outputFormat,
frameCapacity: frameCapacity)
else {
print("Failed to create output PCM buffer")
return nil
}

outputBuffer.frameLength = frameLength

let channelCount = Int(format.channelCount)
let frameCount = Int(frameLength)

// Ensure the source buffer has Int16 data
guard let int16Data = int16ChannelData else {
print("Source buffer doesn't contain Int16 data")
return nil
}

// Ensure the output buffer has Float32 data
guard let floatData = outputBuffer.floatChannelData else {
print("Failed to get float channel data from output buffer")
return nil
}

// Convert Int16 to Float32 and normalize to [-1.0, 1.0]
let scale = Float(Int16.max)
var scalar = 1.0 / scale

for channel in 0 ..< channelCount {
vDSP_vflt16(int16Data[channel], 1, floatData[channel], 1, vDSP_Length(frameCount))
vDSP_vsmul(floatData[channel], 1, &scalar, floatData[channel], 1, vDSP_Length(frameCount))
}

return outputBuffer
}
}

0 comments on commit 4a74cf4

Please sign in to comment.