mirror of
https://github.com/vsariola/sointu.git
synced 2025-05-28 03:10:24 -04:00
Throughout sointu, we assume stereo audiobuffers, but were passing around []float32. This had several issues, including len(buf)/2 and numSamples*2 type of length conversion in many places. Also, it caused one bug in a test case, causing it to succeed when it should have not (the test had +-1 when it should have had +-2). This refactoring makes it impossible to have odd length buffer issues.
61 lines
1.8 KiB
Go
61 lines
1.8 KiB
Go
package tracker
|
|
|
|
import (
|
|
"errors"
|
|
"math"
|
|
|
|
"github.com/vsariola/sointu"
|
|
)
|
|
|
|
// Volume represents an average and peak volume measurement, in decibels. 0 dB =
|
|
// signal level of +-1.
|
|
type Volume struct {
|
|
Average [2]float64
|
|
Peak [2]float64
|
|
}
|
|
|
|
// Analyze updates Average and Peak fields, by analyzing the given buffer.
|
|
//
|
|
// Internally, it first converts the signal to decibels (0 dB = +-1). Then, the
|
|
// average volume level is computed by smoothing the decibel values with a
|
|
// exponentially decaying average, with a time constant tau (in seconds).
|
|
// Typical value could be 0.3 (seconds).
|
|
//
|
|
// Peak volume detection is similar exponential smoothing, but the time
|
|
// constants for attack and release are different. Generally attack << release.
|
|
// Typical values could be attack 1.5e-3 and release 1.5 (seconds)
|
|
//
|
|
// minVolume and maxVolume are hard limits in decibels to prevent negative
|
|
// infinities for volumes
|
|
func (v *Volume) Analyze(buffer sointu.AudioBuffer, tau float64, attack float64, release float64, minVolume float64, maxVolume float64) error {
|
|
alpha := 1 - math.Exp(-1.0/(tau*44100)) // from https://en.wikipedia.org/wiki/Exponential_smoothing
|
|
alphaAttack := 1 - math.Exp(-1.0/(attack*44100))
|
|
alphaRelease := 1 - math.Exp(-1.0/(release*44100))
|
|
var err error
|
|
for j := 0; j < 2; j++ {
|
|
for i := 0; i < len(buffer); i++ {
|
|
sample2 := float64(buffer[i][j] * buffer[i][j])
|
|
if math.IsNaN(sample2) {
|
|
if err == nil {
|
|
err = errors.New("NaN detected in master output")
|
|
}
|
|
continue
|
|
}
|
|
dB := 10 * math.Log10(float64(sample2))
|
|
if dB < minVolume || math.IsNaN(dB) {
|
|
dB = minVolume
|
|
}
|
|
if dB > maxVolume {
|
|
dB = maxVolume
|
|
}
|
|
v.Average[j] += (dB - v.Average[j]) * alpha
|
|
alphaPeak := alphaAttack
|
|
if dB < v.Peak[j] {
|
|
alphaPeak = alphaRelease
|
|
}
|
|
v.Peak[j] += (dB - v.Peak[j]) * alphaPeak
|
|
}
|
|
}
|
|
return err
|
|
}
|