mirror of
https://github.com/livekit/livekit.git
synced 2026-05-10 21:27:08 +00:00
440f00bcac
* Declare audio inactive if stale. Stale samples were used to declare audio active. Maintain last update time and declare inactive if samples are stale. * correct comment * spelling * check level in test
135 lines
3.7 KiB
Go
135 lines
3.7 KiB
Go
// Copyright 2023 LiveKit, Inc.
|
|
//
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
// you may not use this file except in compliance with the License.
|
|
// You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
// See the License for the specific language governing permissions and
|
|
// limitations under the License.
|
|
|
|
package audio
|
|
|
|
import (
|
|
"math"
|
|
"sync"
|
|
"time"
|
|
)
|
|
|
|
const (
|
|
silentAudioLevel = 127
|
|
negInv20 = -1.0 / 20
|
|
)
|
|
|
|
type AudioLevelParams struct {
|
|
ActiveLevel uint8
|
|
MinPercentile uint8
|
|
ObserveDuration uint32
|
|
SmoothIntervals uint32
|
|
}
|
|
|
|
// keeps track of audio level for a participant
|
|
type AudioLevel struct {
|
|
params AudioLevelParams
|
|
// min duration within an observe duration window to be considered active
|
|
minActiveDuration uint32
|
|
smoothFactor float64
|
|
activeThreshold float64
|
|
|
|
lock sync.Mutex
|
|
smoothedLevel float64
|
|
|
|
loudestObservedLevel uint8
|
|
activeDuration uint32 // ms
|
|
observedDuration uint32 // ms
|
|
lastObservedAt time.Time
|
|
}
|
|
|
|
func NewAudioLevel(params AudioLevelParams) *AudioLevel {
|
|
l := &AudioLevel{
|
|
params: params,
|
|
minActiveDuration: uint32(params.MinPercentile) * params.ObserveDuration / 100,
|
|
smoothFactor: 1,
|
|
activeThreshold: ConvertAudioLevel(float64(params.ActiveLevel)),
|
|
loudestObservedLevel: silentAudioLevel,
|
|
}
|
|
|
|
if l.params.SmoothIntervals > 0 {
|
|
// exponential moving average (EMA), same center of mass with simple moving average (SMA)
|
|
l.smoothFactor = float64(2) / (float64(l.params.SmoothIntervals + 1))
|
|
}
|
|
|
|
return l
|
|
}
|
|
|
|
// Observes a new frame
|
|
func (l *AudioLevel) Observe(level uint8, durationMs uint32, arrivalTime time.Time) {
|
|
l.lock.Lock()
|
|
defer l.lock.Unlock()
|
|
|
|
l.lastObservedAt = arrivalTime
|
|
|
|
l.observedDuration += durationMs
|
|
|
|
if level <= l.params.ActiveLevel {
|
|
l.activeDuration += durationMs
|
|
if l.loudestObservedLevel > level {
|
|
l.loudestObservedLevel = level
|
|
}
|
|
}
|
|
|
|
if l.observedDuration >= l.params.ObserveDuration {
|
|
smoothedLevel := float64(0.0)
|
|
// compute and reset
|
|
if l.activeDuration >= l.minActiveDuration {
|
|
// adjust loudest observed level by how much of the window was active.
|
|
// Weight will be 0 if active the entire duration
|
|
// > 0 if active for longer than observe duration
|
|
// < 0 if active for less than observe duration
|
|
activityWeight := 20 * math.Log10(float64(l.activeDuration)/float64(l.params.ObserveDuration))
|
|
adjustedLevel := float64(l.loudestObservedLevel) - activityWeight
|
|
linearLevel := ConvertAudioLevel(adjustedLevel)
|
|
|
|
// exponential smoothing to dampen transients
|
|
smoothedLevel = l.smoothedLevel + (linearLevel-l.smoothedLevel)*l.smoothFactor
|
|
}
|
|
l.resetLocked(smoothedLevel)
|
|
}
|
|
}
|
|
|
|
// returns current soothed audio level
|
|
func (l *AudioLevel) GetLevel(now time.Time) (float64, bool) {
|
|
l.lock.Lock()
|
|
defer l.lock.Unlock()
|
|
|
|
l.resetIfStaleLocked(now)
|
|
|
|
return l.smoothedLevel, l.smoothedLevel >= l.activeThreshold
|
|
}
|
|
|
|
func (l *AudioLevel) resetIfStaleLocked(arrivalTime time.Time) {
|
|
if arrivalTime.Sub(l.lastObservedAt).Milliseconds() < int64(2*l.params.ObserveDuration) {
|
|
return
|
|
}
|
|
|
|
l.resetLocked(0.0)
|
|
}
|
|
|
|
func (l *AudioLevel) resetLocked(smoothedLevel float64) {
|
|
l.smoothedLevel = smoothedLevel
|
|
l.loudestObservedLevel = silentAudioLevel
|
|
l.activeDuration = 0
|
|
l.observedDuration = 0
|
|
}
|
|
|
|
// ---------------------------------------------------
|
|
|
|
// convert decibel back to linear
|
|
func ConvertAudioLevel(level float64) float64 {
|
|
return math.Pow(10, level*negInv20)
|
|
}
|