You cannot select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
lal/pkg/rtsp/avpacket_queue.go

277 lines
8.0 KiB
Go

// Copyright 2020, Chef. All rights reserved.
// https://github.com/q191201771/lal
//
// Use of this source code is governed by a MIT-style license
// that can be found in the License file.
//
// Author: Chef (191201771@qq.com)
package rtsp
import (
"bytes"
"fmt"
"github.com/q191201771/lal/pkg/base"
"github.com/q191201771/naza/pkg/circularqueue"
)
const maxQueueSize = 128
type OnAvPacket func(pkt base.AvPacket)
// AvPacketQueue
//
// 处理音频和视频的时间戳:
// 1. 让音频和视频的时间戳都从0开始改变原时间戳
// 2. 让音频和视频的时间戳交替递增输出(不改变原时间戳)
// 3. 当时间戳翻转时,保持时间戳的连续性(改变原时间戳)
//
// 注意,本模块默认音频和视频都存在,如果只有音频或只有视频,则不要使用该模块
//
// TODO(chef): [refactor] 重命名为filter 202305
type AvPacketQueue struct {
onAvPacket OnAvPacket
audioQueue *circularqueue.CircularQueue // TODO chef: 特化成AvPacket类型
videoQueue *circularqueue.CircularQueue
audioBaseTs int64 // audio base timestamp
videoBaseTs int64 // video base timestamp
audioPrevOriginTs int64
videoPrevOriginTs int64
audioPrevModTs int64
videoPrevModTs int64
audioPrevIntervalTs int64
videoPrevIntervalTs int64
}
func NewAvPacketQueue(onAvPacket OnAvPacket) *AvPacketQueue {
return &AvPacketQueue{
onAvPacket: onAvPacket,
audioQueue: circularqueue.New(maxQueueSize),
videoQueue: circularqueue.New(maxQueueSize),
audioBaseTs: -1,
videoBaseTs: -1,
audioPrevOriginTs: -1,
videoPrevOriginTs: -1,
audioPrevModTs: -1,
videoPrevModTs: -1,
audioPrevIntervalTs: -1,
videoPrevIntervalTs: -1,
}
}
func (a *AvPacketQueue) adjustTsHandleRotate(pkt *base.AvPacket) {
// TODO(chef): [refactor] adjustTsXxx 这一层换成fn这一层 202305
fn := func(prevOriginTs, prevModTs, prevIntervalTs *int64, isAudio bool) {
if *prevOriginTs == -1 {
// 第一次
*prevOriginTs = pkt.Timestamp
pkt.Timestamp = 0
*prevModTs = pkt.Timestamp
// 没有prev所以没法也不需要计算 prevIntervalTs
} else {
// 非第一次
interval := pkt.Timestamp - *prevOriginTs
if interval < -1000 {
// 时间戳翻滚并且差值大于阈值了为了避免B帧导致的小范围翻滚)
Log.Warnf("[AVQ] ts rotate. isAudio=%v, interval=%d, prevModTs=%d, prevIntervalTs=%d, prevOriginTs=%d, pktTS=%d, audioQueue=%d, videoQueue=%d",
isAudio, interval, *prevModTs, *prevIntervalTs, *prevOriginTs, pkt.Timestamp, a.audioQueue.Size(), a.videoQueue.Size())
// 注意这个不要放到if判断的前面因为需要先打印旧值日志
*prevOriginTs = pkt.Timestamp
// 用历史差值来更新
pkt.Timestamp = *prevModTs + *prevIntervalTs
} else {
*prevOriginTs = pkt.Timestamp
pkt.Timestamp = *prevModTs + interval
*prevIntervalTs = interval
}
if pkt.Timestamp < 0 {
Log.Warnf("[AVQ] ts negative. isAudio=%v, interval=%d, prevModTs=%d, prevIntervalTs=%d, prevOriginTs=%d, pktTS=%d, audioQueue=%d, videoQueue=%d",
isAudio, interval, *prevModTs, *prevIntervalTs, *prevOriginTs, pkt.Timestamp, a.audioQueue.Size(), a.videoQueue.Size())
pkt.Timestamp = 0
}
*prevModTs = pkt.Timestamp
}
}
if pkt.IsVideo() {
fn(&a.videoPrevOriginTs, &a.videoPrevModTs, &a.videoPrevIntervalTs, false)
_ = a.videoQueue.PushBack(*pkt)
} else {
fn(&a.audioPrevOriginTs, &a.audioPrevModTs, &a.audioPrevIntervalTs, true)
_ = a.audioQueue.PushBack(*pkt)
}
}
func (a *AvPacketQueue) adjustTs(pkt *base.AvPacket) {
if pkt.IsVideo() {
// 时间戳回退了
if pkt.Timestamp < a.videoBaseTs {
Log.Warnf("[AVQ] video ts rotate. pktTS=%d, audioBaseTs=%d, videoBaseTs=%d, audioQueue=%d, videoQueue=%d",
pkt.Timestamp, a.audioBaseTs, a.videoBaseTs, a.audioQueue.Size(), a.videoQueue.Size())
a.PopAllByForce()
}
// 第一次
if a.videoBaseTs == -1 {
a.videoBaseTs = pkt.Timestamp
}
// 根据基准调节
pkt.Timestamp -= a.videoBaseTs
_ = a.videoQueue.PushBack(*pkt)
} else {
if pkt.Timestamp < a.audioBaseTs {
Log.Warnf("[AVQ] audio ts rotate. pktTS=%d, audioBaseTs=%d, videoBaseTs=%d, audioQueue=%d, videoQueue=%d",
pkt.Timestamp, a.audioBaseTs, a.videoBaseTs, a.audioQueue.Size(), a.videoQueue.Size())
a.PopAllByForce()
}
if a.audioBaseTs == -1 {
a.audioBaseTs = pkt.Timestamp
}
pkt.Timestamp -= a.audioBaseTs
_ = a.audioQueue.PushBack(*pkt)
}
}
// Feed 注意,调用方保证,音频相较于音频,视频相较于视频,时间戳是线性递增的。
func (a *AvPacketQueue) Feed(pkt base.AvPacket) {
Log.Debugf("[AVQ] Feed. t=%d, ts=%d, Q(%d,%d), %s, base(%d,%d)",
pkt.PayloadType, pkt.Timestamp, a.audioQueue.Size(), a.videoQueue.Size(), packetsReadable(peekQueuePackets(a)), a.audioBaseTs, a.videoBaseTs)
if TimestampFilterHandleRotateFlag {
a.adjustTsHandleRotate(&pkt)
} else {
a.adjustTs(&pkt)
}
// 如果音频和视频都存在,则按序输出,直到其中一个为空
for !a.audioQueue.Empty() && !a.videoQueue.Empty() {
apkt, _ := a.audioQueue.Front()
vpkt, _ := a.videoQueue.Front()
aapkt := apkt.(base.AvPacket)
vvpkt := vpkt.(base.AvPacket)
if aapkt.Timestamp < vvpkt.Timestamp {
_, _ = a.audioQueue.PopFront()
Log.Debugf("[AVQ] pop audio by video. a=%d, v=%d", aapkt.Timestamp, vvpkt.Timestamp)
a.onAvPacket(aapkt)
} else if aapkt.Timestamp > vvpkt.Timestamp {
_, _ = a.videoQueue.PopFront()
Log.Debugf("[AVQ] pop video by audio. a=%d, v=%d", aapkt.Timestamp, vvpkt.Timestamp)
a.onAvPacket(vvpkt)
} else {
// 相等时,我们把早加入的先输出
if pkt.IsAudio() {
_, _ = a.videoQueue.PopFront()
Log.Debugf("[AVQ] pop video by audio. a=%d, v=%d", aapkt.Timestamp, vvpkt.Timestamp)
a.onAvPacket(vvpkt)
} else {
_, _ = a.audioQueue.PopFront()
Log.Debugf("[AVQ] pop audio by video. a=%d, v=%d", aapkt.Timestamp, vvpkt.Timestamp)
a.onAvPacket(aapkt)
}
}
}
// 如果视频满了,则全部输出
if a.videoQueue.Full() {
Log.Assert(true, a.audioQueue.Empty())
a.popAllVideo()
return
}
// 如果音频满了,则全部输出
if a.audioQueue.Full() {
Log.Assert(true, a.videoQueue.Empty())
a.popAllAudio()
return
}
}
func (a *AvPacketQueue) PopAllByForce() {
a.videoBaseTs = -1
a.audioBaseTs = -1
if a.audioQueue.Empty() && a.videoQueue.Empty() {
// noop
} else if a.audioQueue.Empty() && !a.videoQueue.Empty() {
a.popAllVideo()
} else if !a.audioQueue.Empty() && a.videoQueue.Empty() {
a.popAllAudio()
} else {
// 这种情况不可能发生
// 因为每次排出时,都会排空一个队列
}
}
func (a *AvPacketQueue) popAllAudio() {
Log.Debugf("[AVQ] pop all audio. audioQueue=%d, videoQueue=%d", a.audioQueue.Size(), a.videoQueue.Size())
for !a.audioQueue.Empty() {
pkt, _ := a.audioQueue.Front()
ppkt := pkt.(base.AvPacket)
_, _ = a.audioQueue.PopFront()
a.onAvPacket(ppkt)
}
}
func (a *AvPacketQueue) popAllVideo() {
Log.Debugf("[AVQ] pop all video. audioQueue=%d, videoQueue=%d", a.audioQueue.Size(), a.videoQueue.Size())
for !a.videoQueue.Empty() {
pkt, _ := a.videoQueue.Front()
ppkt := pkt.(base.AvPacket)
_, _ = a.videoQueue.PopFront()
a.onAvPacket(ppkt)
}
}
// ---------------------------------------------------------------------------------------------------------------------
func packetsReadable(pkts []base.AvPacket) string {
var buf bytes.Buffer
buf.WriteString("[")
for _, pkt := range pkts {
if pkt.IsAudio() {
buf.WriteString(fmt.Sprintf(" A(%d) ", pkt.Timestamp))
} else if pkt.IsVideo() {
buf.WriteString(fmt.Sprintf(" V(%d) ", pkt.Timestamp))
} else {
buf.WriteString(fmt.Sprintf(" U(%d) ", pkt.Timestamp))
}
}
buf.WriteString("]")
return buf.String()
}
func peekQueuePackets(q *AvPacketQueue) []base.AvPacket {
var out []base.AvPacket
for i := 0; i < q.audioQueue.Size(); i++ {
pkt, _ := q.audioQueue.At(i)
ppkt := pkt.(base.AvPacket)
out = append(out, ppkt)
}
for i := 0; i < q.videoQueue.Size(); i++ {
pkt, _ := q.videoQueue.At(i)
ppkt := pkt.(base.AvPacket)
out = append(out, ppkt)
}
return out
}