Files
go2rtc/pkg/webcodecs/consumer.go
T
2026-03-21 13:48:25 +03:00

268 lines
5.8 KiB
Go

package webcodecs
import (
"encoding/binary"
"errors"
"io"
"sync"
"github.com/AlexxIT/go2rtc/pkg/aac"
"github.com/AlexxIT/go2rtc/pkg/core"
"github.com/AlexxIT/go2rtc/pkg/h264"
"github.com/AlexxIT/go2rtc/pkg/h264/annexb"
"github.com/AlexxIT/go2rtc/pkg/h265"
"github.com/pion/rtp"
)
// Binary frame header (9 bytes):
// Byte 0: flags (bit7=video, bit6=keyframe, bits0-5=trackID)
// Byte 1-8: timestamp in microseconds (uint64 BE)
// Byte 9+: payload
const headerSize = 9
type Consumer struct {
core.Connection
wr *core.WriteBuffer
mu sync.Mutex
start bool
UseGOP bool
}
type InitInfo struct {
Video *VideoInfo `json:"video,omitempty"`
Audio *AudioInfo `json:"audio,omitempty"`
}
type VideoInfo struct {
Codec string `json:"codec"`
}
type AudioInfo struct {
Codec string `json:"codec"`
SampleRate int `json:"sampleRate"`
Channels int `json:"channels"`
}
func NewConsumer(medias []*core.Media) *Consumer {
if medias == nil {
medias = []*core.Media{
{
Kind: core.KindVideo,
Direction: core.DirectionSendonly,
Codecs: []*core.Codec{
{Name: core.CodecH264},
{Name: core.CodecH265},
},
},
{
Kind: core.KindAudio,
Direction: core.DirectionSendonly,
Codecs: []*core.Codec{
{Name: core.CodecAAC},
{Name: core.CodecOpus},
{Name: core.CodecPCMA},
{Name: core.CodecPCMU},
},
},
}
}
wr := core.NewWriteBuffer(nil)
return &Consumer{
Connection: core.Connection{
ID: core.NewID(),
FormatName: "webcodecs",
Medias: medias,
Transport: wr,
},
wr: wr,
}
}
func (c *Consumer) AddTrack(media *core.Media, _ *core.Codec, track *core.Receiver) error {
trackID := byte(len(c.Senders))
codec := track.Codec.Clone()
handler := core.NewSender(media, codec)
switch track.Codec.Name {
case core.CodecH264:
clockRate := codec.ClockRate
handler.Handler = func(packet *rtp.Packet) {
keyframe := h264.IsKeyframe(packet.Payload)
if !c.start {
if !keyframe {
return
}
c.start = true
}
payload := annexb.DecodeAVCC(packet.Payload, true)
flags := byte(0x80) | trackID // video flag
if keyframe {
flags |= 0x40 // keyframe flag
}
c.mu.Lock()
msg := buildFrame(flags, rtpToMicroseconds(packet.Timestamp, clockRate), payload)
if n, err := c.wr.Write(msg); err == nil {
c.Send += n
}
c.mu.Unlock()
}
if track.Codec.IsRTP() {
handler.Handler = h264.RTPDepay(track.Codec, handler.Handler)
} else {
handler.Handler = h264.RepairAVCC(track.Codec, handler.Handler)
}
case core.CodecH265:
clockRate := codec.ClockRate
handler.Handler = func(packet *rtp.Packet) {
keyframe := h265.IsKeyframe(packet.Payload)
if !c.start {
if !keyframe {
return
}
c.start = true
}
payload := annexb.DecodeAVCC(packet.Payload, true)
flags := byte(0x80) | trackID // video flag
if keyframe {
flags |= 0x40 // keyframe flag
}
c.mu.Lock()
msg := buildFrame(flags, rtpToMicroseconds(packet.Timestamp, clockRate), payload)
if n, err := c.wr.Write(msg); err == nil {
c.Send += n
}
c.mu.Unlock()
}
if track.Codec.IsRTP() {
handler.Handler = h265.RTPDepay(track.Codec, handler.Handler)
} else {
handler.Handler = h265.RepairAVCC(track.Codec, handler.Handler)
}
default:
clockRate := codec.ClockRate
handler.Handler = func(packet *rtp.Packet) {
if !c.start {
return
}
flags := trackID // audio flag (bit7=0)
c.mu.Lock()
msg := buildFrame(flags, rtpToMicroseconds(packet.Timestamp, clockRate), packet.Payload)
if n, err := c.wr.Write(msg); err == nil {
c.Send += n
}
c.mu.Unlock()
}
switch track.Codec.Name {
case core.CodecAAC:
if track.Codec.IsRTP() {
handler.Handler = aac.RTPDepay(handler.Handler)
}
case core.CodecOpus, core.CodecPCMA, core.CodecPCMU:
// pass through directly — WebCodecs decodes these natively
default:
handler.Handler = nil
}
}
if handler.Handler == nil {
s := "webcodecs: unsupported codec: " + track.Codec.String()
println(s)
return errors.New(s)
}
handler.HandleRTP(track)
c.Senders = append(c.Senders, handler)
return nil
}
func (c *Consumer) GetInitInfo() *InitInfo {
info := &InitInfo{}
for _, sender := range c.Senders {
codec := sender.Codec
switch codec.Name {
case core.CodecH264:
info.Video = &VideoInfo{
Codec: "avc1." + h264.GetProfileLevelID(codec.FmtpLine),
}
case core.CodecH265:
info.Video = &VideoInfo{
Codec: "hvc1.1.6.L153.B0",
}
case core.CodecAAC:
channels := int(codec.Channels)
if channels == 0 {
channels = 1
}
info.Audio = &AudioInfo{
Codec: "mp4a.40.2",
SampleRate: int(codec.ClockRate),
Channels: channels,
}
case core.CodecOpus:
channels := int(codec.Channels)
if channels == 0 {
channels = 2
}
info.Audio = &AudioInfo{
Codec: "opus",
SampleRate: int(codec.ClockRate),
Channels: channels,
}
case core.CodecPCMA:
info.Audio = &AudioInfo{
Codec: "alaw",
SampleRate: int(codec.ClockRate),
Channels: 1,
}
case core.CodecPCMU:
info.Audio = &AudioInfo{
Codec: "ulaw",
SampleRate: int(codec.ClockRate),
Channels: 1,
}
}
}
return info
}
func (c *Consumer) WriteTo(wr io.Writer) (int64, error) {
if len(c.Senders) == 1 && c.Senders[0].Codec.IsAudio() {
c.start = true
}
return c.wr.WriteTo(wr)
}
func buildFrame(flags byte, timestamp uint64, payload []byte) []byte {
msg := make([]byte, headerSize+len(payload))
msg[0] = flags
binary.BigEndian.PutUint64(msg[1:9], timestamp)
copy(msg[headerSize:], payload)
return msg
}
func rtpToMicroseconds(timestamp uint32, clockRate uint32) uint64 {
if clockRate == 0 {
return uint64(timestamp)
}
return uint64(timestamp) * 1_000_000 / uint64(clockRate)
}