Files
gortsplib/pkg/rtph264/encoder.go

248 lines
5.2 KiB
Go

package rtph264
import (
"crypto/rand"
"encoding/binary"
"time"
"github.com/pion/rtp"
)
const (
rtpVersion = 0x02
rtpPayloadMaxSize = 1460 // 1500 (mtu) - 20 (ip header) - 8 (udp header) - 12 (rtp header)
rtpClockRate = 90000 // h264 always uses 90khz
)
func randUint32() uint32 {
var b [4]byte
rand.Read(b[:])
return uint32(b[0])<<24 | uint32(b[1])<<16 | uint32(b[2])<<8 | uint32(b[3])
}
// Encoder is a RTP/H264 encoder.
type Encoder struct {
payloadType uint8
sequenceNumber uint16
ssrc uint32
initialTs uint32
}
// NewEncoder allocates an Encoder.
func NewEncoder(payloadType uint8,
sequenceNumber *uint16,
ssrc *uint32,
initialTs *uint32) *Encoder {
return &Encoder{
payloadType: payloadType,
sequenceNumber: func() uint16 {
if sequenceNumber != nil {
return *sequenceNumber
}
return uint16(randUint32())
}(),
ssrc: func() uint32 {
if ssrc != nil {
return *ssrc
}
return randUint32()
}(),
initialTs: func() uint32 {
if initialTs != nil {
return *initialTs
}
return randUint32()
}(),
}
}
func (e *Encoder) encodeTimestamp(ts time.Duration) uint32 {
return e.initialTs + uint32(ts.Seconds()*rtpClockRate)
}
// Encode encodes NALUs into RTP/H264 packets.
// It returns the encoded packets.
func (e *Encoder) Encode(nalus [][]byte, pts time.Duration) ([][]byte, error) {
var rets [][]byte
var batch [][]byte
// split NALUs into batches
for _, nalu := range nalus {
if e.lenAggregated(batch, nalu) <= rtpPayloadMaxSize {
// add to existing batch
batch = append(batch, nalu)
} else {
// write batch
if batch != nil {
pkts, err := e.writeBatch(batch, pts, false)
if err != nil {
return nil, err
}
rets = append(rets, pkts...)
}
// initialize new batch
batch = [][]byte{nalu}
}
}
// write final batch
// marker is used to indicate when all NALUs with same PTS have been sent
pkts, err := e.writeBatch(batch, pts, true)
if err != nil {
return nil, err
}
rets = append(rets, pkts...)
return rets, nil
}
func (e *Encoder) writeBatch(nalus [][]byte, pts time.Duration, marker bool) ([][]byte, error) {
if len(nalus) == 1 {
// the NALU fits into a single RTP packet
if len(nalus[0]) < rtpPayloadMaxSize {
return e.writeSingle(nalus[0], pts, marker)
}
// split the NALU into multiple fragmentation packet
return e.writeFragmented(nalus[0], pts, marker)
}
return e.writeAggregated(nalus, pts, marker)
}
func (e *Encoder) writeSingle(nalu []byte, pts time.Duration, marker bool) ([][]byte, error) {
frame, err := (&rtp.Packet{
Header: rtp.Header{
Version: rtpVersion,
PayloadType: e.payloadType,
SequenceNumber: e.sequenceNumber,
Timestamp: e.encodeTimestamp(pts),
SSRC: e.ssrc,
Marker: marker,
},
Payload: nalu,
}).Marshal()
if err != nil {
return nil, err
}
e.sequenceNumber++
return [][]byte{frame}, nil
}
func (e *Encoder) writeFragmented(nalu []byte, pts time.Duration, marker bool) ([][]byte, error) {
// use only FU-A, not FU-B, since we always use non-interleaved mode
// (packetization-mode=1)
packetCount := (len(nalu) - 1) / (rtpPayloadMaxSize - 2)
lastPacketSize := (len(nalu) - 1) % (rtpPayloadMaxSize - 2)
if lastPacketSize > 0 {
packetCount++
}
ret := make([][]byte, packetCount)
encPTS := e.encodeTimestamp(pts)
nri := (nalu[0] >> 5) & 0x03
typ := nalu[0] & 0x1F
nalu = nalu[1:] // remove header
for i := range ret {
indicator := (nri << 5) | uint8(naluTypeFUA)
start := uint8(0)
if i == 0 {
start = 1
}
end := uint8(0)
le := rtpPayloadMaxSize - 2
if i == (packetCount - 1) {
end = 1
le = lastPacketSize
}
header := (start << 7) | (end << 6) | typ
data := make([]byte, 2+le)
data[0] = indicator
data[1] = header
copy(data[2:], nalu[:le])
nalu = nalu[le:]
frame, err := (&rtp.Packet{
Header: rtp.Header{
Version: rtpVersion,
PayloadType: e.payloadType,
SequenceNumber: e.sequenceNumber,
Timestamp: encPTS,
SSRC: e.ssrc,
Marker: (i == (packetCount-1) && marker),
},
Payload: data,
}).Marshal()
if err != nil {
return nil, err
}
e.sequenceNumber++
ret[i] = frame
}
return ret, nil
}
func (e *Encoder) lenAggregated(nalus [][]byte, addNALU []byte) int {
ret := 1 // header
for _, nalu := range nalus {
ret += 2 // size
ret += len(nalu) // nalu
}
if addNALU != nil {
ret += 2 // size
ret += len(addNALU) // nalu
}
return ret
}
func (e *Encoder) writeAggregated(nalus [][]byte, pts time.Duration, marker bool) ([][]byte, error) {
payload := make([]byte, e.lenAggregated(nalus, nil))
// header
payload[0] = uint8(naluTypeSTAPA)
pos := 1
for _, nalu := range nalus {
// size
naluLen := len(nalu)
binary.BigEndian.PutUint16(payload[pos:], uint16(naluLen))
pos += 2
// nalu
copy(payload[pos:], nalu)
pos += naluLen
}
frame, err := (&rtp.Packet{
Header: rtp.Header{
Version: rtpVersion,
PayloadType: e.payloadType,
SequenceNumber: e.sequenceNumber,
Timestamp: e.encodeTimestamp(pts),
SSRC: e.ssrc,
Marker: marker,
},
Payload: payload,
}).Marshal()
if err != nil {
return nil, err
}
e.sequenceNumber++
return [][]byte{frame}, nil
}