mirror of
https://github.com/jech/galene.git
synced 2024-11-22 16:45:58 +01:00
d94e5583cd
Metadata OBUs can appear between the sequence header and the first frame header.
278 lines
6 KiB
Go
278 lines
6 KiB
Go
package rtpconn
|
|
|
|
import (
|
|
"errors"
|
|
"strings"
|
|
|
|
"github.com/pion/rtp"
|
|
"github.com/pion/rtp/codecs"
|
|
)
|
|
|
|
// isKeyframe determines if packet is the start of a keyframe.
|
|
// It returns (true, true) if that is the case, (false, true) if that is
|
|
// definitely not the case, and (false, false) if the information cannot
|
|
// be determined.
|
|
func isKeyframe(codec string, packet *rtp.Packet) (bool, bool) {
|
|
if strings.EqualFold(codec, "video/vp8") {
|
|
var vp8 codecs.VP8Packet
|
|
_, err := vp8.Unmarshal(packet.Payload)
|
|
if err != nil || len(vp8.Payload) < 1 {
|
|
return false, false
|
|
}
|
|
|
|
if vp8.S != 0 && vp8.PID == 0 && (vp8.Payload[0]&0x1) == 0 {
|
|
return true, true
|
|
}
|
|
return false, true
|
|
} else if strings.EqualFold(codec, "video/vp9") {
|
|
var vp9 codecs.VP9Packet
|
|
_, err := vp9.Unmarshal(packet.Payload)
|
|
if err != nil || len(vp9.Payload) < 1 {
|
|
return false, false
|
|
}
|
|
if !vp9.B {
|
|
return false, true
|
|
}
|
|
|
|
if (vp9.Payload[0] & 0xc0) != 0x80 {
|
|
return false, false
|
|
}
|
|
|
|
profile := (vp9.Payload[0] >> 4) & 0x3
|
|
if profile != 3 {
|
|
return (vp9.Payload[0] & 0xC) == 0, true
|
|
}
|
|
return (vp9.Payload[0] & 0x6) == 0, true
|
|
} else if strings.EqualFold(codec, "video/av1x") {
|
|
if len(packet.Payload) < 2 {
|
|
return false, true
|
|
}
|
|
// Z=0, N=1
|
|
if (packet.Payload[0] & 0x88) != 0x08 {
|
|
return false, true
|
|
}
|
|
w := (packet.Payload[0] & 0x30) >> 4
|
|
|
|
getObu := func(data []byte, last bool) ([]byte, int, bool) {
|
|
if last {
|
|
return data, len(data), false
|
|
}
|
|
offset := 0
|
|
length := 0
|
|
for {
|
|
if len(data) <= offset {
|
|
return nil, offset, offset > 0
|
|
}
|
|
l := data[offset]
|
|
length |= int(l & 0x7f) << (offset * 7)
|
|
offset++
|
|
if (l & 0x80) == 0 {
|
|
break
|
|
}
|
|
}
|
|
if len(data) < offset+length {
|
|
return data[offset:], len(data), true
|
|
}
|
|
return data[offset : offset+length],
|
|
offset + length, false
|
|
}
|
|
offset := 1
|
|
i := 0
|
|
for {
|
|
obu, length, truncated :=
|
|
getObu(packet.Payload[offset:], int(w) == i+1)
|
|
if len(obu) < 1 {
|
|
return false, false
|
|
}
|
|
tpe := (obu[0] & 0x38) >> 3
|
|
switch i {
|
|
case 0:
|
|
// OBU_SEQUENCE_HEADER
|
|
if tpe != 1 {
|
|
return false, true
|
|
}
|
|
default:
|
|
// OBU_FRAME_HEADER or OBU_FRAME
|
|
if tpe == 3 || tpe == 6 {
|
|
if len(obu) < 2 {
|
|
return false, false
|
|
}
|
|
// show_existing_frame == 0
|
|
if (obu[1] & 0x80) != 0 {
|
|
return false, true
|
|
}
|
|
// frame_type == KEY_FRAME
|
|
return (obu[1] & 0x60) == 0, true
|
|
}
|
|
}
|
|
if truncated || i >= int(w) {
|
|
// the first frame header is in a second
|
|
// packet, give up.
|
|
return false, false
|
|
}
|
|
offset += length
|
|
i++
|
|
}
|
|
} else if strings.EqualFold(codec, "video/h264") {
|
|
if len(packet.Payload) < 1 {
|
|
return false, false
|
|
}
|
|
nalu := packet.Payload[0] & 0x1F
|
|
if nalu == 0 {
|
|
// reserved
|
|
return false, false
|
|
} else if nalu <= 23 {
|
|
// simple NALU
|
|
return nalu == 5, true
|
|
} else if nalu == 24 || nalu == 25 || nalu == 26 || nalu == 27 {
|
|
// STAP-A, STAP-B, MTAP16 or MTAP24
|
|
i := 1
|
|
if nalu == 25 || nalu == 26 || nalu == 27 {
|
|
// skip DON
|
|
i += 2
|
|
}
|
|
for i < len(packet.Payload) {
|
|
if i+2 > len(packet.Payload) {
|
|
return false, false
|
|
}
|
|
length := uint16(packet.Payload[i])<<8 |
|
|
uint16(packet.Payload[i+1])
|
|
i += 2
|
|
if i+int(length) > len(packet.Payload) {
|
|
return false, false
|
|
}
|
|
offset := 0
|
|
if nalu == 26 {
|
|
offset = 3
|
|
} else if nalu == 27 {
|
|
offset = 4
|
|
}
|
|
if offset >= int(length) {
|
|
return false, false
|
|
}
|
|
n := packet.Payload[i+offset] & 0x1F
|
|
if n == 7 {
|
|
return true, true
|
|
} else if n >= 24 {
|
|
// is this legal?
|
|
return false, false
|
|
}
|
|
i += int(length)
|
|
}
|
|
if i == len(packet.Payload) {
|
|
return false, true
|
|
}
|
|
return false, false
|
|
} else if nalu == 28 || nalu == 29 {
|
|
// FU-A or FU-B
|
|
if len(packet.Payload) < 2 {
|
|
return false, false
|
|
}
|
|
if (packet.Payload[1] & 0x80) == 0 {
|
|
// not a starting fragment
|
|
return false, true
|
|
}
|
|
return (packet.Payload[1]&0x1F == 7), true
|
|
}
|
|
return false, false
|
|
}
|
|
return false, false
|
|
}
|
|
|
|
var errTruncated = errors.New("truncated packet")
|
|
var errUnsupportedCodec = errors.New("unsupported codec")
|
|
|
|
func packetFlags(codec string, buf []byte) (seqno uint16, start bool, pid uint16, tid uint8, sid uint8, layersync bool, discardable bool, err error) {
|
|
if len(buf) < 12 {
|
|
err = errTruncated
|
|
return
|
|
}
|
|
|
|
seqno = (uint16(buf[2]) << 8) | uint16(buf[3])
|
|
|
|
if strings.EqualFold(codec, "video/vp8") {
|
|
var packet rtp.Packet
|
|
err = packet.Unmarshal(buf)
|
|
if err != nil {
|
|
return
|
|
}
|
|
var vp8 codecs.VP8Packet
|
|
_, err = vp8.Unmarshal(packet.Payload)
|
|
if err != nil {
|
|
return
|
|
}
|
|
|
|
start = vp8.S == 1 && vp8.PID == 0
|
|
pid = vp8.PictureID
|
|
tid = vp8.TID
|
|
layersync = vp8.Y == 1
|
|
discardable = vp8.N == 1
|
|
return
|
|
} else if strings.EqualFold(codec, "video/vp9") {
|
|
var packet rtp.Packet
|
|
err = packet.Unmarshal(buf)
|
|
if err != nil {
|
|
return
|
|
}
|
|
var vp9 codecs.VP9Packet
|
|
_, err = vp9.Unmarshal(packet.Payload)
|
|
if err != nil {
|
|
return
|
|
}
|
|
start = vp9.B
|
|
tid = vp9.TID
|
|
sid = vp9.SID
|
|
layersync = vp9.U
|
|
return
|
|
}
|
|
return
|
|
}
|
|
|
|
func rewritePacket(codec string, data []byte, seqno uint16, delta uint16) error {
|
|
if len(data) < 12 {
|
|
return errTruncated
|
|
}
|
|
|
|
data[2] = uint8(seqno >> 8)
|
|
data[3] = uint8(seqno)
|
|
if delta == 0 {
|
|
return nil
|
|
}
|
|
|
|
offset := 12
|
|
offset += int(data[0]&0x0F) * 4
|
|
if len(data) < offset+4 {
|
|
return errTruncated
|
|
}
|
|
|
|
if (data[0] & 0x10) != 0 {
|
|
length := uint16(data[offset+2])<<8 | uint16(data[offset+3])
|
|
offset += 4 + int(length)*4
|
|
if len(data) < offset+4 {
|
|
return errTruncated
|
|
}
|
|
}
|
|
|
|
if strings.EqualFold(codec, "video/vp8") {
|
|
x := (data[offset] & 0x80) != 0
|
|
if !x {
|
|
return nil
|
|
}
|
|
i := (data[offset+1] & 0x80) != 0
|
|
if !i {
|
|
return nil
|
|
}
|
|
m := (data[offset+2] & 0x80) != 0
|
|
if m {
|
|
pid := (uint16(data[offset+2]&0x7F) << 8) |
|
|
uint16(data[offset+3])
|
|
pid = (pid + delta) & 0x7FFF
|
|
data[offset+2] = 0x80 | byte((pid>>8)&0x7F)
|
|
data[offset+3] = byte(pid & 0xFF)
|
|
} else {
|
|
data[offset+2] = (data[offset+2] + uint8(delta)) & 0x7F
|
|
}
|
|
return nil
|
|
}
|
|
return errUnsupportedCodec
|
|
}
|