mirror of https://bitbucket.org/ausocean/av.git
269 lines
6.0 KiB
Go
269 lines
6.0 KiB
Go
/*
|
|
NAME
|
|
flv_generator.go
|
|
|
|
DESCRIPTION
|
|
See Readme.md
|
|
|
|
AUTHOR
|
|
Dan Kortschak <dan@ausocean.org>
|
|
Saxon Nelson-Milton <saxon@ausocean.org>
|
|
|
|
LICENSE
|
|
flv_generator.go is Copyright (C) 2017 the Australian Ocean Lab (AusOcean)
|
|
|
|
It is free software: you can redistribute it and/or modify it
|
|
under the terms of the GNU General Public License as published by the
|
|
Free Software Foundation, either version 3 of the License, or (at your
|
|
option) any later version.
|
|
|
|
It is distributed in the hope that it will be useful, but WITHOUT
|
|
ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
|
|
FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
|
|
for more details.
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
along with revid in gpl.txt. If not, see http://www.gnu.org/licenses.
|
|
*/
|
|
package flv
|
|
|
|
import (
|
|
"io"
|
|
"time"
|
|
)
|
|
|
|
// Buffer lengths. Neither is referenced by the code visible in this file;
// presumably they size channels elsewhere in the package (confirm before
// removing).
const (
	inputChanLength  = 500
	outputChanLength = 500
)

// Tag size values used by Encode when filling in PrevTagSize.
const (
	// audioSize is written as the PrevTagSize of the first dummy audio tag.
	audioSize = 18

	// videoHeaderSize is added to the frame length to give the PrevTagSize
	// of a video tag.
	videoHeaderSize = 16
)
|
|
|
|
// Payloads for the two dummy audio tags that Encode writes to provide silent
// audio (required for youtube).

// dummyAudioTag1Data is the 6-byte payload of the first dummy audio tag.
// Encode sends it with a DataSize of 7.
var dummyAudioTag1Data = []byte{0x00, 0x12, 0x08, 0x56, 0xe5, 0x00}

// dummyAudioTag2Data is the 20-byte payload of the second dummy audio tag.
// Encode sends it with a DataSize of 21. Bytes 3 to 14 are the ASCII text
// "Lavc58.6.102".
var dummyAudioTag2Data = []byte{
	0x01, 0xdc, 0x00,
	0x4c, 0x61, 0x76, 0x63, 0x35, 0x38, 0x2e, 0x36, 0x2e, 0x31, 0x30, 0x32,
	0x00, 0x02, 0x30, 0x40, 0x0e,
}
|
|
|
|
// Encoder provides properties required for the generation of flv video
|
|
// from raw video data
|
|
type Encoder struct {
|
|
dst io.Writer
|
|
|
|
fps int
|
|
audio bool
|
|
video bool
|
|
lastTagSize int
|
|
header Header
|
|
start time.Time
|
|
}
|
|
|
|
// NewEncoder retuns a new FLV encoder.
|
|
func NewEncoder(dst io.Writer, audio, video bool, fps int) (*Encoder, error) {
|
|
e := Encoder{
|
|
dst: dst,
|
|
fps: fps,
|
|
audio: audio,
|
|
video: video,
|
|
}
|
|
// TODO(kortschak): Do this lazily.
|
|
_, err := e.dst.Write(e.HeaderBytes())
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
return &e, nil
|
|
}
|
|
|
|
// HeaderBytes returns the a
|
|
func (e *Encoder) HeaderBytes() []byte {
|
|
header := Header{
|
|
HasAudio: e.audio,
|
|
HasVideo: e.video,
|
|
}
|
|
return header.Bytes()
|
|
}
|
|
|
|
// getNextTimestamp generates and returns the next timestamp based on current time
|
|
func (e *Encoder) getNextTimestamp() (timestamp uint32) {
|
|
if e.start.IsZero() {
|
|
e.start = time.Now()
|
|
return 0
|
|
}
|
|
return uint32(time.Now().Sub(e.start).Seconds() * float64(1000))
|
|
}
|
|
|
|
// NAL unit type codes, as listed in Table 7-1 of the H.264 specification:
// http://www.itu.int/rec/dologin_pub.asp?lang=e&id=T-REC-H.264-200305-S!!PDF-E&type=items
const (
	// nonIdrPic is a coded slice of a non-IDR picture.
	nonIdrPic = 1
	// idrPic is a coded slice of an IDR picture.
	idrPic = 5
	// suppEnhInf is supplemental enhancement information (SEI).
	suppEnhInf = 6
	// seqParamSet is a sequence parameter set.
	seqParamSet = 7
	// paramSet is a picture parameter set.
	paramSet = 8
)
|
|
|
|
// isKeyFrame returns true if the passed frame data represents that of a keyframe
|
|
// FIXME(kortschak): Clarify and document the logic of this functions.
|
|
func isKeyFrame(frame []byte) bool {
|
|
sc := frameScanner{buf: frame}
|
|
for {
|
|
b, ok := sc.readByte()
|
|
if !ok {
|
|
return false
|
|
}
|
|
for i := 1; b == 0x00 && i < 4; i++ {
|
|
b, ok = sc.readByte()
|
|
if !ok {
|
|
return false
|
|
}
|
|
if b != 0x01 || (i != 3 && i != 2) {
|
|
continue
|
|
}
|
|
|
|
b, ok = sc.readByte()
|
|
if !ok {
|
|
return false
|
|
}
|
|
switch nalTyp := b & 0x1f; nalTyp {
|
|
case idrPic, suppEnhInf:
|
|
return true
|
|
case nonIdrPic:
|
|
return false
|
|
}
|
|
}
|
|
}
|
|
return false
|
|
}
|
|
|
|
// isSequenceHeader returns true if the passed frame data represents that of a
|
|
// a sequence header.
|
|
// FIXME(kortschak): Clarify and document the logic of this functions.
|
|
func isSequenceHeader(frame []byte) bool {
|
|
sc := frameScanner{buf: frame}
|
|
for {
|
|
b, ok := sc.readByte()
|
|
if !ok {
|
|
return false
|
|
}
|
|
for i := 1; b == 0x00 && i != 4; i++ {
|
|
b, ok = sc.readByte()
|
|
if !ok {
|
|
return false
|
|
}
|
|
if b != 0x01 || (i != 2 && i != 3) {
|
|
continue
|
|
}
|
|
|
|
b, ok = sc.readByte()
|
|
if !ok {
|
|
return false
|
|
}
|
|
switch nalTyp := b & 0x1f; nalTyp {
|
|
case suppEnhInf, seqParamSet, paramSet:
|
|
return true
|
|
case nonIdrPic, idrPic:
|
|
return false
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
// frameScanner reads a byte slice one byte at a time, front to back.
type frameScanner struct {
	// off is the index in buf of the next byte to be returned.
	off int
	// buf is the data being read.
	buf []byte
}

// readByte returns the next unread byte of the buffer and advances past it.
// ok is false, and b is 0, once every byte has been read.
func (s *frameScanner) readByte() (b byte, ok bool) {
	if s.off < len(s.buf) {
		b = s.buf[s.off]
		s.off++
		return b, true
	}
	return 0, false
}
|
|
|
|
// generate takes in raw video data from the input chan and packetises it into
|
|
// flv tags, which are then passed to the output channel.
|
|
func (e *Encoder) Encode(frame []byte) error {
|
|
var frameType byte
|
|
var packetType byte
|
|
timeStamp := e.getNextTimestamp()
|
|
// Do we have video to send off?
|
|
if e.video {
|
|
if isKeyFrame(frame) {
|
|
frameType = KeyFrameType
|
|
} else {
|
|
frameType = InterFrameType
|
|
}
|
|
if isSequenceHeader(frame) {
|
|
packetType = SequenceHeader
|
|
} else {
|
|
packetType = AVCNALU
|
|
}
|
|
|
|
tag := VideoTag{
|
|
TagType: uint8(VideoTagType),
|
|
DataSize: uint32(len(frame)) + DataHeaderLength,
|
|
Timestamp: timeStamp,
|
|
TimestampExtended: NoTimestampExtension,
|
|
FrameType: frameType,
|
|
Codec: H264,
|
|
PacketType: packetType,
|
|
CompositionTime: 0,
|
|
Data: frame,
|
|
PrevTagSize: uint32(videoHeaderSize + len(frame)),
|
|
}
|
|
_, err := e.dst.Write(tag.Bytes())
|
|
if err != nil {
|
|
return err
|
|
}
|
|
}
|
|
// Do we even have some audio to send off ?
|
|
if e.audio {
|
|
// Not sure why but we need two audio tags for dummy silent audio
|
|
// TODO: create constants or SoundSize and SoundType parameters
|
|
tag := AudioTag{
|
|
TagType: uint8(AudioTagType),
|
|
DataSize: 7,
|
|
Timestamp: timeStamp,
|
|
TimestampExtended: NoTimestampExtension,
|
|
SoundFormat: AACAudioFormat,
|
|
SoundRate: 3,
|
|
SoundSize: true,
|
|
SoundType: true,
|
|
Data: dummyAudioTag1Data,
|
|
PrevTagSize: uint32(audioSize),
|
|
}
|
|
_, err := e.dst.Write(tag.Bytes())
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
tag = AudioTag{
|
|
TagType: uint8(AudioTagType),
|
|
DataSize: 21,
|
|
Timestamp: timeStamp,
|
|
TimestampExtended: NoTimestampExtension,
|
|
SoundFormat: AACAudioFormat,
|
|
SoundRate: 3,
|
|
SoundSize: true,
|
|
SoundType: true,
|
|
Data: dummyAudioTag2Data,
|
|
PrevTagSize: uint32(22),
|
|
}
|
|
_, err = e.dst.Write(tag.Bytes())
|
|
if err != nil {
|
|
return err
|
|
}
|
|
}
|
|
|
|
return nil
|
|
}
|