av/container/flv/encoder.go

/*
NAME
  encoder.go

DESCRIPTION
  See Readme.md

AUTHOR
  Dan Kortschak <dan@ausocean.org>
  Saxon Nelson-Milton <saxon@ausocean.org>

LICENSE
  flv_generator.go is Copyright (C) 2017 the Australian Ocean Lab (AusOcean)

  It is free software: you can redistribute it and/or modify them
  under the terms of the GNU General Public License as published by the
  Free Software Foundation, either version 3 of the License, or (at your
  option) any later version.

  It is distributed in the hope that it will be useful, but WITHOUT
  ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
 for more details.

  You should have received a copy of the GNU General Public License
  along with revid in gpl.txt. If not, see http://www.gnu.org/licenses.
*/

package flv

import (
	"io"
	"time"
)

const (
	inputChanLength  = 500
	outputChanLength = 500
	audioSize        = 18
	videoHeaderSize  = 16
)

// Data representing silent audio (required for youtube)
var (
	dummyAudioTag1Data = []byte{
		0x00, 0x12, 0x08, 0x56, 0xe5, 0x00,
	}

	dummyAudioTag2Data = []byte{
		0x01, 0xdc, 0x00, 0x4c, 0x61, 0x76, 0x63, 0x35, 0x38,
		0x2e, 0x36, 0x2e, 0x31, 0x30, 0x32, 0x00, 0x02, 0x30,
		0x40, 0x0e,
	}
)

// Encoder provides properties required for the generation of flv video
// from raw video data
type Encoder struct {
	dst   io.WriteCloser
	fps   int
	audio bool
	video bool
	start time.Time
}

// NewEncoder retuns a new FLV encoder.
func NewEncoder(dst io.WriteCloser, audio, video bool, fps int) (*Encoder, error) {
	e := Encoder{
		dst:   dst,
		fps:   fps,
		audio: audio,
		video: video,
	}
	return &e, nil
}

// getNextTimestamp generates and returns the next timestamp based on current time
func (e *Encoder) getNextTimestamp() (timestamp uint32) {
	if e.start.IsZero() {
		e.start = time.Now()
		return 0
	}
	return uint32(time.Now().Sub(e.start).Seconds() * float64(1000))
}

// http://www.itu.int/rec/dologin_pub.asp?lang=e&id=T-REC-H.264-200305-S!!PDF-E&type=items
// Table 7-1 NAL unit type codes
const (
	nonIdrPic   = 1
	idrPic      = 5
	suppEnhInf  = 6
	seqParamSet = 7
	paramSet    = 8
)

// isKeyFrame returns true if the passed frame data represents that of a keyframe
// FIXME(kortschak): Clarify and document the logic of this functions.
func isKeyFrame(frame []byte) bool {
	sc := frameScanner{buf: frame}
	for {
		b, ok := sc.readByte()
		if !ok {
			return false
		}
		for i := 1; b == 0x00 && i < 4; i++ {
			b, ok = sc.readByte()
			if !ok {
				return false
			}
			if b != 0x01 || (i != 3 && i != 2) {
				continue
			}

			b, ok = sc.readByte()
			if !ok {
				return false
			}
			switch nalTyp := b & 0x1f; nalTyp {
			case idrPic:
				return true
			case nonIdrPic:
				return false
			}
		}
	}
	return false
}

// isSequenceHeader returns true if the passed frame data represents that of a
// a sequence header.
// FIXME(kortschak): Clarify and document the logic of this functions.
func isSequenceHeader(frame []byte) bool {
	sc := frameScanner{buf: frame}
	for {
		b, ok := sc.readByte()
		if !ok {
			return false
		}
		for i := 1; b == 0x00 && i != 4; i++ {
			b, ok = sc.readByte()
			if !ok {
				return false
			}
			if b != 0x01 || (i != 2 && i != 3) {
				continue
			}

			b, ok = sc.readByte()
			if !ok {
				return false
			}
			switch nalTyp := b & 0x1f; nalTyp {
			case suppEnhInf, seqParamSet, paramSet:
				return true
			case nonIdrPic, idrPic:
				return false
			}
		}
	}
}

type frameScanner struct {
	off int
	buf []byte
}

func (s *frameScanner) readByte() (b byte, ok bool) {
	if s.off >= len(s.buf) {
		return 0, false
	}
	b = s.buf[s.off]
	s.off++
	return b, true
}

// write implements io.Writer. It takes raw h264 and encodes into flv, then
// writes to the encoders io.Writer destination.
func (e *Encoder) Write(frame []byte) (int, error) {
	var frameType byte
	var packetType byte
	if e.start.IsZero() {
		// This is the first frame, so write the PreviousTagSize0.
		//
		// See https://download.macromedia.com/f4v/video_file_format_spec_v10_1.pdf
		// section E.3.
		var zero [4]byte
		_, err := e.dst.Write(zero[:])
		if err != nil {
			return 0, err
		}
	}
	timeStamp := e.getNextTimestamp()
	// Do we have video to send off?
	if e.video {
		if isKeyFrame(frame) {
			frameType = KeyFrameType
		} else {
			frameType = InterFrameType
		}
		if isSequenceHeader(frame) {
			packetType = SequenceHeader
		} else {
			packetType = AVCNALU
		}

		tag := VideoTag{
			TagType:           uint8(VideoTagType),
			DataSize:          uint32(len(frame)) + DataHeaderLength,
			Timestamp:         timeStamp,
			TimestampExtended: NoTimestampExtension,
			FrameType:         frameType,
			Codec:             H264,
			PacketType:        packetType,
			CompositionTime:   0,
			Data:              frame,
			PrevTagSize:       uint32(videoHeaderSize + len(frame)),
		}
		_, err := e.dst.Write(tag.Bytes())
		if err != nil {
			return len(frame), err
		}
	}
	// Do we even have some audio to send off ?
	if e.audio {
		// Not sure why but we need two audio tags for dummy silent audio
		// TODO: create constants or SoundSize and SoundType parameters
		tag := AudioTag{
			TagType:           uint8(AudioTagType),
			DataSize:          7,
			Timestamp:         timeStamp,
			TimestampExtended: NoTimestampExtension,
			SoundFormat:       AACAudioFormat,
			SoundRate:         3,
			SoundSize:         true,
			SoundType:         true,
			Data:              dummyAudioTag1Data,
			PrevTagSize:       uint32(audioSize),
		}
		_, err := e.dst.Write(tag.Bytes())
		if err != nil {
			return len(frame), err
		}

		tag = AudioTag{
			TagType:           uint8(AudioTagType),
			DataSize:          21,
			Timestamp:         timeStamp,
			TimestampExtended: NoTimestampExtension,
			SoundFormat:       AACAudioFormat,
			SoundRate:         3,
			SoundSize:         true,
			SoundType:         true,
			Data:              dummyAudioTag2Data,
			PrevTagSize:       uint32(22),
		}
		_, err = e.dst.Write(tag.Bytes())
		if err != nil {
			return len(frame), err
		}
	}

	return len(frame), nil
}

// Close will close the encoder destination.
func (e *Encoder) Close() error {
	return e.dst.Close()
}
providing install_soft build target 2022-05-31 08:17:06 +03:00			`/*`
			`NAME`
			`encoder.go`

			`DESCRIPTION`
			`See Readme.md`

			`AUTHOR`
			`Dan Kortschak <dan@ausocean.org>`
			`Saxon Nelson-Milton <saxon@ausocean.org>`

			`LICENSE`
			`flv_generator.go is Copyright (C) 2017 the Australian Ocean Lab (AusOcean)`

			`It is free software: you can redistribute it and/or modify them`
			`under the terms of the GNU General Public License as published by the`
			`Free Software Foundation, either version 3 of the License, or (at your`
			`option) any later version.`

			`It is distributed in the hope that it will be useful, but WITHOUT`
			`ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or`
			`FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License`
			`for more details.`

			`You should have received a copy of the GNU General Public License`
			`along with revid in gpl.txt. If not, see http://www.gnu.org/licenses.`
			`*/`

			`package flv`

			`import (`
			`"io"`
			`"time"`
			`)`

			`const (`
			`inputChanLength = 500`
			`outputChanLength = 500`
			`audioSize = 18`
			`videoHeaderSize = 16`
			`)`

			`// Data representing silent audio (required for youtube)`
			`var (`
			`dummyAudioTag1Data = []byte{`
			`0x00, 0x12, 0x08, 0x56, 0xe5, 0x00,`
			`}`

			`dummyAudioTag2Data = []byte{`
			`0x01, 0xdc, 0x00, 0x4c, 0x61, 0x76, 0x63, 0x35, 0x38,`
			`0x2e, 0x36, 0x2e, 0x31, 0x30, 0x32, 0x00, 0x02, 0x30,`
			`0x40, 0x0e,`
			`}`
			`)`

			`// Encoder provides properties required for the generation of flv video`
			`// from raw video data`
			`type Encoder struct {`
			`dst io.WriteCloser`
			`fps int`
			`audio bool`
			`video bool`
			`start time.Time`
			`}`

			`// NewEncoder retuns a new FLV encoder.`
			`func NewEncoder(dst io.WriteCloser, audio, video bool, fps int) (*Encoder, error) {`
			`e := Encoder{`
			`dst: dst,`
			`fps: fps,`
			`audio: audio,`
			`video: video,`
			`}`
			`return &e, nil`
			`}`

			`// getNextTimestamp generates and returns the next timestamp based on current time`
			`func (e *Encoder) getNextTimestamp() (timestamp uint32) {`
			`if e.start.IsZero() {`
			`e.start = time.Now()`
			`return 0`
			`}`
			`return uint32(time.Now().Sub(e.start).Seconds() * float64(1000))`
			`}`

			`// http://www.itu.int/rec/dologin_pub.asp?lang=e&id=T-REC-H.264-200305-S!!PDF-E&type=items`
			`// Table 7-1 NAL unit type codes`
			`const (`
			`nonIdrPic = 1`
			`idrPic = 5`
			`suppEnhInf = 6`
			`seqParamSet = 7`
			`paramSet = 8`
			`)`

			`// isKeyFrame returns true if the passed frame data represents that of a keyframe`
			`// FIXME(kortschak): Clarify and document the logic of this functions.`
			`func isKeyFrame(frame []byte) bool {`
			`sc := frameScanner{buf: frame}`
			`for {`
			`b, ok := sc.readByte()`
			`if !ok {`
			`return false`
			`}`
			`for i := 1; b == 0x00 && i < 4; i++ {`
			`b, ok = sc.readByte()`
			`if !ok {`
			`return false`
			`}`
			`if b != 0x01 \|\| (i != 3 && i != 2) {`
			`continue`
			`}`

			`b, ok = sc.readByte()`
			`if !ok {`
			`return false`
			`}`
			`switch nalTyp := b & 0x1f; nalTyp {`
			`case idrPic:`
			`return true`
			`case nonIdrPic:`
			`return false`
			`}`
			`}`
			`}`
			`return false`
			`}`

			`// isSequenceHeader returns true if the passed frame data represents that of a`
			`// a sequence header.`
			`// FIXME(kortschak): Clarify and document the logic of this functions.`
			`func isSequenceHeader(frame []byte) bool {`
			`sc := frameScanner{buf: frame}`
			`for {`
			`b, ok := sc.readByte()`
			`if !ok {`
			`return false`
			`}`
			`for i := 1; b == 0x00 && i != 4; i++ {`
			`b, ok = sc.readByte()`
			`if !ok {`
			`return false`
			`}`
			`if b != 0x01 \|\| (i != 2 && i != 3) {`
			`continue`
			`}`

			`b, ok = sc.readByte()`
			`if !ok {`
			`return false`
			`}`
			`switch nalTyp := b & 0x1f; nalTyp {`
			`case suppEnhInf, seqParamSet, paramSet:`
			`return true`
			`case nonIdrPic, idrPic:`
			`return false`
			`}`
			`}`
			`}`
			`}`

			`type frameScanner struct {`
			`off int`
			`buf []byte`
			`}`

			`func (s *frameScanner) readByte() (b byte, ok bool) {`
			`if s.off >= len(s.buf) {`
			`return 0, false`
			`}`
			`b = s.buf[s.off]`
			`s.off++`
			`return b, true`
			`}`

			`// write implements io.Writer. It takes raw h264 and encodes into flv, then`
			`// writes to the encoders io.Writer destination.`
			`func (e *Encoder) Write(frame []byte) (int, error) {`
			`var frameType byte`
			`var packetType byte`
			`if e.start.IsZero() {`
			`// This is the first frame, so write the PreviousTagSize0.`
			`//`
			`// See https://download.macromedia.com/f4v/video_file_format_spec_v10_1.pdf`
			`// section E.3.`
			`var zero [4]byte`
			`_, err := e.dst.Write(zero[:])`
			`if err != nil {`
			`return 0, err`
			`}`
			`}`
			`timeStamp := e.getNextTimestamp()`
			`// Do we have video to send off?`
			`if e.video {`
			`if isKeyFrame(frame) {`
			`frameType = KeyFrameType`
			`} else {`
			`frameType = InterFrameType`
			`}`
			`if isSequenceHeader(frame) {`
			`packetType = SequenceHeader`
			`} else {`
			`packetType = AVCNALU`
			`}`

			`tag := VideoTag{`
			`TagType: uint8(VideoTagType),`
			`DataSize: uint32(len(frame)) + DataHeaderLength,`
			`Timestamp: timeStamp,`
			`TimestampExtended: NoTimestampExtension,`
			`FrameType: frameType,`
			`Codec: H264,`
			`PacketType: packetType,`
			`CompositionTime: 0,`
			`Data: frame,`
			`PrevTagSize: uint32(videoHeaderSize + len(frame)),`
			`}`
			`_, err := e.dst.Write(tag.Bytes())`
			`if err != nil {`
			`return len(frame), err`
			`}`
			`}`
			`// Do we even have some audio to send off ?`
			`if e.audio {`
			`// Not sure why but we need two audio tags for dummy silent audio`
			`// TODO: create constants or SoundSize and SoundType parameters`
			`tag := AudioTag{`
			`TagType: uint8(AudioTagType),`
			`DataSize: 7,`
			`Timestamp: timeStamp,`
			`TimestampExtended: NoTimestampExtension,`
			`SoundFormat: AACAudioFormat,`
			`SoundRate: 3,`
			`SoundSize: true,`
			`SoundType: true,`
			`Data: dummyAudioTag1Data,`
			`PrevTagSize: uint32(audioSize),`
			`}`
			`_, err := e.dst.Write(tag.Bytes())`
			`if err != nil {`
			`return len(frame), err`
			`}`

			`tag = AudioTag{`
			`TagType: uint8(AudioTagType),`
			`DataSize: 21,`
			`Timestamp: timeStamp,`
			`TimestampExtended: NoTimestampExtension,`
			`SoundFormat: AACAudioFormat,`
			`SoundRate: 3,`
			`SoundSize: true,`
			`SoundType: true,`
			`Data: dummyAudioTag2Data,`
			`PrevTagSize: uint32(22),`
			`}`
			`_, err = e.dst.Write(tag.Bytes())`
			`if err != nil {`
			`return len(frame), err`
			`}`
			`}`

			`return len(frame), nil`
			`}`

			`// Close will close the encoder destination.`
			`func (e *Encoder) Close() error {`
			`return e.dst.Close()`
			`}`