/* NAME encoder.go AUTHOR Dan Kortschak Saxon Nelson-Milton LICENSE encoder.go is Copyright (C) 2017-2018 the Australian Ocean Lab (AusOcean) It is free software: you can redistribute it and/or modify them under the terms of the GNU General Public License as published by the Free Software Foundation, either version 3 of the License, or (at your option) any later version. It is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with revid in gpl.txt. If not, see http://www.gnu.org/licenses. */ package mts import ( "fmt" "io" "strconv" "sync" "time" "bitbucket.org/ausocean/av/codec/h264" "bitbucket.org/ausocean/av/container/mts/meta" "bitbucket.org/ausocean/av/container/mts/pes" "bitbucket.org/ausocean/av/container/mts/psi" ) // Some common manifestations of PSI. var ( // StandardPAT is a minimal PAT. StandardPAT = psi.PSI{ Pf: 0x00, Tid: 0x00, Ssi: true, Pb: false, Sl: 0x0d, Tss: &psi.TSS{ Tide: 0x01, V: 0, Cni: true, Sn: 0, Lsn: 0, Sd: &psi.PAT{ Pn: 0x01, Pmpid: 0x1000, }, }, } // Base PMT is a minimal PMT without specific data. BasePMT = psi.PSI{ Pf: 0x00, Tid: 0x02, Ssi: true, Sl: 0x12, Tss: &psi.TSS{ Tide: 0x01, V: 0, Cni: true, Sn: 0, Lsn: 0, }, } ) const ( psiInterval = 1 * time.Second psiSendCount = 7 ) // Meta allows addition of metadata to encoded mts from outside of this pkg. // See meta pkg for usage. // // TODO: make this not global. var Meta *meta.Data var ( patTable = StandardPAT.Bytes() pmtTable []byte ) const ( H264ID = 27 H265ID = 36 audioStreamID = 0xc0 // First audio stream ID. ) // Constants used to communicate which media codec will be packetized. const ( EncodeH264 = iota EncodeH265 EncodeAudio ) // Time-related constants. const ( // ptsOffset is the offset added to the clock to determine // the current presentation timestamp. ptsOffset = 700 * time.Millisecond // PCRFrequency is the base Program Clock Reference frequency in Hz. PCRFrequency = 90000 // PTSFrequency is the presentation timestamp frequency in Hz. PTSFrequency = 90000 // MaxPTS is the largest PTS value (i.e., for a 33-bit unsigned integer). MaxPTS = (1 << 33) - 1 ) // Globals for use in keeping real time. var ( realRefTime time.Time // Holds a reference real time given to SetTime. sysRefTime time.Time // Holds a system reference time set when realRefTime is obtained. timeIsSet bool // Indicates if the time has been set. mu = sync.Mutex{} // Used when accessing/mutating above time vars. ) // SetTime allows setting of current time. This is useful if the system running // this encoder does not have time keeping. The user may wish to obtain an // accurate time from an NTP server or local machine and pass to this function. func SetTime(t time.Time) { mu.Lock() realRefTime = t sysRefTime = time.Now() timeIsSet = true mu.Unlock() } // Time provides either a real time that has been calculated from a reference // set by SetTime, or using the current system time. func Time() time.Time { mu.Lock() t := realRefTime.Add(time.Now().Sub(sysRefTime)) mu.Unlock() return t } // TimeIsSet returns true if SetTime has been used to set a real reference time. func TimeIsSet() bool { mu.Lock() b := timeIsSet mu.Unlock() return b } // Encoder encapsulates properties of an MPEG-TS generator. type Encoder struct { dst io.WriteCloser clock time.Duration lastTime time.Time writePeriod time.Duration ptsOffset time.Duration tsSpace [PacketSize]byte pesSpace [pes.MaxPesSize]byte continuity map[int]byte nalBasedPSI bool pktCount int psiSendCount int mediaPid int streamID byte } // NewEncoder returns an Encoder with the specified media type and rate eg. if a video stream // calls write for every frame, the rate will be the frame rate of the video. func NewEncoder(dst io.WriteCloser, rate float64, mediaType int) *Encoder { var mPid int var sid byte switch mediaType { case EncodeAudio: mPid = AudioPid sid = audioStreamID case EncodeH265: mPid = VideoPid sid = H265ID case EncodeH264: mPid = VideoPid sid = H264ID } pmt := BasePMT pmt.Tss.Sd = &psi.PMT{ Pcrpid: 0x0100, Pil: 0, Essd: &psi.ESSD{ St: byte(sid), Epid: 0x0100, Esil: 0x00, }, } pmtTable = pmt.Bytes() return &Encoder{ dst: dst, writePeriod: time.Duration(float64(time.Second) / rate), ptsOffset: ptsOffset, nalBasedPSI: true, pktCount: 8, mediaPid: mPid, streamID: sid, continuity: map[int]byte{ PatPid: 0, PmtPid: 0, mPid: 0, }, } } const ( hasPayload = 0x1 hasAdaptationField = 0x2 ) const ( hasDTS = 0x1 hasPTS = 0x2 ) func (e *Encoder) NALBasedPSI(b bool, sendCount int) { e.nalBasedPSI = b e.psiSendCount = sendCount e.pktCount = e.psiSendCount } // Write implements io.Writer. Write takes raw video or audio data and encodes into MPEG-TS, // then sending it to the encoder's io.Writer destination. func (e *Encoder) Write(data []byte) (int, error) { if e.nalBasedPSI { nalType, err := h264.NALType(data) if err != nil { return 0, fmt.Errorf("could not get type from NAL unit, failed with error: %v", err) } // NAL type that will signify refresh. These are defined in H.264 specifications // table 7-1. const nalTypeSPS = 7 if nalType == nalTypeSPS { err := e.writePSI() if err != nil { return 0, err } } } else if e.pktCount >= e.psiSendCount { e.pktCount = 0 err := e.writePSI() if err != nil { return 0, err } } // Prepare PES data. pesPkt := pes.Packet{ StreamID: e.streamID, PDI: hasPTS, PTS: e.pts(), Data: data, HeaderLength: 5, } buf := pesPkt.Bytes(e.pesSpace[:pes.MaxPesSize]) pusi := true for len(buf) != 0 { pkt := Packet{ PUSI: pusi, PID: uint16(e.mediaPid), RAI: pusi, CC: e.ccFor(e.mediaPid), AFC: hasAdaptationField | hasPayload, PCRF: pusi, } n := pkt.FillPayload(buf) buf = buf[n:] if pusi { // If the packet has a Payload Unit Start Indicator // flag set then we need to write a PCR. pkt.PCR = e.pcr() pusi = false } _, err := e.dst.Write(pkt.Bytes(e.tsSpace[:PacketSize])) if err != nil { return len(data), err } e.pktCount++ } e.tick() return len(data), nil } // writePSI creates MPEG-TS with pat and pmt tables - with pmt table having updated // location and time data. func (e *Encoder) writePSI() error { // Write PAT. patPkt := Packet{ PUSI: true, PID: PatPid, CC: e.ccFor(PatPid), AFC: hasPayload, Payload: psi.AddPadding(patTable), } _, err := e.dst.Write(patPkt.Bytes(e.tsSpace[:PacketSize])) if err != nil { return err } e.pktCount++ pmtTable, err = updateMeta(pmtTable) if err != nil { return err } // Create mts packet from pmt table. pmtPkt := Packet{ PUSI: true, PID: PmtPid, CC: e.ccFor(PmtPid), AFC: hasPayload, Payload: psi.AddPadding(pmtTable), } _, err = e.dst.Write(pmtPkt.Bytes(e.tsSpace[:PacketSize])) if err != nil { return err } e.pktCount++ return nil } // tick advances the clock one frame interval. func (e *Encoder) tick() { e.clock += e.writePeriod } // pts retuns the current presentation timestamp. func (e *Encoder) pts() uint64 { return uint64((e.clock + e.ptsOffset).Seconds() * PTSFrequency) } // pcr returns the current program clock reference. func (e *Encoder) pcr() uint64 { return uint64(e.clock.Seconds() * PCRFrequency) } // ccFor returns the next continuity counter for pid. func (e *Encoder) ccFor(pid int) byte { cc := e.continuity[pid] const continuityCounterMask = 0xf e.continuity[pid] = (cc + 1) & continuityCounterMask return cc } // updateMeta adds/updates a metaData descriptor in the given psi bytes using data // contained in the global Meta struct. func updateMeta(b []byte) ([]byte, error) { p := psi.PSIBytes(b) if TimeIsSet() { Meta.Add("ts", strconv.Itoa(int(Time().Unix()))) } err := p.AddDescriptor(psi.MetadataTag, Meta.Encode()) return []byte(p), err } func (e *Encoder) Close() error { return e.dst.Close() }