Squash: Fix rtc to rtmp sync timestamp using sender report. #2470

2025-03-09 15:49:59 +00:00 · 2021-08-17 07:25:03 +08:00 · 2021-08-17 07:25:03 +08:00 · 85620a34f5
commit 85620a34f5
parent 3d58e98d1c
309 changed files with 14837 additions and 8525 deletions
--- a/trunk/3rdparty/srs-bench/vendor/github.com/ossrs/go-oryx-lib/aac/aac.go
+++ b/trunk/3rdparty/srs-bench/vendor/github.com/ossrs/go-oryx-lib/aac/aac.go
@ -0,0 +1,516 @@
+// The MIT License (MIT)
+//
+// Copyright (c) 2013-2017 Oryx(ossrs)
+//
+// Permission is hereby granted, free of charge, to any person obtaining a copy of
+// this software and associated documentation files (the "Software"), to deal in
+// the Software without restriction, including without limitation the rights to
+// use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of
+// the Software, and to permit persons to whom the Software is furnished to do so,
+// subject to the following conditions:
+//
+// The above copyright notice and this permission notice shall be included in all
+// copies or substantial portions of the Software.
+//
+// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS
+// FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR
+// COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER
+// IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
+// CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
+
+// The oryx AAC package includes some utilities.
+package aac
+
+import (
+	"github.com/ossrs/go-oryx-lib/errors"
+)
+
+// ADTS muxes and demuxes AAC frames in the ADTS format.
+// We can encode the RAW AAC frame in ADTS muxer.
+// We can also decode the ADTS data to RAW AAC frame.
+type ADTS interface {
+	// SetASC sets the ASC, the codec information.
+	// Before encoding raw frame, user must set the asc.
+	SetASC(asc []byte) (err error)
+	// Encode the raw aac frame to adts data.
+	// @remark User must set the asc first.
+	Encode(raw []byte) (adts []byte, err error)
+
+	// Decode the adts data to raw frame.
+	// @remark User can get the asc after decode ok.
+	// @remark When left is not empty, user must decode it again.
+	Decode(adts []byte) (raw, left []byte, err error)
+	// ASC gets the ASC, the codec information.
+	// After decoding adts data or setting the asc, user can use this API to get it.
+	ASC() *AudioSpecificConfig
+}
+
+// ObjectType is the AAC object type in RAW AAC frame.
+// Refer to @doc ISO_IEC_14496-3-AAC-2001.pdf, @page 23, @section 1.5.1.1 Audio object type definition
+type ObjectType uint8
+
+const (
+	ObjectTypeForbidden ObjectType = 0
+
+	ObjectTypeMain ObjectType = 1
+	ObjectTypeLC   ObjectType = 2
+	ObjectTypeSSR  ObjectType = 3
+
+	ObjectTypeHE   ObjectType = 5  // HE=LC+SBR
+	ObjectTypeHEv2 ObjectType = 29 // HEv2=LC+SBR+PS
+)
+
+// String returns the short name of the object type,
+// or "Forbidden" for any value without a named constant.
+func (v ObjectType) String() string {
+	if v == ObjectTypeMain {
+		return "Main"
+	}
+	if v == ObjectTypeLC {
+		return "LC"
+	}
+	if v == ObjectTypeSSR {
+		return "SSR"
+	}
+	if v == ObjectTypeHE {
+		return "HE"
+	}
+	if v == ObjectTypeHEv2 {
+		return "HEv2"
+	}
+	return "Forbidden"
+}
+
+// ToProfile converts the object type to the ADTS profile.
+// HE and HEv2 are mapped to the LC profile, unknown values to ProfileForbidden.
+func (v ObjectType) ToProfile() Profile {
+	if v == ObjectTypeMain {
+		return ProfileMain
+	}
+	if v == ObjectTypeLC || v == ObjectTypeHE || v == ObjectTypeHEv2 {
+		return ProfileLC
+	}
+	if v == ObjectTypeSSR {
+		return ProfileSSR
+	}
+	return ProfileForbidden
+}
+
+// Profile is the profile of AAC in ADTS.
+// Refer to @doc ISO_IEC_13818-7-AAC-2004.pdf, @page 40, @section 7.1 Profiles
+type Profile uint8
+
+const (
+	ProfileMain      Profile = 0
+	ProfileLC        Profile = 1
+	ProfileSSR       Profile = 2
+	ProfileForbidden Profile = 3
+)
+
+// String returns the short name of the profile,
+// or "Forbidden" for ProfileForbidden and anything above it.
+func (v Profile) String() string {
+	names := [...]string{"Main", "LC", "SSR"}
+	if int(v) < len(names) {
+		return names[v]
+	}
+	return "Forbidden"
+}
+
+// ToObjectType converts the ADTS profile to the AAC object type,
+// unknown profiles are converted to ObjectTypeForbidden.
+func (v Profile) ToObjectType() ObjectType {
+	objects := [...]ObjectType{
+		ProfileMain: ObjectTypeMain,
+		ProfileLC:   ObjectTypeLC,
+		ProfileSSR:  ObjectTypeSSR,
+	}
+	if int(v) < len(objects) {
+		return objects[v]
+	}
+	return ObjectTypeForbidden
+}
+
+// SampleRateIndex is the aac sample rate index.
+// Refer to @doc ISO_IEC_13818-7-AAC-2004.pdf, @page 46, @section Table 35 – Sampling frequency
+type SampleRateIndex uint8
+
+const (
+	SampleRateIndex96kHz SampleRateIndex = iota
+	SampleRateIndex88kHz
+	SampleRateIndex64kHz
+	SampleRateIndex48kHz
+	SampleRateIndex44kHz
+	SampleRateIndex32kHz
+	SampleRateIndex24kHz
+	SampleRateIndex22kHz
+	SampleRateIndex16kHz
+	SampleRateIndex12kHz
+	SampleRateIndex11kHz
+	SampleRateIndex8kHz
+	SampleRateIndex7kHz
+	SampleRateIndexReserved0
+	SampleRateIndexReserved1
+	SampleRateIndexReserved2
+	SampleRateIndexReserved3
+	SampleRateIndexForbidden
+)
+
+// String returns the name of the sample rate index: the rounded rate for
+// the defined indexes, "Reserved" for the reserved ones and "Forbidden" for
+// everything else.
+func (v SampleRateIndex) String() string {
+	switch v {
+	case SampleRateIndex96kHz:
+		return "96kHz"
+	case SampleRateIndex88kHz:
+		return "88kHz"
+	case SampleRateIndex64kHz:
+		return "64kHz"
+	case SampleRateIndex48kHz:
+		return "48kHz"
+	case SampleRateIndex44kHz:
+		return "44kHz"
+	case SampleRateIndex32kHz:
+		return "32kHz"
+	case SampleRateIndex24kHz:
+		return "24kHz"
+	case SampleRateIndex22kHz:
+		return "22kHz"
+	case SampleRateIndex16kHz:
+		return "16kHz"
+	case SampleRateIndex12kHz:
+		return "12kHz"
+	case SampleRateIndex11kHz:
+		return "11kHz"
+	case SampleRateIndex8kHz:
+		return "8kHz"
+	case SampleRateIndex7kHz:
+		return "7kHz"
+	case SampleRateIndexReserved0, SampleRateIndexReserved1, SampleRateIndexReserved2, SampleRateIndexReserved3:
+		return "Reserved"
+	default:
+		return "Forbidden"
+	}
+}
+
+// ToHz converts the sample rate index to the sampling frequency in Hz.
+// It returns 0 for the reserved indexes, for SampleRateIndexForbidden and
+// for any other value that has no frequency, it never panics.
+func (v SampleRateIndex) ToHz() int {
+	aacSR := [...]int{
+		96000, 88200, 64000, 48000,
+		44100, 32000, 24000, 22050,
+		16000, 12000, 11025, 8000,
+		7350,
+	}
+	// The index is a uint8 that may hold any value, for example the
+	// forbidden one, so it must be checked before indexing the table.
+	if int(v) >= len(aacSR) {
+		return 0
+	}
+	return aacSR[v]
+}
+
+// Channels is the aac channel configuration.
+// Refer to @doc ISO_IEC_13818-7-AAC-2004.pdf, @page 72, @section Table 42 – Implicit speaker mapping
+type Channels uint8
+
+const (
+	ChannelForbidden Channels = iota
+	// center front speaker
+	// FFMPEG: mono           FC
+	ChannelMono
+	// left, right front speakers
+	// FFMPEG: stereo         FL+FR
+	ChannelStereo
+	// center front speaker, left, right front speakers
+	// FFMPEG: 2.1            FL+FR+LFE
+	// FFMPEG: 3.0            FL+FR+FC
+	// FFMPEG: 3.0(back)      FL+FR+BC
+	Channel3
+	// center front speaker, left, right center front speakers, rear surround
+	// FFMPEG: 4.0            FL+FR+FC+BC
+	// FFMPEG: quad           FL+FR+BL+BR
+	// FFMPEG: quad(side)     FL+FR+SL+SR
+	// FFMPEG: 3.1            FL+FR+FC+LFE
+	Channel4
+	// center front speaker, left, right front speakers, left surround, right surround rear speakers
+	// FFMPEG: 5.0            FL+FR+FC+BL+BR
+	// FFMPEG: 5.0(side)      FL+FR+FC+SL+SR
+	// FFMPEG: 4.1            FL+FR+FC+LFE+BC
+	Channel5
+	// center front speaker, left, right front speakers, left surround, right surround rear speakers,
+	// front low frequency effects speaker
+	// FFMPEG: 5.1            FL+FR+FC+LFE+BL+BR
+	// FFMPEG: 5.1(side)      FL+FR+FC+LFE+SL+SR
+	// FFMPEG: 6.0            FL+FR+FC+BC+SL+SR
+	// FFMPEG: 6.0(front)     FL+FR+FLC+FRC+SL+SR
+	// FFMPEG: hexagonal      FL+FR+FC+BL+BR+BC
+	Channel5_1 // value 6
+	// center front speaker, left, right center front speakers, left, right outside front speakers,
+	// left surround, right surround rear speakers, front low frequency effects speaker
+	// FFMPEG: 7.1            FL+FR+FC+LFE+BL+BR+SL+SR
+	// FFMPEG: 7.1(wide)      FL+FR+FC+LFE+BL+BR+FLC+FRC
+	// FFMPEG: 7.1(wide-side) FL+FR+FC+LFE+FLC+FRC+SL+SR
+	Channel7_1 // value 7
+	// The FFMPEG layouts below have no constant defined here:
+	// FFMPEG: 6.1            FL+FR+FC+LFE+BC+SL+SR
+	// FFMPEG: 6.1(back)      FL+FR+FC+LFE+BL+BR+BC
+	// FFMPEG: 6.1(front)     FL+FR+LFE+FLC+FRC+SL+SR
+	// FFMPEG: 7.0            FL+FR+FC+BL+BR+SL+SR
+	// FFMPEG: 7.0(front)     FL+FR+FC+FLC+FRC+SL+SR
+)
+
+// String returns the speaker layout of the channel configuration,
+// or "Forbidden" for ChannelForbidden and any value above Channel7_1.
+func (v Channels) String() string {
+	layouts := [...]string{
+		ChannelMono:   "Mono(FC)",
+		ChannelStereo: "Stereo(FL+FR)",
+		Channel3:      "FL+FR+FC",
+		Channel4:      "FL+FR+FC+BC",
+		Channel5:      "FL+FR+FC+SL+SR",
+		Channel5_1:    "FL+FR+FC+LFE+SL+SR",
+		Channel7_1:    "FL+FR+FC+LFE+BL+BR+SL+SR",
+	}
+	if v == ChannelForbidden || int(v) >= len(layouts) {
+		return "Forbidden"
+	}
+	return layouts[v]
+}
+
+// ADTSImpl is the implementation behind the ADTS interface, it keeps the
+// codec information (ASC) which Encode reads and Decode updates.
+// Please use NewADTS() and interface ADTS instead.
+// It's only exposed for example.
+type ADTSImpl struct {
+	asc AudioSpecificConfig
+}
+
+// NewADTS creates an ADTS codec with an empty ASC, the returned error is always nil.
+func NewADTS() (ADTS, error) {
+	return &ADTSImpl{}, nil
+}
+
+// SetASC parses the binary AudioSpecificConfig and keeps it as the codec information.
+// It returns the error reported by AudioSpecificConfig.UnmarshalBinary.
+func (v *ADTSImpl) SetASC(asc []byte) (err error) {
+	return v.asc.UnmarshalBinary(asc)
+}
+
+// Encode prepends a 7 bytes ADTS header (without CRC) to the raw aac frame.
+//
+// The ASC must be valid, see SetASC, otherwise an error is returned.
+// An error is also returned when the frame, header included, does not fit
+// in the 13 bits aac_frame_length field, because the length would be
+// truncated silently and the stream would be corrupt.
+func (v *ADTSImpl) Encode(raw []byte) (data []byte, err error) {
+	if err = v.asc.validate(); err != nil {
+		return nil, errors.WithMessage(err, "adts encode")
+	}
+
+	// Refer to @doc ISO_IEC_13818-7-AAC-2004.pdf, @page 26, @section 6.2 Audio Data Transport Stream, ADTS
+	// adts_fixed_header is 28bits and adts_variable_header is 28bits, 56bits(7bytes) in total.
+	// We always set protection_absent, so there is no 16bits adts_error_check.
+	const (
+		adtsHeaderSize = 7
+		// aac_frame_length is 13 bits.
+		maxFrameLength = 0x1fff
+	)
+	if len(raw) > maxFrameLength-adtsHeaderSize {
+		return nil, errors.Errorf("adts encode: frame %v bytes exceeds max %v",
+			len(raw)+adtsHeaderSize, maxFrameLength)
+	}
+
+	// Reserve the room for the raw frame, so the final append never reallocates.
+	p := make([]byte, adtsHeaderSize, adtsHeaderSize+len(raw))
+
+	// Syncword 12 bslbf, the first 8 bits.
+	p[0] = byte(0xff)
+	// The last 4 bits of syncword, then 4bits left.
+	// Refer to @doc ISO_IEC_13818-7-AAC-2004.pdf, @page 27, @section 6.2.1 Fixed Header of ADTS
+	// ID 1 bslbf, written as 0.
+	// Layer 2 uimsbf, written as 0.
+	// protection_absent 1 bslbf, written as 1.
+	p[1] = byte(0xf1)
+
+	// profile 2 uimsbf
+	// sampling_frequency_index 4 uimsbf
+	// private_bit 1 bslbf
+	// channel_configuration 3 uimsbf, the highest bit here and the lower 2 bits in next byte.
+	// original/copy 1 bslbf
+	// home 1 bslbf
+	profile := v.asc.Object.ToProfile()
+	p[2] = byte((profile<<6)&0xc0) | byte((v.asc.SampleRate<<2)&0x3c) | byte((v.asc.Channels>>2)&0x01)
+
+	// 4bits left.
+	// Refer to @doc ISO_IEC_13818-7-AAC-2004.pdf, @page 27, @section 6.2.2 Variable Header of ADTS
+	// copyright_identification_bit 1 bslbf
+	// copyright_identification_start 1 bslbf
+	// aac_frame_length 13 bslbf: Length of the frame including headers and error_check in bytes.
+	// use the left 2bits as the 13 and 12 bit,
+	// the aac_frame_length is 13bits, so we move 13-2=11.
+	aacFrameLength := uint16(len(raw) + adtsHeaderSize)
+	p[3] = byte((v.asc.Channels<<6)&0xc0) | byte((aacFrameLength>>11)&0x03)
+	// The middle 8 bits of aac_frame_length.
+	p[4] = byte(aacFrameLength >> 3)
+	// The lowest 3 bits of aac_frame_length,
+	// then the higher 5 bits of adts_buffer_fullness 11 bslbf, written as 0.
+	p[5] = byte(aacFrameLength<<5) & byte(0xe0)
+
+	// The lower 6 bits of adts_buffer_fullness, written as 1,
+	// then no_raw_data_blocks_in_frame 2 uimsbf, written as 0.
+	p[6] = byte(0xfc)
+
+	return append(p, raw...), nil
+}
+
+// Decode parses one ADTS frame from data.
+//
+// It returns the raw aac frame in raw and the bytes after this frame in left,
+// both are slices of data and not copies. The codec information is updated
+// only when the frame is decoded ok, then user can get it by ASC().
+//
+// An error is returned when data is too short, the syncword is not matched,
+// the frame length is less than the header, or the codec information is invalid.
+func (v *ADTSImpl) Decode(data []byte) (raw, left []byte, err error) {
+	// Read the ADTS header.
+	// Refer to @doc ISO_IEC_13818-7-AAC-2004.pdf, @page 26, @section 6.2 Audio Data Transport Stream, ADTS
+	// @see https://github.com/ossrs/srs/issues/212#issuecomment-64145885
+	// byte_alignment()
+	p := data
+	if len(p) < 7 {
+		return nil, nil, errors.Errorf("requires 7+ but only %v bytes", len(p))
+	}
+
+	// Syncword 12 bslbf, must match 12bits 0xFFF.
+	if p[0] != 0xff || p[1]&0xf0 != 0xf0 {
+		return nil, nil, errors.Errorf("invalid signature %#x", uint8(p[1]&0xf0))
+	}
+
+	// 4bits left.
+	// Refer to @doc ISO_IEC_13818-7-AAC-2004.pdf, @page 27, @section 6.2.1 Fixed Header of ADTS
+	// ID 1 bslbf
+	// layer 2 uimsbf
+	// protection_absent 1 bslbf
+	//
+	// ID: MPEG identifier, set to '1' if the audio data in the ADTS stream are MPEG-2 AAC (See ISO/IEC 13818-7)
+	// and set to '0' if the audio data are MPEG-4. See also ISO/IEC 11172-3, subclause 2.4.2.3.
+	// Well, some system always use 0, but actually is aac format, so we ignore the ID and layer.
+	protectionAbsent := uint8(p[1]) & 0x01
+
+	sfiv := uint16(p[2])<<8 | uint16(p[3])
+	// profile 2 uimsbf
+	// sampling_frequency_index 4 uimsbf
+	// private_bit 1 bslbf
+	// channel_configuration 3 uimsbf
+	// original/copy 1 bslbf
+	// home 1 bslbf
+	profile := Profile(uint8(sfiv>>14) & 0x03)
+	samplingFrequencyIndex := uint8(sfiv>>10) & 0x0f
+	channelConfiguration := uint8(sfiv>>6) & 0x07
+	// 4bits left.
+	// Refer to @doc ISO_IEC_13818-7-AAC-2004.pdf, @page 27, @section 6.2.2 Variable Header of ADTS
+	// copyright_identification_bit 1 bslbf
+	// copyright_identification_start 1 bslbf
+	// frame_length 13 bslbf: Length of the frame including headers and error_check in bytes.
+	// use the left 2bits as the 13 and 12 bit,
+	// the frame_length is 13bits, so we move 13-2=11.
+	frameLength := (sfiv << 11) & 0x1800
+
+	abfv := uint32(p[4])<<16 | uint32(p[5])<<8 | uint32(p[6])
+	p = p[7:]
+	headerSize := 7
+
+	// frame_length 13 bslbf: consume the first 13-2=11bits
+	// the abfv is 24bits, so we move right 24-11=13.
+	// The adts_buffer_fullness 11 bslbf and number_of_raw_data_blocks_in_frame 2 uimsbf are ignored.
+	frameLength |= uint16((abfv >> 13) & 0x07ff)
+
+	// adts_error_check(), 1.A.2.2.3 Error detection
+	if protectionAbsent == 0 {
+		if len(p) < 2 {
+			return nil, nil, errors.Errorf("requires 2+ but only %v bytes", len(p))
+		}
+		// crc_check 16 Rpchof, it's part of the header, so the raw frame is 2 bytes shorter.
+		p = p[2:]
+		headerSize += 2
+	}
+
+	// The frame length includes the header, never let the subtraction underflow.
+	if int(frameLength) < headerSize {
+		return nil, nil, errors.Errorf("invalid frame length %v, header is %v bytes", frameLength, headerSize)
+	}
+
+	nbRaw := int(frameLength) - headerSize
+	if len(p) < nbRaw {
+		return nil, nil, errors.Errorf("requires %v but only %v bytes", nbRaw, len(p))
+	}
+
+	// Validate the codec information before commit it,
+	// so a bad frame never overwrites the previous one.
+	asc := AudioSpecificConfig{
+		Object:     profile.ToObjectType(),
+		SampleRate: SampleRateIndex(samplingFrequencyIndex),
+		Channels:   Channels(channelConfiguration),
+	}
+	if err = asc.validate(); err != nil {
+		return nil, nil, errors.WithMessage(err, "adts decode")
+	}
+	v.asc = asc
+
+	return p[:nbRaw], p[nbRaw:], nil
+}
+
+// ASC returns the pointer to the codec information kept by this codec,
+// so changes made through the pointer are used by the next Encode.
+func (v *ADTSImpl) ASC() *AudioSpecificConfig {
+	return &v.asc
+}
+
+// AudioSpecificConfig is the ASC(Audio Specific Configuration), the codec information of AAC.
+// Refer to @doc ISO_IEC_14496-3-AAC-2001.pdf, @page 33, @section 1.6.2.1 AudioSpecificConfig
+type AudioSpecificConfig struct {
+	Object     ObjectType      // AAC object type.
+	SampleRate SampleRateIndex // AAC sample rate, not the FLV sampling rate.
+	Channels   Channels        // AAC channel configuration.
+}
+
+// validate checks each field of the ASC and returns an error for the first
+// invalid one, or nil when the object type, sample rate and channels are all ok.
+func (v *AudioSpecificConfig) validate() (err error) {
+	object := v.Object
+	knownObject := object == ObjectTypeMain || object == ObjectTypeLC || object == ObjectTypeSSR ||
+		object == ObjectTypeHE || object == ObjectTypeHEv2
+	if !knownObject {
+		return errors.Errorf("invalid object %#x", uint8(object))
+	}
+
+	// NOTE(review): the lower bound rejects SampleRateIndex96kHz(0), confirm it's intended.
+	if rate := v.SampleRate; !(rate >= SampleRateIndex88kHz && rate <= SampleRateIndex7kHz) {
+		return errors.Errorf("invalid sample-rate %#x", uint8(rate))
+	}
+
+	if channels := v.Channels; !(channels >= ChannelMono && channels <= Channel7_1) {
+		return errors.Errorf("invalid channels %#x", uint8(channels))
+	}
+
+	return nil
+}
+
+// UnmarshalBinary parses the first 2 bytes of the binary ASC, then validates it.
+// The fields are overwritten before validation, so they are changed even
+// when an error of validation is returned.
+func (v *AudioSpecificConfig) UnmarshalBinary(data []byte) (err error) {
+	// AudioSpecificConfig
+	// Refer to @doc ISO_IEC_14496-3-AAC-2001.pdf, @page 33, @section 1.6.2.1 AudioSpecificConfig
+	//
+	// only need to decode the first 2bytes:
+	// audioObjectType, 5bits.
+	// samplingFrequencyIndex, aac_sample_rate, 4bits.
+	// channelConfiguration, aac_channels, 4bits
+	//
+	// @see SrsAacTransmuxer::write_audio
+	if nn := len(data); nn < 2 {
+		return errors.Errorf("requires 2 but only %v bytes", nn)
+	}
+
+	// Read the 2 bytes as a 16 bits big-endian word: 5 + 4 + 4 bits from the top, 3 bits left.
+	bits := uint16(data[0])<<8 | uint16(data[1])
+
+	v.Object = ObjectType((bits >> 11) & 0x1f)
+	v.SampleRate = SampleRateIndex((bits >> 7) & 0x0f)
+	v.Channels = Channels((bits >> 3) & 0x0f)
+
+	return v.validate()
+}
+
+// MarshalBinary encodes the ASC to 2 bytes binary data.
+// It returns the error of validation when the ASC is invalid.
+func (v *AudioSpecificConfig) MarshalBinary() (data []byte, err error) {
+	if err = v.validate(); err != nil {
+		return nil, err
+	}
+
+	// AudioSpecificConfig
+	// Refer to @doc ISO_IEC_14496-3-AAC-2001.pdf, @page 33, @section 1.6.2.1 AudioSpecificConfig
+	//
+	// only need to encode the first 2bytes:
+	// audioObjectType, 5bits.
+	// samplingFrequencyIndex, aac_sample_rate, 4bits.
+	// channelConfiguration, aac_channels, 4bits
+	object := byte(v.Object) & 0x1f
+	rate := byte(v.SampleRate) & 0x0f
+	channels := byte(v.Channels) & 0x0f
+
+	// The higher 3 bits of rate go to the first byte, the lowest bit of
+	// rate is the top bit of the second byte, the byte shift drops the others.
+	first := object<<3 | rate>>1
+	second := rate<<7 | channels<<3
+
+	return []byte{first, second}, nil
+}
--- a/trunk/3rdparty/srs-bench/vendor/github.com/ossrs/go-oryx-lib/flv/flv.go
+++ b/trunk/3rdparty/srs-bench/vendor/github.com/ossrs/go-oryx-lib/flv/flv.go
@ -0,0 +1,747 @@
+// The MIT License (MIT)
+//
+// Copyright (c) 2013-2017 Oryx(ossrs)
+//
+// Permission is hereby granted, free of charge, to any person obtaining a copy of
+// this software and associated documentation files (the "Software"), to deal in
+// the Software without restriction, including without limitation the rights to
+// use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of
+// the Software, and to permit persons to whom the Software is furnished to do so,
+// subject to the following conditions:
+//
+// The above copyright notice and this permission notice shall be included in all
+// copies or substantial portions of the Software.
+//
+// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS
+// FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR
+// COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER
+// IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
+// CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
+
+// The oryx FLV package supports converting bytes from/to FLV tags.
+package flv
+
+import (
+	"bytes"
+	"errors"
+	"github.com/ossrs/go-oryx-lib/aac"
+	"io"
+	"strings"
+)
+
+// TagType is the type of FLV tag,
+// refer to @doc video_file_format_spec_v10.pdf, @page 9, @section FLV tags
+type TagType uint8
+
+const (
+	TagTypeForbidden  TagType = 0
+	TagTypeAudio      TagType = 8
+	TagTypeVideo      TagType = 9
+	TagTypeScriptData TagType = 18
+)
+
+// String returns "Audio", "Video" or "Data" for the known tag types,
+// and "Forbidden" for any other value.
+func (v TagType) String() string {
+	if v == TagTypeAudio {
+		return "Audio"
+	}
+	if v == TagTypeVideo {
+		return "Video"
+	}
+	if v == TagTypeScriptData {
+		return "Data"
+	}
+	return "Forbidden"
+}
+
+// Demuxer is used to demux FLV file.
+// Refer to @doc video_file_format_spec_v10.pdf, @page 74, @section Annex E. The FLV File Format
+// A FLV file must consist of the parts below:
+//	1. A FLV header, refer to @doc video_file_format_spec_v10.pdf, @page 8, @section The FLV header
+//	2. One or more tags, refer to @doc video_file_format_spec_v10.pdf, @page 9, @section FLV tags
+// @remark We always ignore the previous tag size.
+type Demuxer interface {
+	// Read the FLV header, return the version of FLV, whether hasVideo or hasAudio in header.
+	ReadHeader() (version uint8, hasVideo, hasAudio bool, err error)
+	// Read the FLV tag header, return the tag information, especially the tag size,
+	// then user can read the tag payload.
+	ReadTagHeader() (tagType TagType, tagSize, timestamp uint32, err error)
+	// Read the FLV tag body, drop the next 4 bytes previous tag size.
+	ReadTag(tagSize uint32) (tag []byte, err error)
+	// Close the demuxer.
+	Close() error
+}
+
+// errSignature is returned by ReadHeader when the FLV signature is not "FLV".
+var errSignature = errors.New("FLV signatures are illegal")
+
+// NewDemuxer creates a demuxer object which reads the FLV from r.
+// The returned error is always nil.
+func NewDemuxer(r io.Reader) (Demuxer, error) {
+	return &demuxer{
+		r: r,
+	}, nil
+}
+
+// demuxer is the implementation of Demuxer, it reads from r in sequence.
+type demuxer struct {
+	r io.Reader
+}
+
+// ReadHeader reads 13 bytes, the FLV header and the 4 bytes after it,
+// then returns the version and the video/audio flags of the header.
+// It returns errSignature when the first 3 bytes are not "FLV".
+func (v *demuxer) ReadHeader() (version uint8, hasVideo, hasAudio bool, err error) {
+	var buf bytes.Buffer
+	if _, err = io.CopyN(&buf, v.r, 13); err != nil {
+		return
+	}
+
+	header := buf.Bytes()
+	if string(header[:3]) != "FLV" {
+		err = errSignature
+		return
+	}
+
+	version = header[3]
+
+	// The bit 0 of flags is video and the bit 2 is audio.
+	flags := header[4]
+	hasVideo = flags&0x01 != 0
+	hasAudio = flags&0x04 != 0
+
+	return
+}
+
+// ReadTagHeader reads the 11 bytes tag header, then returns the tag type,
+// the 24 bits size of tag body and the 32 bits timestamp.
+// The last 3 bytes of tag header are ignored.
+func (v *demuxer) ReadTagHeader() (tagType TagType, tagSize uint32, timestamp uint32, err error) {
+	var buf bytes.Buffer
+	if _, err = io.CopyN(&buf, v.r, 11); err != nil {
+		return
+	}
+
+	header := buf.Bytes()
+
+	tagType = TagType(header[0])
+
+	size := header[1:4]
+	tagSize = uint32(size[0])<<16 | uint32(size[1])<<8 | uint32(size[2])
+
+	// The lower 24 bits of timestamp come first,
+	// then one byte which extends it to 32 bits.
+	ts := header[4:8]
+	timestamp = uint32(ts[0])<<16 | uint32(ts[1])<<8 | uint32(ts[2]) | uint32(ts[3])<<24
+
+	return
+}
+
+// ReadTag reads the tag body of tagSize bytes and the 4 bytes previous tag
+// size after it, then returns the tag body only.
+// It returns the error of reader when there are not enough bytes to read.
+func (v *demuxer) ReadTag(tagSize uint32) (tag []byte, err error) {
+	h := &bytes.Buffer{}
+	// Convert to int64 before the addition, because tagSize+4 wraps in uint32
+	// for a huge tagSize, then less than 4 bytes are read and the slicing
+	// below panics.
+	if _, err = io.CopyN(h, v.r, int64(tagSize)+4); err != nil {
+		return nil, err
+	}
+
+	// Drop the previous tag size.
+	p := h.Bytes()
+	return p[:len(p)-4], nil
+}
+
+// Close does nothing and always returns nil, the reader is not closed.
+func (v *demuxer) Close() error {
+	return nil
+}
+
+// Muxer is used to write packet in FLV protocol.
+// Refer to @doc video_file_format_spec_v10.pdf, @page 74, @section Annex E. The FLV File Format
+type Muxer interface {
+	// Write the FLV header.
+	WriteHeader(hasVideo, hasAudio bool) (err error)
+	// Write a FLV tag.
+	WriteTag(tagType TagType, timestamp uint32, tag []byte) (err error)
+	// Close the muxer.
+	Close() error
+}
+
+// NewMuxer creates a muxer object which writes the FLV to w.
+// The returned error is always nil.
+func NewMuxer(w io.Writer) (Muxer, error) {
+	return &muxer{
+		w: w,
+	}, nil
+}
+
+// muxer is the implementation of Muxer, it writes to w in sequence.
+type muxer struct {
+	w io.Writer
+}
+
+// WriteHeader writes 13 bytes, the 9 bytes FLV header of version 1 and
+// the 4 bytes zero after it. It returns the error of writer.
+func (v *muxer) WriteHeader(hasVideo, hasAudio bool) (err error) {
+	header := []byte{
+		'F', 'L', 'V',
+		0x01,
+		0x00, // The flags, set below.
+		0x00, 0x00, 0x00, 0x09,
+		0x00, 0x00, 0x00, 0x00,
+	}
+
+	// The bit 0 of flags is video and the bit 2 is audio.
+	if hasVideo {
+		header[4] |= 0x01
+	}
+	if hasAudio {
+		header[4] |= 0x04
+	}
+
+	_, err = io.Copy(v.w, bytes.NewReader(header))
+	return err
+}
+
+// WriteTag writes a FLV tag: the 11 bytes tag header, the tag body and the
+// 4 bytes previous tag size, which is 11 plus the size of tag body.
+//
+// It returns an error and writes nothing when the tag body is larger than
+// the 24 bits size field of tag header, otherwise it returns the error of writer.
+func (v *muxer) WriteTag(tagType TagType, timestamp uint32, tag []byte) (err error) {
+	// The size of tag body is 24 bits in tag header, a larger body would be
+	// written with a truncated size and corrupt the stream.
+	if len(tag) > 0xffffff {
+		return errors.New("flv tag size exceeds 24 bits")
+	}
+
+	// Tag header.
+	tagSize := uint32(len(tag))
+	header := []byte{
+		byte(tagType),
+		byte(tagSize >> 16), byte(tagSize >> 8), byte(tagSize),
+		// The lower 24 bits of timestamp, then the byte which extends it to 32 bits.
+		byte(timestamp >> 16), byte(timestamp >> 8), byte(timestamp),
+		byte(timestamp >> 24),
+		// The last 3 bytes are always zero.
+		0x00, 0x00, 0x00,
+	}
+	if _, err = io.Copy(v.w, bytes.NewReader(header)); err != nil {
+		return err
+	}
+
+	// TAG
+	if _, err = io.Copy(v.w, bytes.NewReader(tag)); err != nil {
+		return err
+	}
+
+	// Previous tag size.
+	previousTagSize := uint32(len(header) + len(tag))
+	trailer := []byte{
+		byte(previousTagSize >> 24), byte(previousTagSize >> 16),
+		byte(previousTagSize >> 8), byte(previousTagSize),
+	}
+	if _, err = io.Copy(v.w, bytes.NewReader(trailer)); err != nil {
+		return err
+	}
+
+	return nil
+}
+
+// Close does nothing and always returns nil, the writer is not closed.
+func (v *muxer) Close() error {
+	return nil
+}
+
+// AudioFrameTrait is the trait of audio frame: for AAC, whether sequence
+// header(ASC) or raw data, for Opus, a set of flags.
+// Refer to @doc video_file_format_spec_v10.pdf, @page 77, @section E.4.2 Audio Tags
+type AudioFrameTrait uint8
+
+const (
+	// For AAC, the frame trait.
+	AudioFrameTraitSequenceHeader AudioFrameTrait = 0 // 0 = AAC sequence header
+	AudioFrameTraitRaw            AudioFrameTrait = 1 // 1 = AAC raw
+
+	// For Opus, the frame trait, may has more than one traits.
+	AudioFrameTraitOpusRaw          AudioFrameTrait = 0x02 // 2, Has RAW Opus data.
+	AudioFrameTraitOpusSamplingRate AudioFrameTrait = 0x04 // 4, Has Opus SamplingRate.
+	AudioFrameTraitOpusAudioLevel   AudioFrameTrait = 0x08 // 8, Has audio level data, 16bits.
+
+	AudioFrameTraitForbidden AudioFrameTrait = 0xff
+)
+
+// String returns the name of trait. For the values between AudioFrameTraitRaw
+// and AudioFrameTraitForbidden, it's the names of Opus flags joined by "|",
+// which is empty when none of the flags is set.
+func (v AudioFrameTrait) String() string {
+	if v > AudioFrameTraitRaw && v < AudioFrameTraitForbidden {
+		flags := [...]struct {
+			bit  AudioFrameTrait
+			name string
+		}{
+			{AudioFrameTraitOpusRaw, "RAW"},
+			{AudioFrameTraitOpusSamplingRate, "SR"},
+			{AudioFrameTraitOpusAudioLevel, "AL"},
+		}
+
+		var names []string
+		for _, flag := range flags {
+			if v&flag.bit != 0 {
+				names = append(names, flag.name)
+			}
+		}
+		return strings.Join(names, "|")
+	}
+
+	if v == AudioFrameTraitSequenceHeader {
+		return "SequenceHeader"
+	}
+	if v == AudioFrameTraitRaw {
+		return "Raw"
+	}
+	return "Forbidden"
+}
+
+// AudioChannels is the audio channels, FLV named it the SoundType.
+// Refer to @doc video_file_format_spec_v10.pdf, @page 77, @section E.4.2 Audio Tags
+type AudioChannels uint8
+
+const (
+	AudioChannelsMono      AudioChannels = 0 // 0 = Mono sound
+	AudioChannelsStereo    AudioChannels = 1 // 1 = Stereo sound
+	AudioChannelsForbidden AudioChannels = 2
+)
+
+// String returns "Mono" or "Stereo", and "Forbidden" for any other value.
+func (v AudioChannels) String() string {
+	if v == AudioChannelsMono {
+		return "Mono"
+	}
+	if v == AudioChannelsStereo {
+		return "Stereo"
+	}
+	return "Forbidden"
+}
+
+// From converts the aac channels to FLV channels: mono is mono, any layout
+// from stereo to 7.1 is stereo, and the others are forbidden.
+func (v *AudioChannels) From(a aac.Channels) {
+	channels := AudioChannelsForbidden
+
+	switch a {
+	case aac.ChannelMono:
+		channels = AudioChannelsMono
+	case aac.ChannelStereo, aac.Channel3, aac.Channel4, aac.Channel5, aac.Channel5_1, aac.Channel7_1:
+		channels = AudioChannelsStereo
+	}
+
+	*v = channels
+}
+
+// AudioSampleBits is the audio sample bits, FLV named it the SoundSize.
+// Refer to @doc video_file_format_spec_v10.pdf, @page 76, @section E.4.2 Audio Tags
+type AudioSampleBits uint8
+
+const (
+	AudioSampleBits8bits     AudioSampleBits = 0 // 0 = 8-bit samples
+	AudioSampleBits16bits    AudioSampleBits = 1 // 1 = 16-bit samples
+	AudioSampleBitsForbidden AudioSampleBits = 2
+)
+
+// String returns "8-bits" or "16-bits", and "Forbidden" for any other value.
+func (v AudioSampleBits) String() string {
+	names := [...]string{"8-bits", "16-bits"}
+	if int(v) < len(names) {
+		return names[v]
+	}
+	return "Forbidden"
+}
+
+// AudioSamplingRate is the audio sampling rate, FLV named it the SoundRate.
+// Refer to @doc video_file_format_spec_v10.pdf, @page 76, @section E.4.2 Audio Tags
+type AudioSamplingRate uint8
+
+const (
+	// For FLV, only support 5, 11, 22, 44KHz sampling rate.
+	AudioSamplingRate5kHz  AudioSamplingRate = iota // 0 = 5.5 kHz
+	AudioSamplingRate11kHz                          // 1 = 11 kHz
+	AudioSamplingRate22kHz                          // 2 = 22 kHz
+	AudioSamplingRate44kHz                          // 3 = 44 kHz
+	// For Opus, support 8, 12, 16, 24, 48KHz
+	// We will write a UINT8 sampling rate after FLV audio tag header.
+	// @doc https://tools.ietf.org/html/rfc6716#section-2
+	AudioSamplingRateNB8kHz   = 8  // NB (narrowband)
+	AudioSamplingRateMB12kHz  = 12 // MB (medium-band)
+	AudioSamplingRateWB16kHz  = 16 // WB (wideband)
+	AudioSamplingRateSWB24kHz = 24 // SWB (super-wideband)
+	AudioSamplingRateFB48kHz  = 48 // FB (fullband)
+
+	// The forbidden rate must have its own value. Without an explicit
+	// expression, it repeats the "= 48" of previous constant, so it's
+	// equal to AudioSamplingRateFB48kHz and never detected as forbidden.
+	AudioSamplingRateForbidden AudioSamplingRate = 0xff
+)
+
+// String returns the name of sampling rate, for both the FLV rates and
+// the Opus rates, and "Forbidden" for any other value.
+func (v AudioSamplingRate) String() string {
+	// For FLV, the rates are the indexes from 0 to 3.
+	if v <= AudioSamplingRate44kHz {
+		return [...]string{"5.5kHz", "11kHz", "22kHz", "44kHz"}[v]
+	}
+
+	// For Opus, the rates are the kHz values.
+	opusRates := [...]struct {
+		rate AudioSamplingRate
+		name string
+	}{
+		{AudioSamplingRateNB8kHz, "NB8kHz"},
+		{AudioSamplingRateMB12kHz, "MB12kHz"},
+		{AudioSamplingRateWB16kHz, "WB16kHz"},
+		{AudioSamplingRateSWB24kHz, "SWB24kHz"},
+		{AudioSamplingRateFB48kHz, "FB48kHz"},
+	}
+	for _, opus := range opusRates {
+		if v == opus.rate {
+			return opus.name
+		}
+	}
+
+	return "Forbidden"
+}
+
+// ToHz parses the FLV sampling rate to Hz.
+// It returns 0 for the values which are not FLV sampling rate, for example
+// the Opus rates or the forbidden one, it never panics.
+func (v AudioSamplingRate) ToHz() int {
+	flvSR := [...]int{5512, 11025, 22050, 44100}
+	// Only the values from 0 to 3 are FLV rates, check before indexing.
+	if int(v) >= len(flvSR) {
+		return 0
+	}
+	return flvSR[v]
+}
+
+// From converts the aac sample rate index to the FLV sampling rate, which
+// is the closest supported rate: 32kHz and above are 44kHz, 16kHz to 24kHz
+// are 22kHz, 8kHz to 12kHz are 11kHz, 7kHz is 5.5kHz, the others are forbidden.
+func (v *AudioSamplingRate) From(a aac.SampleRateIndex) {
+	rate := AudioSamplingRate(AudioSamplingRateForbidden)
+
+	switch a {
+	case aac.SampleRateIndex96kHz, aac.SampleRateIndex88kHz, aac.SampleRateIndex64kHz,
+		aac.SampleRateIndex48kHz, aac.SampleRateIndex44kHz, aac.SampleRateIndex32kHz:
+		rate = AudioSamplingRate44kHz
+	case aac.SampleRateIndex24kHz, aac.SampleRateIndex22kHz, aac.SampleRateIndex16kHz:
+		rate = AudioSamplingRate22kHz
+	case aac.SampleRateIndex12kHz, aac.SampleRateIndex11kHz, aac.SampleRateIndex8kHz:
+		rate = AudioSamplingRate11kHz
+	case aac.SampleRateIndex7kHz:
+		rate = AudioSamplingRate5kHz
+	}
+
+	*v = rate
+}
+
+// OpusToHz parses the Opus sampling rate to Hz.
+//
+// The Opus rates are the kHz values 8, 12, 16, 24 and 48, see OpusFrom, so
+// they can't be used as the index of a table of 5 items, which panics.
+// For compatibility, the values from 0 to 4 are still parsed as the index
+// of 8000, 12000, 16000, 24000 and 48000. It returns 0 for any other value.
+func (v AudioSamplingRate) OpusToHz() int {
+	switch v {
+	case AudioSamplingRateNB8kHz:
+		return 8000
+	case AudioSamplingRateMB12kHz:
+		return 12000
+	case AudioSamplingRateWB16kHz:
+		return 16000
+	case AudioSamplingRateSWB24kHz:
+		return 24000
+	case AudioSamplingRateFB48kHz:
+		return 48000
+	}
+
+	// The legacy index, keep the results of previous version.
+	opusSR := [...]int{8000, 12000, 16000, 24000, 48000}
+	if int(v) < len(opusSR) {
+		return opusSR[v]
+	}
+	return 0
+}
+
+// OpusFrom converts the aac sample rate index to the Opus sampling rate,
+// which is the closest supported rate not less than it: 32kHz and above
+// are FB48kHz, 22kHz and 24kHz are SWB24kHz, 16kHz is WB16kHz, 11kHz and
+// 12kHz are MB12kHz, 7kHz and 8kHz are NB8kHz, the others are forbidden.
+func (v *AudioSamplingRate) OpusFrom(a aac.SampleRateIndex) {
+	rate := AudioSamplingRate(AudioSamplingRateForbidden)
+
+	switch a {
+	case aac.SampleRateIndex96kHz, aac.SampleRateIndex88kHz, aac.SampleRateIndex64kHz,
+		aac.SampleRateIndex48kHz, aac.SampleRateIndex44kHz, aac.SampleRateIndex32kHz:
+		rate = AudioSamplingRateFB48kHz
+	case aac.SampleRateIndex24kHz, aac.SampleRateIndex22kHz:
+		rate = AudioSamplingRateSWB24kHz
+	case aac.SampleRateIndex16kHz:
+		rate = AudioSamplingRateWB16kHz
+	case aac.SampleRateIndex12kHz, aac.SampleRateIndex11kHz:
+		rate = AudioSamplingRateMB12kHz
+	case aac.SampleRateIndex8kHz, aac.SampleRateIndex7kHz:
+		rate = AudioSamplingRateNB8kHz
+	}
+
+	*v = rate
+}
+
+// AudioCodec is the audio codec id, FLV named it the SoundFormat.
+// Refer to @doc video_file_format_spec_v10.pdf, @page 76, @section E.4.2 Audio Tags
+// It's 4bits, that is 0-15.
+type AudioCodec uint8
+
+const (
+	AudioCodecLinearPCM       AudioCodec = iota // 0 = Linear PCM, platform endian
+	AudioCodecADPCM                             // 1 = ADPCM
+	AudioCodecMP3                               // 2 = MP3
+	AudioCodecLinearPCMle                       // 3 = Linear PCM, little endian
+	AudioCodecNellymoser16kHz                   // 4 = Nellymoser 16 kHz mono
+	AudioCodecNellymoser8kHz                    // 5 = Nellymoser 8 kHz mono
+	AudioCodecNellymoser                        // 6 = Nellymoser
+	AudioCodecG711Alaw                          // 7 = G.711 A-law logarithmic PCM
+	AudioCodecG711MuLaw                         // 8 = G.711 mu-law logarithmic PCM
+	AudioCodecReserved                          // 9 = reserved
+	AudioCodecAAC                               // 10 = AAC
+	AudioCodecSpeex                             // 11 = Speex
+	AudioCodecUndefined12                       // 12 = undefined
+	// For FLV, it's undefined, we define it as Opus for WebRTC.
+	AudioCodecOpus           // 13 = Opus
+	AudioCodecMP3In8kHz      // 14 = MP3 8 kHz
+	AudioCodecDeviceSpecific // 15 = Device-specific sound
+	AudioCodecForbidden      // 16, out of the 4bits.
+)
+
+// String returns the name of codec. The reserved(9), the undefined(12) and
+// any value from AudioCodecForbidden have no name, so they are "Forbidden".
+func (v AudioCodec) String() string {
+	names := [...]string{
+		AudioCodecLinearPCM:       "LinearPCM(platform-endian)",
+		AudioCodecADPCM:           "ADPCM",
+		AudioCodecMP3:             "MP3",
+		AudioCodecLinearPCMle:     "LinearPCM(little-endian)",
+		AudioCodecNellymoser16kHz: "Nellymoser(16kHz-mono)",
+		AudioCodecNellymoser8kHz:  "Nellymoser(8kHz-mono)",
+		AudioCodecNellymoser:      "Nellymoser",
+		AudioCodecG711Alaw:        "G.711(A-law)",
+		AudioCodecG711MuLaw:       "G.711(mu-law)",
+		AudioCodecAAC:             "AAC",
+		AudioCodecSpeex:           "Speex",
+		AudioCodecOpus:            "Opus",
+		AudioCodecMP3In8kHz:       "MP3(8kHz)",
+		AudioCodecDeviceSpecific:  "DeviceSpecific",
+	}
+
+	// The items without a name are empty in the table.
+	if int(v) < len(names) && names[v] != "" {
+		return names[v]
+	}
+	return "Forbidden"
+}
+
+// AudioFrame is the decoded FLV audio tag body, which is the input of
+// AudioPackager.Encode and the output of AudioPackager.Decode.
+type AudioFrame struct {
+	// The audio codec, the higher 4 bits of the first byte of tag.
+	SoundFormat AudioCodec
+	// The sampling rate, for Opus it's the byte after trait when the trait has sampling rate.
+	SoundRate AudioSamplingRate
+	// The bits of sample.
+	SoundSize AudioSampleBits
+	// The channels.
+	SoundType AudioChannels
+	// The frame trait, only used for AAC and Opus.
+	Trait AudioFrameTrait
+	// The audio level, only used for Opus when the trait has audio level.
+	AudioLevel uint16
+	// The payload after the header and the optional fields.
+	Raw []byte
+}
+
+// The packager used to codec the FLV audio tag body.
+// Refer to @doc video_file_format_spec_v10.pdf, @page 76, @section E.4.2 Audio Tags
+type AudioPackager interface {
+	// Encode the audio frame to FLV audio tag.
+	Encode(frame *AudioFrame) (tag []byte, err error)
+	// Decode the FLV audio tag to audio frame.
+	Decode(tag []byte) (frame *AudioFrame, err error)
+}
+
+// errDataNotEnough is returned by Decode when the tag is too short.
+var errDataNotEnough = errors.New("Data not enough")
+
+// audioPackager is the implementation of AudioPackager, it keeps no state.
+type audioPackager struct {
+}
+
+// NewAudioPackager creates an audio packager, the returned error is always nil.
+func NewAudioPackager() (AudioPackager, error) {
+	return &audioPackager{}, nil
+}
+
+// Encode the audio frame to FLV audio tag body, the returned error is always nil.
+//
+// The first byte is the audio tag header: SoundFormat 4 bits, SoundRate
+// 2 bits, SoundSize 1 bit and SoundType 1 bit. Each field is masked to its
+// width, so a value out of range never corrupts the other fields.
+//
+// For AAC, the header is followed by the trait and the raw data.
+// For Opus, the header is followed by the trait, the sampling rate if the
+// trait has it, the 16 bits audio level if the trait has it, and the raw data.
+// For other codecs, the header is followed by the raw data.
+func (v *audioPackager) Encode(frame *AudioFrame) (tag []byte, err error) {
+	soundRate := byte(frame.SoundRate) & 0x03
+	// For Opus, we put the sampling rate after trait,
+	// so we set the sound rate in audio tag to 0.
+	// The Opus rates are 8 to 48, which overflow the 2 bits and
+	// change the sound format if not cleared before shifting.
+	if frame.SoundFormat == AudioCodecOpus {
+		soundRate = 0
+	}
+
+	audioTagHeader := (byte(frame.SoundFormat)&0x0f)<<4 | soundRate<<2 |
+		(byte(frame.SoundSize)&0x01)<<1 | byte(frame.SoundType)&0x01
+
+	var b bytes.Buffer
+	b.WriteByte(audioTagHeader)
+
+	switch frame.SoundFormat {
+	case AudioCodecAAC:
+		b.WriteByte(byte(frame.Trait))
+	case AudioCodecOpus:
+		b.WriteByte(byte(frame.Trait))
+		if (frame.Trait & AudioFrameTraitOpusSamplingRate) == AudioFrameTraitOpusSamplingRate {
+			b.WriteByte(byte(frame.SoundRate))
+		}
+		if (frame.Trait & AudioFrameTraitOpusAudioLevel) == AudioFrameTraitOpusAudioLevel {
+			b.WriteByte(byte(frame.AudioLevel >> 8))
+			b.WriteByte(byte(frame.AudioLevel))
+		}
+	}
+
+	b.Write(frame.Raw)
+
+	return b.Bytes(), nil
+}
+
+// Decode parses the body of an FLV audio tag to an audio frame.
+//
+// The tag must have at least 2 bytes, otherwise errDataNotEnough is returned.
+// The same error is returned, with a nil frame, when an Opus tag announces a
+// sampling rate or an audio level in its trait but is too short to carry it.
+// The Raw field of the returned frame is a sub-slice of tag, not a copy.
+func (v *audioPackager) Decode(tag []byte) (frame *AudioFrame, err error) {
+	// Refer to @doc video_file_format_spec_v10.pdf, @page 76, @section E.4.2 Audio Tags
+	// @see SrsFormat::audio_aac_demux
+	if len(tag) < 2 {
+		return nil, errDataNotEnough
+	}
+
+	// Unpack the first byte: format(4) | rate(2) | size(1) | type(1).
+	header := tag[0]
+	frame = &AudioFrame{
+		SoundFormat: AudioCodec((header >> 4) & 0x0f),
+		SoundRate:   AudioSamplingRate((header >> 2) & 0x03),
+		SoundSize:   AudioSampleBits((header >> 1) & 0x01),
+		SoundType:   AudioChannels(header & 0x01),
+	}
+
+	switch frame.SoundFormat {
+	case AudioCodecAAC:
+		frame.Trait = AudioFrameTrait(tag[1])
+		frame.Raw = tag[2:]
+	case AudioCodecOpus:
+		frame.Trait = AudioFrameTrait(tag[1])
+		rest := tag[2:]
+
+		// For Opus, the optional sampling rate comes right after the trait.
+		if (frame.Trait & AudioFrameTraitOpusSamplingRate) == AudioFrameTraitOpusSamplingRate {
+			if len(rest) < 1 {
+				return nil, errDataNotEnough
+			}
+			frame.SoundRate = AudioSamplingRate(rest[0])
+			rest = rest[1:]
+		}
+
+		// For Opus, the optional big-endian audio level comes next.
+		if (frame.Trait & AudioFrameTraitOpusAudioLevel) == AudioFrameTraitOpusAudioLevel {
+			if len(rest) < 2 {
+				return nil, errDataNotEnough
+			}
+			frame.AudioLevel = uint16(rest[0])<<8 | uint16(rest[1])
+			rest = rest[2:]
+		}
+
+		frame.Raw = rest
+	default:
+		frame.Raw = tag[1:]
+	}
+
+	return frame, nil
+}
+
+// VideoFrameType is the video frame type.
+// Refer to @doc video_file_format_spec_v10.pdf, @page 78, @section E.4.3 Video Tags
+// It is carried in the high 4 bits of the first byte of the video tag body.
+type VideoFrameType uint8
+
+const (
+	// 0 has no name of its own; String() reports it as "Forbidden".
+	VideoFrameTypeForbidden  VideoFrameType = iota
+	VideoFrameTypeKeyframe                  // 1 = key frame (for AVC, a seekable frame)
+	VideoFrameTypeInterframe                // 2 = inter frame (for AVC, a non-seekable frame)
+	VideoFrameTypeDisposable                // 3 = disposable inter frame (H.263 only)
+	VideoFrameTypeGenerated                 // 4 = generated key frame (reserved for server use only)
+	VideoFrameTypeInfo                      // 5 = video info/command frame
+)
+
+// String returns the name of the frame type, or "Forbidden" for any value
+// that is not one of the named frame types.
+func (v VideoFrameType) String() string {
+	// Indexed by frame type; slots left empty are the values without a name.
+	names := [...]string{
+		VideoFrameTypeKeyframe:   "Keyframe",
+		VideoFrameTypeInterframe: "Interframe",
+		VideoFrameTypeDisposable: "DisposableInterframe",
+		VideoFrameTypeGenerated:  "GeneratedKeyframe",
+		VideoFrameTypeInfo:       "Info",
+	}
+
+	if int(v) < len(names) && names[v] != "" {
+		return names[v]
+	}
+	return "Forbidden"
+}
+
+// VideoCodec is the video codec id.
+// Refer to @doc video_file_format_spec_v10.pdf, @page 78, @section E.4.3 Video Tags
+// It's 4 bits, that is 0-15, carried in the low 4 bits of the first byte of
+// the video tag body.
+type VideoCodec uint8
+
+const (
+	// 1, because the list starts at iota + 1; String() reports it as "Forbidden".
+	VideoCodecForbidden   VideoCodec = iota + 1
+	VideoCodecH263                   // 2 = Sorenson H.263
+	VideoCodecScreen                 // 3 = Screen video
+	VideoCodecOn2VP6                 // 4 = On2 VP6
+	VideoCodecOn2VP6Alpha            // 5 = On2 VP6 with alpha channel
+	VideoCodecScreen2                // 6 = Screen video version 2
+	VideoCodecAVC                    // 7 = AVC
+	// See page 79 at @doc https://github.com/CDN-Union/H265/blob/master/Document/video_file_format_spec_v10_1_ksyun_20170615.doc
+	VideoCodecHEVC VideoCodec = 12 // 12 = HEVC
+)
+
+// String returns the name of the codec, or "Forbidden" for any value that is
+// not one of the named codecs.
+func (v VideoCodec) String() string {
+	// Start from the fallback and overwrite it when the codec is known.
+	name := "Forbidden"
+
+	switch v {
+	case VideoCodecH263:
+		name = "H.263"
+	case VideoCodecScreen:
+		name = "Screen"
+	case VideoCodecOn2VP6:
+		name = "VP6"
+	case VideoCodecOn2VP6Alpha:
+		name = "On2VP6(alpha)"
+	case VideoCodecScreen2:
+		name = "Screen2"
+	case VideoCodecAVC:
+		name = "AVC"
+	case VideoCodecHEVC:
+		name = "HEVC"
+	}
+
+	return name
+}
+
+// VideoFrameTrait is the video AVC/HEVC frame trait, whether it is a sequence header or not.
+// Refer to @doc video_file_format_spec_v10.pdf, @page 78, @section E.4.3 Video Tags
+// If AVC or HEVC, it's 8 bits, the second byte of the video tag body.
+type VideoFrameTrait uint8
+
+const (
+	VideoFrameTraitSequenceHeader VideoFrameTrait = iota // 0 = AVC/HEVC sequence header
+	VideoFrameTraitNALU                                  // 1 = AVC/HEVC NALU
+	VideoFrameTraitSequenceEOF                           // 2 = AVC/HEVC end of sequence (lower level NALU sequence ender is not required or supported)
+	// 3; this and any larger value is reported as "Forbidden" by String().
+	VideoFrameTraitForbidden
+)
+
+// String returns the name of the trait, or "Forbidden" for any value that is
+// not one of the named traits.
+func (v VideoFrameTrait) String() string {
+	if v == VideoFrameTraitSequenceHeader {
+		return "SequenceHeader"
+	}
+	if v == VideoFrameTraitNALU {
+		return "NALU"
+	}
+	if v == VideoFrameTraitSequenceEOF {
+		return "SequenceEOF"
+	}
+	return "Forbidden"
+}
+
+// VideoFrame is the parsed form of an FLV video tag body. It is what
+// VideoPackager.Decode returns and what VideoPackager.Encode serializes.
+type VideoFrame struct {
+	// The codec id, carried in the low 4 bits of the first tag byte.
+	CodecID   VideoCodec
+	// The frame type, carried in the high 4 bits of the first tag byte.
+	FrameType VideoFrameType
+	// The second tag byte; only used when the codec is AVC or HEVC.
+	Trait     VideoFrameTrait
+	// The 24-bit big-endian composition time carried in tag bytes 2-4; only
+	// used when the codec is AVC or HEVC. For RTMP/FLV: pts = dts + cts.
+	CTS       int32
+	// The remaining payload. After Decode it is a sub-slice of the input tag,
+	// not a copy.
+	Raw       []byte
+}
+
+func NewVideoFrame() *VideoFrame {
+	return &VideoFrame{}
+}
+
+// VideoPackager encodes and decodes the body of an FLV video tag.
+// Refer to @doc video_file_format_spec_v10.pdf, @page 78, @section E.4.3 Video Tags
+type VideoPackager interface {
+	// Decode the body of an FLV video tag to a video frame.
+	// @remark For RTMP/FLV: pts = dts + cts, where dts is timestamp in packet/tag.
+	Decode(tag []byte) (frame *VideoFrame, err error)
+	// Encode the video frame to the body of an FLV video tag.
+	Encode(frame *VideoFrame) (tag []byte, err error)
+}
+
+// videoPackager is the VideoPackager implementation returned by
+// NewVideoPackager. It has no fields, so it keeps no state between calls.
+type videoPackager struct {
+}
+
+// NewVideoPackager creates a packager for the body of FLV video tags.
+// The returned error is always nil.
+func NewVideoPackager() (VideoPackager, error) {
+	packager := new(videoPackager)
+	return packager, nil
+}
+
+// Decode parses the body of an FLV video tag to a video frame.
+//
+// The first byte holds the frame type (high 4 bits) and the codec id (low 4
+// bits). For AVC and HEVC it is followed by the trait byte and a signed 24-bit
+// big-endian composition time, and Raw is everything after those 5 bytes. For
+// any other codec Raw is everything after the first byte.
+//
+// The tag must have at least 5 bytes whatever the codec is, otherwise a nil
+// frame and errDataNotEnough are returned. The Raw field of the returned frame
+// is a sub-slice of tag, not a copy.
+func (v *videoPackager) Decode(tag []byte) (frame *VideoFrame, err error) {
+	if len(tag) < 5 {
+		return nil, errDataNotEnough
+	}
+
+	frame = &VideoFrame{
+		FrameType: VideoFrameType((tag[0] >> 4) & 0x0f),
+		CodecID:   VideoCodec(tag[0] & 0x0f),
+	}
+
+	if frame.CodecID != VideoCodecAVC && frame.CodecID != VideoCodecHEVC {
+		frame.Raw = tag[1:]
+		return frame, nil
+	}
+
+	frame.Trait = VideoFrameTrait(tag[1])
+
+	// The composition time is a signed 24-bit integer. Load the three bytes into
+	// the top of an int32 and shift back down arithmetically, so that the sign
+	// bit is extended and a negative offset written by Encode reads back as the
+	// same negative value instead of a large positive one.
+	cts := uint32(tag[2])<<24 | uint32(tag[3])<<16 | uint32(tag[4])<<8
+	frame.CTS = int32(cts) >> 8
+
+	frame.Raw = tag[5:]
+	return frame, nil
+}
+
+// Encode serializes the video frame to the body of an FLV video tag.
+//
+// The first byte packs the frame type (high 4 bits) and the codec id (low 4
+// bits). For AVC and HEVC it is followed by the trait byte and the low 24 bits
+// of CTS in big-endian order, then frame.Raw. For any other codec it is
+// followed directly by frame.Raw.
+//
+// The returned error is always nil. The frame must not be nil.
+//
+// The receiver is a pointer, like Decode, so that both methods of the
+// packager belong to the same method set.
+func (v *videoPackager) Encode(frame *VideoFrame) (tag []byte, err error) {
+	// Mask both fields to 4 bits, so that a value which does not fit can not
+	// spill into the other nibble.
+	frameType := byte(frame.FrameType) & 0x0f
+	codec := byte(frame.CodecID) & 0x0f
+	header := frameType<<4 | codec
+
+	if frame.CodecID == VideoCodecAVC || frame.CodecID == VideoCodecHEVC {
+		tag = make([]byte, 0, 5+len(frame.Raw))
+		tag = append(tag,
+			header, byte(frame.Trait),
+			byte(frame.CTS>>16), byte(frame.CTS>>8), byte(frame.CTS),
+		)
+		return append(tag, frame.Raw...), nil
+	}
+
+	tag = make([]byte, 0, 1+len(frame.Raw))
+	tag = append(tag, header)
+	return append(tag, frame.Raw...), nil
+}