add comments

This commit is contained in:
nareix 2016-07-30 13:08:26 +08:00
parent a90312e55b
commit 6b25c3b4db
2 changed files with 106 additions and 52 deletions

139
av/av.go
View File

@ -5,20 +5,21 @@ import (
"time"
)
// Audio sample format
type SampleFormat uint8
const (
U8 = SampleFormat(iota + 1)
S16
S32
FLT
DBL
U8P
S16P
S32P
FLTP
DBLP
U32
U8 = SampleFormat(iota + 1) // 8-bit unsigned integer
S16 // signed 16-bit integer
S32 // signed 32-bit integer
FLT // 32-bit float
DBL // 64-bit float
U8P // 8-bit unsigned integer in planar
S16P // signed 16-bit integer in planar
S32P // signed 32-bit integer in planar
FLTP // 32-bit float in planar
DBLP // 64-bit float in planar
U32 // unsigned 32-bit integer
)
func (self SampleFormat) BytesPerSample() int {
@ -63,6 +64,7 @@ func (self SampleFormat) String() string {
}
}
// checkout if this sample format is in planar
func (self SampleFormat) IsPlanar() bool {
switch self {
case S16P, S32P, FLTP, DBLP:
@ -72,6 +74,7 @@ func (self SampleFormat) IsPlanar() bool {
}
}
// audio channel layout
type ChannelLayout uint16
func (self ChannelLayout) String() string {
@ -107,8 +110,18 @@ func (self ChannelLayout) Count() (n int) {
return
}
// Video/Audio codec type. can be H264/AAC/SPEEX/...
type CodecType uint32
var (
H264 = MakeVideoCodecType(avCodecTypeMagic + 1)
AAC = MakeAudioCodecType(avCodecTypeMagic + 1)
PCM_MULAW = MakeAudioCodecType(avCodecTypeMagic + 2)
PCM_ALAW = MakeAudioCodecType(avCodecTypeMagic + 3)
SPEEX = MakeAudioCodecType(avCodecTypeMagic + 4)
NELLYMOSER = MakeAudioCodecType(avCodecTypeMagic + 5)
)
const codecTypeAudioBit = 0x1
const codecTypeOtherBits = 1
@ -130,19 +143,23 @@ func (self CodecType) String() string {
return ""
}
// CodecType is audio
func (self CodecType) IsAudio() bool {
return self&codecTypeAudioBit != 0
}
// CodecType is video
func (self CodecType) IsVideo() bool {
return self&codecTypeAudioBit == 0
}
// make a new audio codec type
func MakeAudioCodecType(base uint32) (c CodecType) {
c = CodecType(base)<<codecTypeOtherBits | CodecType(codecTypeAudioBit)
return
}
// make a new video codec type
func MakeVideoCodecType(base uint32) (c CodecType) {
c = CodecType(base) << codecTypeOtherBits
return
@ -150,31 +167,28 @@ func MakeVideoCodecType(base uint32) (c CodecType) {
const avCodecTypeMagic = 233333
var (
H264 = MakeVideoCodecType(avCodecTypeMagic + 1)
AAC = MakeAudioCodecType(avCodecTypeMagic + 1)
PCM_MULAW = MakeAudioCodecType(avCodecTypeMagic + 2)
PCM_ALAW = MakeAudioCodecType(avCodecTypeMagic + 3)
SPEEX = MakeAudioCodecType(avCodecTypeMagic + 4)
NELLYMOSER = MakeAudioCodecType(avCodecTypeMagic + 5)
)
// CodecData is some bytes for initializing audio/video decoder
// video width/height and audio samplerate/channellayout can get from CodecData
// CodecData can convert to VideoCodecData or AudioCodecData using:
// codecdata.(AudioCodecData) or codecdata.(VideoCodecData)
// e.g: for H264, CodecData is AVCDecoderConfigure bytes, includes SPS/PPS
type CodecData interface {
Type() CodecType
Type() CodecType // Video/Audio codec type
}
type VideoCodecData interface {
CodecData
Width() int
Height() int
Width() int // Video height
Height() int // Video width
}
type AudioCodecData interface {
CodecData
SampleFormat() SampleFormat
SampleRate() int
ChannelLayout() ChannelLayout
SampleFormat() SampleFormat // Audio sample format
SampleRate() int // Audio sample rate
ChannelLayout() ChannelLayout // Audio channel layout
// get audio packet duration
PacketDuration([]byte) (time.Duration, error)
}
@ -186,47 +200,66 @@ type PacketReader interface {
ReadPacket() (Packet,error)
}
// Muxer describes the steps of writing compressed audio/video packets into container formats like MP4/FLV/MPEG-TS.
// 1. WriteHeader([]CodecData) write the file header, each stream
// 2. WritePacket(Packet) write the audio/video packets
// 3. WriteTrailer() end writing, now it's a complete file.
//
// WriteHeader/WriteTrailer can be called only once.
//
// every formsts(format/flv format/mp4 ...) implements Muxer interface.
// rtmp.Conn implements Muxer interface.
// and in some case like transcode.Muxer also implements Muxer interface.
type Muxer interface {
PacketWriter
WriteHeader([]CodecData) error
WriteTrailer() error
}
// Muxer with Close() method
type MuxCloser interface {
Muxer
Close() error
}
// Demuxer can demux compressed audio/video packets from container formats like MP4/FLV/MPEG-TS.
// Streams() ([]CodecData, error) reads the file header, contains video/audio meta infomations
// ReadPacket() (Packet, error) read compressed audio/video packets
type Demuxer interface {
PacketReader
Streams() ([]CodecData, error)
}
// Demuxer with Close() method
type DemuxCloser interface {
Demuxer
Close() error
}
// Packet stores compressed audio/video data
type Packet struct {
IsKeyFrame bool
Idx int8
CompositionTime time.Duration
Time time.Duration
Data []byte
IsKeyFrame bool // video packet is key frame
Idx int8 // stream index in container format
CompositionTime time.Duration // packet presentation time minus decode time for H264 B-Frame
Time time.Duration // packet decode time
Data []byte // packet data
}
// Raw audio frame
type AudioFrame struct {
SampleFormat SampleFormat
ChannelLayout ChannelLayout
SampleCount int
SampleRate int
Data [][]byte
SampleFormat SampleFormat // audio sample format, e.g: S16,FLTP,...
ChannelLayout ChannelLayout // audio channel layout, e.g: CH_MONO,CH_STEREO,...
SampleCount int // sample count in this frame
SampleRate int // sample rate
Data [][]byte // data array for planar format len(Data) > 1
}
// audio frame duration
func (self AudioFrame) Duration() time.Duration {
return time.Second * time.Duration(self.SampleCount) / time.Duration(self.SampleRate)
}
// check this audio frame has same format as other audio frame
func (self AudioFrame) HasSameFormat(other AudioFrame) bool {
if self.SampleRate != other.SampleRate {
return false
@ -240,6 +273,7 @@ func (self AudioFrame) HasSameFormat(other AudioFrame) bool {
return true
}
// split sample audio sample from this frame
func (self AudioFrame) Slice(start int, end int) (out AudioFrame) {
out = self
out.Data = append([][]byte(nil), out.Data...)
@ -251,6 +285,7 @@ func (self AudioFrame) Slice(start int, end int) (out AudioFrame) {
return
}
// concat two audio frames
func (self AudioFrame) Concat(in AudioFrame) (out AudioFrame) {
out = self
out.Data = append([][]byte(nil), out.Data...)
@ -261,25 +296,31 @@ func (self AudioFrame) Concat(in AudioFrame) (out AudioFrame) {
return
}
// AudioEncoder can encode raw audio frame into compressed audio packets
// now cgo/ffmpeg inplements AudioEncoder, using ffmpeg.NewAudioEncoder to create it
type AudioEncoder interface {
CodecData() (AudioCodecData, error)
Encode(AudioFrame) ([][]byte, error)
CodecData() (AudioCodecData, error) // encoder's codec data can put into container
Encode(AudioFrame) ([][]byte, error) // encode raw audio frame into compressed pakcet(s)
//Flush() ([]Packet, error)
Close()
SetSampleRate(int) (error)
SetChannelLayout(ChannelLayout) (error)
SetSampleFormat(SampleFormat) (error)
SetBitrate(int) (error)
SetOption(string,interface{}) (error)
GetOption(string,interface{}) (error)
Close() // close encoder, free cgo contexts
SetSampleRate(int) (error) // set encoder sample rate
SetChannelLayout(ChannelLayout) (error) // set encoder channel layout
SetSampleFormat(SampleFormat) (error) // set encoder sample format
SetBitrate(int) (error) // set encoder bitrate
SetOption(string,interface{}) (error) // encoder setopt, in ffmpeg is av_opt_set_dict()
GetOption(string,interface{}) (error) // encoder getopt
}
// AudioDecoder can decode compressed audio packets into raw audio frame
// use ffmpeg.NewAudioDecoder to create it
type AudioDecoder interface {
Decode([]byte) (bool, AudioFrame, error)
Decode([]byte) (bool, AudioFrame, error) // decode one compressed audio packet
//Flush() (AudioFrame, error)
Close()
Close() // close decode, free cgo contexts
}
// AudioResampler can convert raw audio frames in different sample rate/format/channel layout
type AudioResampler interface {
Resample(AudioFrame) (AudioFrame, error)
Resample(AudioFrame) (AudioFrame, error) // convert raw audio frames
}

View File

@ -17,14 +17,17 @@ type tStream struct {
adec av.AudioDecoder
}
// Transcode options
type Options struct {
FindAudioDecoderEncoder func(codec av.AudioCodecData, i int) (ok bool, dec av.AudioDecoder, enc av.AudioEncoder, err error)
// if transcode is needed, create your AudioDecoder and AudioEncoder for Transcoder use.
FindAudioDecoderEncoder func(codec av.AudioCodecData, i int) (need bool, dec av.AudioDecoder, enc av.AudioEncoder, err error)
}
type Transcoder struct {
streams []*tStream
}
// Create new Transcoder
func NewTranscoder(streams []av.CodecData, options Options) (_self *Transcoder, err error) {
self := &Transcoder{}
self.streams = []*tStream{}
@ -102,6 +105,10 @@ func (self *tStream) audioDecodeAndEncode(inpkt av.Packet) (outpkts []av.Packet,
return
}
// Do the transcode.
//
// in audio transcoding one Packet may transcode into many Packets.
// packet time will be adjusted in transcoder.
func (self *Transcoder) Do(pkt av.Packet) (out []av.Packet, err error) {
stream := self.streams[pkt.Idx]
if stream.aenc != nil && stream.adec != nil {
@ -114,6 +121,7 @@ func (self *Transcoder) Do(pkt av.Packet) (out []av.Packet, err error) {
return
}
// CodecData after transcode
func (self *Transcoder) Streams() (streams []av.CodecData, err error) {
for _, stream := range self.streams {
streams = append(streams, stream.codec)
@ -121,6 +129,7 @@ func (self *Transcoder) Streams() (streams []av.CodecData, err error) {
return
}
// Close transcoder, will close related encoder and decoders
func (self *Transcoder) Close() (err error) {
for _, stream := range self.streams {
if stream.aenc != nil {
@ -136,10 +145,12 @@ func (self *Transcoder) Close() (err error) {
return
}
// Wrap transcoder and origin Muxer into new Muxer.
// write to new Muxer will do transcode automatically
type Muxer struct {
av.Muxer
av.Muxer // origin Muxer
transcoder *Transcoder
Options
Options // transcode options
}
func (self *Muxer) WriteHeader(streams []av.CodecData) (err error) {
@ -176,6 +187,8 @@ func (self *Muxer) Close() (err error) {
return
}
// Wrap transcoder and origin Demuxer into new Demuxer.
// read this Demuxer will do transcode automatically
type Demuxer struct {
av.Demuxer
transcoder *Transcoder