perkeep/internal/media/audio.go

197 lines
6.0 KiB
Go

/*
Copyright 2014 The Perkeep Authors.
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
*/
// Package media provides means for querying information about audio and video data.
package media // import "perkeep.org/internal/media"
import (
"bytes"
"encoding/binary"
"errors"
"fmt"
"io"
"time"
"go4.org/readerutil"
)
// ID3v1TagLength is the size, in bytes, of an MP3 ID3v1 tag.
const ID3v1TagLength = 128

// id3v1Magic holds the bytes "TAG", the marker that opens an ID3v1 tag.
var id3v1Magic = []byte{'T', 'A', 'G'}
// HasID3v1Tag reports whether the last ID3v1TagLength bytes of r start with
// the ID3v1 magic bytes. Inputs shorter than ID3v1TagLength yield false with
// a nil error; a failed read yields false and a non-nil error.
func HasID3v1Tag(r readerutil.SizeReaderAt) (bool, error) {
	size := r.Size()
	if size < ID3v1TagLength {
		return false, nil
	}

	// Only the magic prefix of the would-be tag is needed for the check.
	magic := make([]byte, len(id3v1Magic))
	_, err := r.ReadAt(magic, size-ID3v1TagLength)
	if err != nil {
		return false, fmt.Errorf("Failed to read ID3v1 data: %v", err)
	}
	return bytes.Equal(magic, id3v1Magic), nil
}
// mpegVersion identifies an MPEG audio version.
type mpegVersion int

// MPEG audio versions used as keys of the lookup tables in this file.
const (
	mpegVersion1 mpegVersion = iota
	mpegVersion2
	mpegVersion2_5
)

// mpegVersionsByID translates the 2-bit version ID found in an MPEG header
// into the matching mpegVersion. ID 1 has no entry, so looking it up
// reports ok == false.
var mpegVersionsByID = map[uint32]mpegVersion{
	3: mpegVersion1,
	2: mpegVersion2,
	0: mpegVersion2_5,
}
// mpegLayer identifies an MPEG audio layer.
type mpegLayer int

// MPEG audio layers used as keys of the lookup tables in this file.
const (
	mpegLayer1 mpegLayer = iota
	mpegLayer2
	mpegLayer3
)

// mpegLayersByIndex translates the 2-bit layer index found in an MPEG header
// into the matching mpegLayer. Index 0 has no entry, so looking it up
// reports ok == false.
var mpegLayersByIndex = map[uint32]mpegLayer{
	3: mpegLayer1,
	2: mpegLayer2,
	1: mpegLayer3,
}
// mpegBitrates gives the bitrate, in kilobits, selected by the 4-bit bitrate
// index of an MPEG header for each version/layer combination. Each row is
// laid out eight entries per line (indexes 0-7, then 8-15). Indexes 0 and 15
// hold 0, which GetMPEGAudioDuration rejects as an invalid bitrate.
var mpegBitrates = map[mpegVersion]map[mpegLayer][16]int{
	mpegVersion1: {
		mpegLayer1: {
			0, 32, 64, 96, 128, 160, 192, 224,
			256, 288, 320, 352, 384, 416, 448, 0,
		},
		mpegLayer2: {
			0, 32, 48, 56, 64, 80, 96, 112,
			128, 160, 192, 224, 256, 320, 384, 0,
		},
		mpegLayer3: {
			0, 32, 40, 48, 56, 64, 80, 96,
			112, 128, 160, 192, 224, 256, 320, 0,
		},
	},
	mpegVersion2: {
		mpegLayer1: {
			0, 32, 48, 56, 64, 80, 96, 112,
			128, 144, 160, 176, 192, 224, 256, 0,
		},
		mpegLayer2: {
			0, 8, 16, 24, 32, 40, 48, 56,
			64, 80, 96, 112, 128, 144, 160, 0,
		},
		mpegLayer3: {
			0, 8, 16, 24, 32, 40, 48, 56,
			64, 80, 96, 112, 128, 144, 160, 0,
		},
	},
	// The version 2.5 rows repeat the version 2 values.
	mpegVersion2_5: {
		mpegLayer1: {
			0, 32, 48, 56, 64, 80, 96, 112,
			128, 144, 160, 176, 192, 224, 256, 0,
		},
		mpegLayer2: {
			0, 8, 16, 24, 32, 40, 48, 56,
			64, 80, 96, 112, 128, 144, 160, 0,
		},
		mpegLayer3: {
			0, 8, 16, 24, 32, 40, 48, 56,
			64, 80, 96, 112, 128, 144, 160, 0,
		},
	},
}
// mpegSamplingRates gives the sampling rate, in hertz, selected by the 2-bit
// sampling rate index of an MPEG header for each version. Index 3 is left at
// the array's zero value, which GetMPEGAudioDuration rejects as an invalid
// sample rate.
var mpegSamplingRates = map[mpegVersion][4]int{
	mpegVersion1:   {44100, 48000, 32000},
	mpegVersion2:   {22050, 24000, 16000},
	mpegVersion2_5: {11025, 12000, 8000},
}
// mpegSamplesPerFrame gives the number of samples carried by one frame for
// each version/layer combination. GetMPEGAudioDuration multiplies it by the
// frame count from a Xing header to obtain the total number of samples.
var mpegSamplesPerFrame = map[mpegVersion]map[mpegLayer]int{
	mpegVersion1:   {mpegLayer1: 384, mpegLayer2: 1152, mpegLayer3: 1152},
	mpegVersion2:   {mpegLayer1: 384, mpegLayer2: 1152, mpegLayer3: 576},
	mpegVersion2_5: {mpegLayer1: 384, mpegLayer2: 1152, mpegLayer3: 576},
}
// Four-byte names that GetMPEGAudioDuration looks for after the first
// frame's side information; either one marks the presence of a Xing header.
var (
	xingHeaderName = []byte("Xing")
	infoHeaderName = []byte("Info")
)
// GetMPEGAudioDuration reads the first frame in r and returns the audio length with millisecond precision.
// Format details are at http://www.codeproject.com/Articles/8295/MPEG-Audio-Frame-Header.
//
// r must start with an MPEG frame header; an error is returned if the sync
// bits are missing or if the version, layer, bitrate or sampling rate fields
// hold values that have no entry in the lookup tables.
//
// If the first frame carries a "Xing" or "Info" header that includes a frame
// count, the duration is derived from that count. A Xing header without a
// frame count is an error. When no such header is found the file is assumed
// to have a constant bitrate and the duration is estimated from r.Size() and
// the bitrate of the first frame.
func GetMPEGAudioDuration(r readerutil.SizeReaderAt) (time.Duration, error) {
	var header uint32
	if err := binary.Read(io.NewSectionReader(r, 0, r.Size()), binary.BigEndian, &header); err != nil {
		return 0, fmt.Errorf("Failed to read MPEG frame header: %v", err)
	}
	// getBits returns numBits bits of the header starting at startBit, where
	// bit 0 is the most significant bit.
	getBits := func(startBit, numBits uint) uint32 {
		return (header << startBit) >> (32 - numBits)
	}

	if getBits(0, 11) != 0x7ff {
		return 0, errors.New("Missing sync bits in MPEG frame header")
	}
	version, ok := mpegVersionsByID[getBits(11, 2)]
	if !ok {
		return 0, errors.New("Invalid MPEG version index")
	}
	layer, ok := mpegLayersByIndex[getBits(13, 2)]
	if !ok {
		return 0, errors.New("Invalid MPEG layer index")
	}
	bitrate := mpegBitrates[version][layer][getBits(16, 4)]
	if bitrate == 0 {
		return 0, errors.New("Invalid MPEG bitrate")
	}
	samplingRate := mpegSamplingRates[version][getBits(20, 2)]
	if samplingRate == 0 {
		return 0, errors.New("Invalid MPEG sample rate")
	}
	samplesPerFrame := mpegSamplesPerFrame[version][layer]

	// The Xing header follows the 4-byte frame header, the optional CRC and
	// the "side information". The side information is shorter in MPEG-2 and
	// MPEG-2.5 frames than in MPEG-1 frames, so its length depends on both
	// the version and the channel mode.
	mono := getBits(24, 2) == 0x3 // Channel mode; 0x3 is mono.
	var sideInfoLen int64
	switch {
	case version == mpegVersion1 && mono:
		sideInfoLen = 17
	case version == mpegVersion1:
		sideInfoLen = 32
	case mono:
		sideInfoLen = 9
	default:
		sideInfoLen = 17
	}
	xingHeaderStart := int64(4) + sideInfoLen
	// Skip 16-bit CRC if present.
	if getBits(15, 1) == 0x0 { // 0x0 means "has protection".
		xingHeaderStart += 2
	}

	// Layout of the 12 bytes read: 4-byte name, 4-byte flags, 4-byte frame count.
	b := make([]byte, 12)
	// io.ReaderAt may report io.EOF alongside a complete read that ends
	// exactly at the end of the input; that is not a failure.
	if n, err := r.ReadAt(b, xingHeaderStart); err != nil && !(err == io.EOF && n == len(b)) {
		return 0, fmt.Errorf("Unable to read Xing header at %d: %v", xingHeaderStart, err)
	}

	var ms int64
	if bytes.Equal(b[:4], xingHeaderName) || bytes.Equal(b[:4], infoHeaderName) {
		xingFlags := binary.BigEndian.Uint32(b[4:8])
		// Bit 0 of the flags says whether the frame count field is present.
		if xingFlags&0x1 == 0x0 {
			return 0, fmt.Errorf("Xing header at %d lacks number of frames", xingHeaderStart)
		}
		numFrames := binary.BigEndian.Uint32(b[8:12])
		ms = int64(samplesPerFrame) * int64(numFrames) * 1000 / int64(samplingRate)
	} else {
		// Okay, no Xing VBR header. Assume that the file has a constant bitrate.
		// (The other alternative is to read the whole file and examine each frame.)
		// bitrate is in kilobits per second, so bits/bitrate is already in
		// milliseconds. Multiply before dividing to keep millisecond precision.
		ms = r.Size() * 8 / int64(bitrate)
	}
	return time.Duration(ms) * time.Millisecond, nil
}