1
1
mirror of https://github.com/wader/fq.git synced 2024-11-27 14:14:58 +03:00
fq/format/wav/wav.go

214 lines
5.8 KiB
Go

package wav
// http://soundfile.sapp.org/doc/WaveFormat/
// https://github.com/FFmpeg/FFmpeg/blob/master/libavformat/wavdec.c
// https://tech.ebu.ch/docs/tech/tech3285.pdf
// http://www-mmsp.ece.mcgill.ca/Documents/AudioFormats/WAVE/WAVE.html
// TODO: audio/wav
// TODO: default little endian
import (
"fmt"
"strings"
"github.com/wader/fq/format"
"github.com/wader/fq/format/registry"
"github.com/wader/fq/pkg/decode"
"github.com/wader/fq/pkg/scalar"
)
var headerFormat decode.Group
var footerFormat decode.Group
func init() {
registry.MustRegister(decode.Format{
Name: format.WAV,
ProbeOrder: 10, // after most others (overlap some with webp)
Description: "WAV file",
Groups: []string{format.PROBE},
DecodeFn: wavDecode,
Dependencies: []decode.Dependency{
{Names: []string{format.ID3V2}, Group: &headerFormat},
{Names: []string{format.ID3V1, format.ID3V11}, Group: &footerFormat},
},
})
}
const (
formatExtensible = 0xfffe
)
// transformed from ffmpeg libavformat/riff.c
var audioFormatName = scalar.UToSymStr{
0x0001: "pcm",
0x0002: "adpcm_ms",
0x0003: "pcm_float",
/* must come after f32le in this list */
0x0006: "pcm_alaw",
0x0007: "pcm_mulaw",
0x000a: "wmavoice",
0x0010: "adpcm_ima_oki",
0x0011: "adpcm_ima_wav",
/* must come after adpcm_ima_wav in this list */
0x0017: "adpcm_ima_oki",
0x0020: "adpcm_yamaha",
0x0022: "truespeech",
0x0031: "gsm_ms",
0x0032: "gsm_ms", /* msn audio */
0x0038: "amr_nb", /* rogue format number */
0x0042: "g723_1",
0x0045: "adpcm_g726",
0x0014: "adpcm_g726", /* g723 Antex */
0x0040: "adpcm_g726", /* g721 Antex */
0x0050: "mp2",
0x0055: "mp3",
0x0057: "amr_nb",
0x0058: "amr_wb",
/* rogue format number */
0x0061: "adpcm_ima_dk4",
/* rogue format number */
0x0062: "adpcm_ima_dk3",
0x0064: "adpcm_g726",
0x0069: "adpcm_ima_wav",
0x0075: "metasound",
0x0083: "g729",
0x00ff: "aac",
0x0111: "g723_1",
0x0130: "sipr",
0x0135: "acelp_kelvin",
0x0160: "wmav1",
0x0161: "wmav2",
0x0162: "wmapro",
0x0163: "wmalossless",
0x0165: "xma1",
0x0166: "xma2",
0x0200: "adpcm_ct",
0x0215: "dvaudio",
0x0216: "dvaudio",
0x0270: "atrac3",
0x028f: "adpcm_g722",
0x0401: "imc",
0x0402: "iac",
0x0500: "on2avc",
0x0501: "on2avc",
0x1500: "gsm_ms",
0x1501: "truespeech",
0x1600: "aac",
0x1602: "aac_latm",
0x2000: "ac3",
0x2001: "dts",
0x2048: "sonic",
0x6c75: "pcm_mulaw",
0x706d: "aac",
0x4143: "aac",
0x594a: "xan_dpcm",
0x729a: "g729",
0xa100: "g723_1", /* Comverse Infosys Ltd. G723 1 */
0xa106: "aac",
0xa109: "speex",
0xf1ac: "flac",
('S' << 8) + 'F': "adpcm_swf",
/* HACK/FIXME: Does Vorbis in WAV/AVI have an (in)official ID? */
('V' << 8) + 'o': "vorbis",
formatExtensible: "extensible",
}
var (
subFormatPCMBytes = [16]byte{0x01, 0x00, 0x00, 0x00, 0x00, 0x00, 0x10, 0x00, 0x80, 0x00, 0x00, 0xaa, 0x00, 0x38, 0x9b, 0x71}
subFormatIEEEFloat = [16]byte{0x03, 0x00, 0x00, 0x00, 0x00, 0x00, 0x10, 0x00, 0x80, 0x00, 0x00, 0xaa, 0x00, 0x38, 0x9b, 0x71}
)
var subFormatNames = scalar.BytesToScalar{
{Bytes: subFormatPCMBytes[:], Scalar: scalar.S{Sym: "pcm"}},
{Bytes: subFormatIEEEFloat[:], Scalar: scalar.S{Sym: "ieee_float"}},
}
func decodeChunk(d *decode.D, expectedChunkID string, stringData bool) int64 { //nolint:unparam
d.Endian = decode.LittleEndian
chunks := map[string]func(d *decode.D){
"RIFF": func(d *decode.D) {
d.FieldUTF8("format", 4)
decodeChunks(d, false)
},
"fmt": func(d *decode.D) {
audioFormat := d.FieldU16("audio_format", audioFormatName)
d.FieldU16("num_channels")
d.FieldU32("sample_rate")
d.FieldU32("byte_rate")
d.FieldU16("block_align")
d.FieldU16("bits_per_sample")
if audioFormat == formatExtensible && d.BitsLeft() > 0 {
d.FieldU16("extension_size")
d.FieldU16("valid_bits_per_sample")
d.FieldU32("channel_mask")
d.FieldRawLen("sub_format", 16*8, subFormatNames)
}
},
"data": func(d *decode.D) {
d.FieldRawLen("samples", d.BitsLeft())
},
"LIST": func(d *decode.D) {
d.FieldUTF8("list_type", 4)
decodeChunks(d, true)
},
"fact": func(d *decode.D) {
d.FieldU32("sample_length")
},
}
trimChunkID := d.FieldStrFn("id", func(d *decode.D) string {
return strings.TrimSpace(d.UTF8(4))
})
if expectedChunkID != "" && trimChunkID != expectedChunkID {
d.Errorf(fmt.Sprintf("expected chunk id %q found %q", expectedChunkID, trimChunkID))
}
const restOfFileLen = 0xffffffff
chunkLen := int64(d.FieldUScalarFn("size", func(d *decode.D) scalar.S {
l := d.U32()
if l == restOfFileLen {
return scalar.S{Actual: l, ActualDisplay: scalar.NumberHex, Sym: "rest of file"}
}
return scalar.S{Actual: l, ActualDisplay: scalar.NumberDecimal}
}))
if chunkLen == restOfFileLen {
chunkLen = d.BitsLeft() / 8
}
if fn, ok := chunks[trimChunkID]; ok {
d.FramedFn(chunkLen*8, fn)
} else {
if stringData {
d.FieldUTF8("data", int(chunkLen), scalar.Trim(" \x00"))
} else {
d.FieldRawLen("data", chunkLen*8)
}
}
if chunkLen%2 != 0 {
d.FieldRawLen("align", 8)
}
return chunkLen + 8
}
func decodeChunks(d *decode.D, stringData bool) {
d.FieldStructArrayLoop("chunks", "chunk", d.NotEnd, func(d *decode.D) {
decodeChunk(d, "", stringData)
})
}
func wavDecode(d *decode.D, in interface{}) interface{} {
// there are wav files in the wild with id3v2 header id3v1 footer
_, _, _ = d.TryFieldFormat("header", headerFormat, nil)
decodeChunk(d, "RIFF", false)
_, _, _ = d.TryFieldFormat("footer", footerFormat, nil)
return nil
}