ffmpeg / libavformat / wav.c @ 5509bffa
History | View | Annotate | Download (12 KB)
1 |
/*
|
---|---|
2 |
* WAV encoder and decoder
|
3 |
* Copyright (c) 2001, 2002 Fabrice Bellard.
|
4 |
*
|
5 |
* This library is free software; you can redistribute it and/or
|
6 |
* modify it under the terms of the GNU Lesser General Public
|
7 |
* License as published by the Free Software Foundation; either
|
8 |
* version 2 of the License, or (at your option) any later version.
|
9 |
*
|
10 |
* This library is distributed in the hope that it will be useful,
|
11 |
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
12 |
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
13 |
* Lesser General Public License for more details.
|
14 |
*
|
15 |
* You should have received a copy of the GNU Lesser General Public
|
16 |
* License along with this library; if not, write to the Free Software
|
17 |
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
|
18 |
*/
|
19 |
#include "avformat.h" |
20 |
#include "avi.h" |
21 |
|
22 |
const CodecTag codec_wav_tags[] = {
|
23 |
{ CODEC_ID_MP2, 0x50 },
|
24 |
{ CODEC_ID_MP3, 0x55 },
|
25 |
{ CODEC_ID_AC3, 0x2000 },
|
26 |
{ CODEC_ID_DTS, 0x2001 },
|
27 |
{ CODEC_ID_PCM_S16LE, 0x01 },
|
28 |
{ CODEC_ID_PCM_U8, 0x01 }, /* must come after s16le in this list */ |
29 |
{ CODEC_ID_PCM_S24LE, 0x01 },
|
30 |
{ CODEC_ID_PCM_S32LE, 0x01 },
|
31 |
{ CODEC_ID_PCM_ALAW, 0x06 },
|
32 |
{ CODEC_ID_PCM_MULAW, 0x07 },
|
33 |
{ CODEC_ID_ADPCM_MS, 0x02 },
|
34 |
{ CODEC_ID_ADPCM_IMA_WAV, 0x11 },
|
35 |
{ CODEC_ID_ADPCM_YAMAHA, 0x20 },
|
36 |
{ CODEC_ID_ADPCM_G726, 0x45 },
|
37 |
{ CODEC_ID_ADPCM_IMA_DK4, 0x61 }, /* rogue format number */ |
38 |
{ CODEC_ID_ADPCM_IMA_DK3, 0x62 }, /* rogue format number */ |
39 |
{ CODEC_ID_WMAV1, 0x160 },
|
40 |
{ CODEC_ID_WMAV2, 0x161 },
|
41 |
{ CODEC_ID_AAC, 0x706d },
|
42 |
{ CODEC_ID_VORBIS, ('V'<<8)+'o' }, //HACK/FIXME, does vorbis in WAV/AVI have an (in)official id? |
43 |
{ CODEC_ID_SONIC, 0x2048 },
|
44 |
{ CODEC_ID_SONIC_LS, 0x2048 },
|
45 |
{ CODEC_ID_ADPCM_CT, 0x200 },
|
46 |
{ CODEC_ID_ADPCM_SWF, ('S'<<8)+'F' }, |
47 |
{ CODEC_ID_TRUESPEECH, 0x22 },
|
48 |
{ 0, 0 }, |
49 |
}; |
50 |
|
51 |
#ifdef CONFIG_MUXERS
|
52 |
/* WAVEFORMATEX header */
|
53 |
/* returns the size or -1 on error */
|
54 |
int put_wav_header(ByteIOContext *pb, AVCodecContext *enc)
|
55 |
{ |
56 |
int bps, blkalign, bytespersec;
|
57 |
int hdrsize = 18; |
58 |
|
59 |
if(!enc->codec_tag)
|
60 |
enc->codec_tag = codec_get_tag(codec_wav_tags, enc->codec_id); |
61 |
if(!enc->codec_tag)
|
62 |
return -1; |
63 |
|
64 |
put_le16(pb, enc->codec_tag); |
65 |
put_le16(pb, enc->channels); |
66 |
put_le32(pb, enc->sample_rate); |
67 |
if (enc->codec_id == CODEC_ID_PCM_U8 ||
|
68 |
enc->codec_id == CODEC_ID_PCM_ALAW || |
69 |
enc->codec_id == CODEC_ID_PCM_MULAW) { |
70 |
bps = 8;
|
71 |
} else if (enc->codec_id == CODEC_ID_MP2 || enc->codec_id == CODEC_ID_MP3) { |
72 |
bps = 0;
|
73 |
} else if (enc->codec_id == CODEC_ID_ADPCM_IMA_WAV || enc->codec_id == CODEC_ID_ADPCM_MS || enc->codec_id == CODEC_ID_ADPCM_G726 || enc->codec_id == CODEC_ID_ADPCM_YAMAHA) { // |
74 |
bps = 4;
|
75 |
} else if (enc->codec_id == CODEC_ID_PCM_S24LE) { |
76 |
bps = 24;
|
77 |
} else if (enc->codec_id == CODEC_ID_PCM_S32LE) { |
78 |
bps = 32;
|
79 |
} else {
|
80 |
bps = 16;
|
81 |
} |
82 |
|
83 |
if (enc->codec_id == CODEC_ID_MP2 || enc->codec_id == CODEC_ID_MP3) {
|
84 |
blkalign = enc->frame_size; //this is wrong, but seems many demuxers dont work if this is set correctly
|
85 |
//blkalign = 144 * enc->bit_rate/enc->sample_rate;
|
86 |
} else if (enc->codec_id == CODEC_ID_ADPCM_G726) { // |
87 |
blkalign = 1;
|
88 |
} else if (enc->block_align != 0) { /* specified by the codec */ |
89 |
blkalign = enc->block_align; |
90 |
} else
|
91 |
blkalign = enc->channels*bps >> 3;
|
92 |
if (enc->codec_id == CODEC_ID_PCM_U8 ||
|
93 |
enc->codec_id == CODEC_ID_PCM_S24LE || |
94 |
enc->codec_id == CODEC_ID_PCM_S32LE || |
95 |
enc->codec_id == CODEC_ID_PCM_S16LE) { |
96 |
bytespersec = enc->sample_rate * blkalign; |
97 |
} else {
|
98 |
bytespersec = enc->bit_rate / 8;
|
99 |
} |
100 |
put_le32(pb, bytespersec); /* bytes per second */
|
101 |
put_le16(pb, blkalign); /* block align */
|
102 |
put_le16(pb, bps); /* bits per sample */
|
103 |
if (enc->codec_id == CODEC_ID_MP3) {
|
104 |
put_le16(pb, 12); /* wav_extra_size */ |
105 |
hdrsize += 12;
|
106 |
put_le16(pb, 1); /* wID */ |
107 |
put_le32(pb, 2); /* fdwFlags */ |
108 |
put_le16(pb, 1152); /* nBlockSize */ |
109 |
put_le16(pb, 1); /* nFramesPerBlock */ |
110 |
put_le16(pb, 1393); /* nCodecDelay */ |
111 |
} else if (enc->codec_id == CODEC_ID_MP2) { |
112 |
put_le16(pb, 22); /* wav_extra_size */ |
113 |
hdrsize += 22;
|
114 |
put_le16(pb, 2); /* fwHeadLayer */ |
115 |
put_le32(pb, enc->bit_rate); /* dwHeadBitrate */
|
116 |
put_le16(pb, enc->channels == 2 ? 1 : 8); /* fwHeadMode */ |
117 |
put_le16(pb, 0); /* fwHeadModeExt */ |
118 |
put_le16(pb, 1); /* wHeadEmphasis */ |
119 |
put_le16(pb, 16); /* fwHeadFlags */ |
120 |
put_le32(pb, 0); /* dwPTSLow */ |
121 |
put_le32(pb, 0); /* dwPTSHigh */ |
122 |
} else if (enc->codec_id == CODEC_ID_ADPCM_IMA_WAV) { |
123 |
put_le16(pb, 2); /* wav_extra_size */ |
124 |
hdrsize += 2;
|
125 |
put_le16(pb, ((enc->block_align - 4 * enc->channels) / (4 * enc->channels)) * 8 + 1); /* wSamplesPerBlock */ |
126 |
} else if(enc->extradata_size){ |
127 |
put_le16(pb, enc->extradata_size); |
128 |
put_buffer(pb, enc->extradata, enc->extradata_size); |
129 |
hdrsize += enc->extradata_size; |
130 |
if(hdrsize&1){ |
131 |
hdrsize++; |
132 |
put_byte(pb, 0);
|
133 |
} |
134 |
} else {
|
135 |
hdrsize -= 2;
|
136 |
} |
137 |
|
138 |
return hdrsize;
|
139 |
} |
140 |
#endif //CONFIG_MUXERS |
141 |
|
142 |
/* We could be given one of the three possible structures here:
|
143 |
* WAVEFORMAT, PCMWAVEFORMAT or WAVEFORMATEX. Each structure
|
144 |
* is an expansion of the previous one with the fields added
|
145 |
* at the bottom. PCMWAVEFORMAT adds 'WORD wBitsPerSample' and
|
146 |
* WAVEFORMATEX adds 'WORD cbSize' and basically makes itself
|
147 |
* an openended structure.
|
148 |
*/
|
149 |
void get_wav_header(ByteIOContext *pb, AVCodecContext *codec, int size) |
150 |
{ |
151 |
int id;
|
152 |
|
153 |
id = get_le16(pb); |
154 |
codec->codec_type = CODEC_TYPE_AUDIO; |
155 |
codec->codec_tag = id; |
156 |
codec->channels = get_le16(pb); |
157 |
codec->sample_rate = get_le32(pb); |
158 |
codec->bit_rate = get_le32(pb) * 8;
|
159 |
codec->block_align = get_le16(pb); |
160 |
if (size == 14) { /* We're dealing with plain vanilla WAVEFORMAT */ |
161 |
codec->bits_per_sample = 8;
|
162 |
}else
|
163 |
codec->bits_per_sample = get_le16(pb); |
164 |
codec->codec_id = wav_codec_get_id(id, codec->bits_per_sample); |
165 |
|
166 |
if (size > 16) { /* We're obviously dealing with WAVEFORMATEX */ |
167 |
codec->extradata_size = get_le16(pb); |
168 |
if (codec->extradata_size > 0) { |
169 |
if (codec->extradata_size > size - 18) |
170 |
codec->extradata_size = size - 18;
|
171 |
codec->extradata = av_mallocz(codec->extradata_size + FF_INPUT_BUFFER_PADDING_SIZE); |
172 |
get_buffer(pb, codec->extradata, codec->extradata_size); |
173 |
} else
|
174 |
codec->extradata_size = 0;
|
175 |
|
176 |
/* It is possible for the chunk to contain garbage at the end */
|
177 |
if (size - codec->extradata_size - 18 > 0) |
178 |
url_fskip(pb, size - codec->extradata_size - 18);
|
179 |
} |
180 |
} |
181 |
|
182 |
|
183 |
int wav_codec_get_id(unsigned int tag, int bps) |
184 |
{ |
185 |
int id;
|
186 |
id = codec_get_id(codec_wav_tags, tag); |
187 |
if (id <= 0) |
188 |
return id;
|
189 |
/* handle specific u8 codec */
|
190 |
if (id == CODEC_ID_PCM_S16LE && bps == 8) |
191 |
id = CODEC_ID_PCM_U8; |
192 |
if (id == CODEC_ID_PCM_S16LE && bps == 24) |
193 |
id = CODEC_ID_PCM_S24LE; |
194 |
if (id == CODEC_ID_PCM_S16LE && bps == 32) |
195 |
id = CODEC_ID_PCM_S32LE; |
196 |
return id;
|
197 |
} |
198 |
|
199 |
#ifdef CONFIG_MUXERS
|
200 |
typedef struct { |
201 |
offset_t data; |
202 |
} WAVContext; |
203 |
|
204 |
static int wav_write_header(AVFormatContext *s) |
205 |
{ |
206 |
WAVContext *wav = s->priv_data; |
207 |
ByteIOContext *pb = &s->pb; |
208 |
offset_t fmt; |
209 |
|
210 |
put_tag(pb, "RIFF");
|
211 |
put_le32(pb, 0); /* file length */ |
212 |
put_tag(pb, "WAVE");
|
213 |
|
214 |
/* format header */
|
215 |
fmt = start_tag(pb, "fmt ");
|
216 |
if (put_wav_header(pb, s->streams[0]->codec) < 0) { |
217 |
av_free(wav); |
218 |
return -1; |
219 |
} |
220 |
end_tag(pb, fmt); |
221 |
|
222 |
av_set_pts_info(s->streams[0], 64, 1, s->streams[0]->codec->sample_rate); |
223 |
|
224 |
/* data header */
|
225 |
wav->data = start_tag(pb, "data");
|
226 |
|
227 |
put_flush_packet(pb); |
228 |
|
229 |
return 0; |
230 |
} |
231 |
|
232 |
static int wav_write_packet(AVFormatContext *s, AVPacket *pkt) |
233 |
{ |
234 |
ByteIOContext *pb = &s->pb; |
235 |
put_buffer(pb, pkt->data, pkt->size); |
236 |
return 0; |
237 |
} |
238 |
|
239 |
static int wav_write_trailer(AVFormatContext *s) |
240 |
{ |
241 |
ByteIOContext *pb = &s->pb; |
242 |
WAVContext *wav = s->priv_data; |
243 |
offset_t file_size; |
244 |
|
245 |
if (!url_is_streamed(&s->pb)) {
|
246 |
end_tag(pb, wav->data); |
247 |
|
248 |
/* update file size */
|
249 |
file_size = url_ftell(pb); |
250 |
url_fseek(pb, 4, SEEK_SET);
|
251 |
put_le32(pb, (uint32_t)(file_size - 8));
|
252 |
url_fseek(pb, file_size, SEEK_SET); |
253 |
|
254 |
put_flush_packet(pb); |
255 |
} |
256 |
return 0; |
257 |
} |
258 |
#endif //CONFIG_MUXERS |
259 |
|
260 |
/* return the size of the found tag */
|
261 |
/* XXX: > 2GB ? */
|
262 |
static int find_tag(ByteIOContext *pb, uint32_t tag1) |
263 |
{ |
264 |
unsigned int tag; |
265 |
int size;
|
266 |
|
267 |
for(;;) {
|
268 |
if (url_feof(pb))
|
269 |
return -1; |
270 |
tag = get_le32(pb); |
271 |
size = get_le32(pb); |
272 |
if (tag == tag1)
|
273 |
break;
|
274 |
url_fseek(pb, size, SEEK_CUR); |
275 |
} |
276 |
if (size < 0) |
277 |
size = 0x7fffffff;
|
278 |
return size;
|
279 |
} |
280 |
|
281 |
static int wav_probe(AVProbeData *p) |
282 |
{ |
283 |
/* check file header */
|
284 |
if (p->buf_size <= 32) |
285 |
return 0; |
286 |
if (p->buf[0] == 'R' && p->buf[1] == 'I' && |
287 |
p->buf[2] == 'F' && p->buf[3] == 'F' && |
288 |
p->buf[8] == 'W' && p->buf[9] == 'A' && |
289 |
p->buf[10] == 'V' && p->buf[11] == 'E') |
290 |
return AVPROBE_SCORE_MAX;
|
291 |
else
|
292 |
return 0; |
293 |
} |
294 |
|
295 |
/* wav input */
|
296 |
static int wav_read_header(AVFormatContext *s, |
297 |
AVFormatParameters *ap) |
298 |
{ |
299 |
int size;
|
300 |
unsigned int tag; |
301 |
ByteIOContext *pb = &s->pb; |
302 |
AVStream *st; |
303 |
|
304 |
/* check RIFF header */
|
305 |
tag = get_le32(pb); |
306 |
|
307 |
if (tag != MKTAG('R', 'I', 'F', 'F')) |
308 |
return -1; |
309 |
get_le32(pb); /* file size */
|
310 |
tag = get_le32(pb); |
311 |
if (tag != MKTAG('W', 'A', 'V', 'E')) |
312 |
return -1; |
313 |
|
314 |
/* parse fmt header */
|
315 |
size = find_tag(pb, MKTAG('f', 'm', 't', ' ')); |
316 |
if (size < 0) |
317 |
return -1; |
318 |
st = av_new_stream(s, 0);
|
319 |
if (!st)
|
320 |
return AVERROR_NOMEM;
|
321 |
|
322 |
get_wav_header(pb, st->codec, size); |
323 |
st->need_parsing = 1;
|
324 |
|
325 |
av_set_pts_info(st, 64, 1, st->codec->sample_rate); |
326 |
|
327 |
size = find_tag(pb, MKTAG('d', 'a', 't', 'a')); |
328 |
if (size < 0) |
329 |
return -1; |
330 |
return 0; |
331 |
} |
332 |
|
333 |
#define MAX_SIZE 4096 |
334 |
|
335 |
static int wav_read_packet(AVFormatContext *s, |
336 |
AVPacket *pkt) |
337 |
{ |
338 |
int ret, size;
|
339 |
AVStream *st; |
340 |
|
341 |
if (url_feof(&s->pb))
|
342 |
return AVERROR_IO;
|
343 |
st = s->streams[0];
|
344 |
|
345 |
size = MAX_SIZE; |
346 |
if (st->codec->block_align > 1) { |
347 |
if (size < st->codec->block_align)
|
348 |
size = st->codec->block_align; |
349 |
size = (size / st->codec->block_align) * st->codec->block_align; |
350 |
} |
351 |
if (av_new_packet(pkt, size))
|
352 |
return AVERROR_IO;
|
353 |
pkt->stream_index = 0;
|
354 |
|
355 |
ret = get_buffer(&s->pb, pkt->data, pkt->size); |
356 |
if (ret < 0) |
357 |
av_free_packet(pkt); |
358 |
/* note: we need to modify the packet size here to handle the last
|
359 |
packet */
|
360 |
pkt->size = ret; |
361 |
return ret;
|
362 |
} |
363 |
|
364 |
static int wav_read_close(AVFormatContext *s) |
365 |
{ |
366 |
return 0; |
367 |
} |
368 |
|
369 |
static int wav_read_seek(AVFormatContext *s, |
370 |
int stream_index, int64_t timestamp, int flags) |
371 |
{ |
372 |
AVStream *st; |
373 |
|
374 |
st = s->streams[0];
|
375 |
switch(st->codec->codec_id) {
|
376 |
case CODEC_ID_MP2:
|
377 |
case CODEC_ID_MP3:
|
378 |
case CODEC_ID_AC3:
|
379 |
case CODEC_ID_DTS:
|
380 |
/* use generic seeking with dynamically generated indexes */
|
381 |
return -1; |
382 |
default:
|
383 |
break;
|
384 |
} |
385 |
return pcm_read_seek(s, stream_index, timestamp, flags);
|
386 |
} |
387 |
|
388 |
|
389 |
static AVInputFormat wav_iformat = {
|
390 |
"wav",
|
391 |
"wav format",
|
392 |
0,
|
393 |
wav_probe, |
394 |
wav_read_header, |
395 |
wav_read_packet, |
396 |
wav_read_close, |
397 |
wav_read_seek, |
398 |
}; |
399 |
|
400 |
#ifdef CONFIG_MUXERS
|
401 |
static AVOutputFormat wav_oformat = {
|
402 |
"wav",
|
403 |
"wav format",
|
404 |
"audio/x-wav",
|
405 |
"wav",
|
406 |
sizeof(WAVContext),
|
407 |
CODEC_ID_PCM_S16LE, |
408 |
CODEC_ID_NONE, |
409 |
wav_write_header, |
410 |
wav_write_packet, |
411 |
wav_write_trailer, |
412 |
}; |
413 |
#endif //CONFIG_MUXERS |
414 |
|
415 |
int ff_wav_init(void) |
416 |
{ |
417 |
av_register_input_format(&wav_iformat); |
418 |
#ifdef CONFIG_MUXERS
|
419 |
av_register_output_format(&wav_oformat); |
420 |
#endif //CONFIG_MUXERS |
421 |
return 0; |
422 |
} |