wav.c revision 1.12 1 1.12 christos /* $NetBSD: wav.c,v 1.12 2013/10/18 20:47:06 christos Exp $ */
2 1.3 mrg
3 1.1 mrg /*
4 1.9 mrg * Copyright (c) 2002, 2009 Matthew R. Green
5 1.1 mrg * All rights reserved.
6 1.1 mrg *
7 1.1 mrg * Redistribution and use in source and binary forms, with or without
8 1.1 mrg * modification, are permitted provided that the following conditions
9 1.1 mrg * are met:
10 1.1 mrg * 1. Redistributions of source code must retain the above copyright
11 1.1 mrg * notice, this list of conditions and the following disclaimer.
12 1.1 mrg * 2. Redistributions in binary form must reproduce the above copyright
13 1.1 mrg * notice, this list of conditions and the following disclaimer in the
14 1.1 mrg * documentation and/or other materials provided with the distribution.
15 1.1 mrg *
16 1.1 mrg * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
17 1.1 mrg * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
18 1.1 mrg * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
19 1.1 mrg * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
20 1.1 mrg * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
21 1.1 mrg * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
22 1.1 mrg * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
23 1.1 mrg * AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
24 1.1 mrg * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
25 1.1 mrg * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
26 1.1 mrg * SUCH DAMAGE.
27 1.1 mrg */
28 1.1 mrg
29 1.1 mrg /*
30 1.1 mrg * WAV support for the audio tools; thanks go to the sox utility for
31 1.1 mrg * clearing up issues with WAV files.
32 1.1 mrg */
33 1.6 agc #include <sys/cdefs.h>
34 1.6 agc
35 1.6 agc #ifndef lint
36 1.12 christos __RCSID("$NetBSD: wav.c,v 1.12 2013/10/18 20:47:06 christos Exp $");
37 1.6 agc #endif
38 1.6 agc
39 1.1 mrg
40 1.1 mrg #include <sys/types.h>
41 1.1 mrg #include <sys/audioio.h>
42 1.1 mrg #include <sys/ioctl.h>
43 1.1 mrg #include <sys/time.h>
44 1.1 mrg
45 1.1 mrg #include <ctype.h>
46 1.1 mrg #include <err.h>
47 1.1 mrg #include <stdio.h>
48 1.1 mrg #include <stdlib.h>
49 1.1 mrg #include <string.h>
50 1.9 mrg #include <stdint.h>
51 1.11 mrg #include <unistd.h>
52 1.1 mrg
53 1.1 mrg #include "libaudio.h"
54 1.11 mrg #include "auconv.h"
55 1.1 mrg
56 1.10 joerg static const struct {
57 1.1 mrg int wenc;
58 1.2 mrg const char *wname;
59 1.1 mrg } wavencs[] = {
60 1.1 mrg { WAVE_FORMAT_UNKNOWN, "Microsoft Official Unknown" },
61 1.1 mrg { WAVE_FORMAT_PCM, "Microsoft PCM" },
62 1.1 mrg { WAVE_FORMAT_ADPCM, "Microsoft ADPCM" },
63 1.1 mrg { WAVE_FORMAT_ALAW, "Microsoft A-law" },
64 1.5 wiz { WAVE_FORMAT_MULAW, "Microsoft mu-law" },
65 1.1 mrg { WAVE_FORMAT_OKI_ADPCM,"OKI ADPCM" },
66 1.1 mrg { WAVE_FORMAT_DIGISTD, "Digistd format" },
67 1.1 mrg { WAVE_FORMAT_DIGIFIX, "Digifix format" },
68 1.1 mrg { -1, "?Unknown?" },
69 1.1 mrg };
70 1.1 mrg
71 1.2 mrg const char *
72 1.2 mrg wav_enc_from_val(int encoding)
73 1.1 mrg {
74 1.1 mrg int i;
75 1.1 mrg
76 1.1 mrg for (i = 0; wavencs[i].wenc != -1; i++)
77 1.1 mrg if (wavencs[i].wenc == encoding)
78 1.1 mrg break;
79 1.1 mrg return (wavencs[i].wname);
80 1.1 mrg }
81 1.1 mrg
82 1.1 mrg /*
83 1.1 mrg * sample header is:
84 1.1 mrg *
85 1.1 mrg * RIFF\^@^C^@WAVEfmt ^P^@^@^@^A^@^B^@D<AC>^@^@^P<B1>^B^@^D^@^P^@data^@^@^C^@^@^@^@^@^@^@^@^@^@
86 1.1 mrg *
87 1.1 mrg */
88 1.1 mrg /*
89 1.1 mrg * WAV format helpers
90 1.1 mrg */
91 1.1 mrg /*
92 1.1 mrg * find a .wav header, etc. returns header length on success
93 1.1 mrg */
94 1.1 mrg ssize_t
95 1.10 joerg audio_wav_parse_hdr(void *hdr, size_t sz, u_int *enc, u_int *prec,
96 1.10 joerg u_int *sample, u_int *channels, size_t *datasize)
97 1.1 mrg {
98 1.1 mrg char *where = hdr, *owhere;
99 1.1 mrg wav_audioheaderpart part;
100 1.1 mrg wav_audioheaderfmt fmt;
101 1.9 mrg wav_audiohdrextensible ext;
102 1.1 mrg char *end = (((char *)hdr) + sz);
103 1.7 mrg u_int newenc, newprec;
104 1.9 mrg u_int16_t fmttag;
105 1.2 mrg static const char
106 1.2 mrg strfmt[4] = "fmt ",
107 1.2 mrg strRIFF[4] = "RIFF",
108 1.2 mrg strWAVE[4] = "WAVE",
109 1.2 mrg strdata[4] = "data";
110 1.2 mrg
111 1.1 mrg if (sz < 32)
112 1.1 mrg return (AUDIO_ENOENT);
113 1.1 mrg
114 1.2 mrg if (strncmp(where, strRIFF, sizeof strRIFF))
115 1.1 mrg return (AUDIO_ENOENT);
116 1.1 mrg where += 8;
117 1.2 mrg if (strncmp(where, strWAVE, sizeof strWAVE))
118 1.1 mrg return (AUDIO_ENOENT);
119 1.1 mrg where += 4;
120 1.1 mrg
121 1.1 mrg do {
122 1.1 mrg memcpy(&part, where, sizeof part);
123 1.1 mrg owhere = where;
124 1.1 mrg where += getle32(part.len) + 8;
125 1.2 mrg } while (where < end && strncmp(part.name, strfmt, sizeof strfmt));
126 1.1 mrg
127 1.1 mrg /* too short ? */
128 1.1 mrg if (where + sizeof fmt > end)
129 1.1 mrg return (AUDIO_ESHORTHDR);
130 1.1 mrg
131 1.1 mrg memcpy(&fmt, (owhere + 8), sizeof fmt);
132 1.1 mrg
133 1.9 mrg fmttag = getle16(fmt.tag);
134 1.9 mrg if (verbose)
135 1.9 mrg printf("WAVE format tag: %x\n", fmttag);
136 1.9 mrg
137 1.9 mrg if (fmttag == WAVE_FORMAT_EXTENSIBLE) {
138 1.9 mrg if ((uintptr_t)(where - owhere) < sizeof(fmt) + sizeof(ext))
139 1.9 mrg return (AUDIO_ESHORTHDR);
140 1.9 mrg memcpy(&ext, owhere + sizeof fmt, sizeof ext);
141 1.9 mrg if (getle16(ext.len) < sizeof(ext) - sizeof(ext.len))
142 1.9 mrg return (AUDIO_ESHORTHDR);
143 1.9 mrg fmttag = ext.sub_tag;
144 1.9 mrg if (verbose)
145 1.9 mrg printf("WAVE extensible sub tag: %x\n", fmttag);
146 1.9 mrg }
147 1.9 mrg
148 1.9 mrg switch (fmttag) {
149 1.1 mrg case WAVE_FORMAT_UNKNOWN:
150 1.1 mrg case IBM_FORMAT_MULAW:
151 1.1 mrg case IBM_FORMAT_ALAW:
152 1.1 mrg case IBM_FORMAT_ADPCM:
153 1.1 mrg default:
154 1.1 mrg return (AUDIO_EWAVUNSUPP);
155 1.1 mrg
156 1.1 mrg case WAVE_FORMAT_PCM:
157 1.9 mrg case WAVE_FORMAT_ADPCM:
158 1.9 mrg case WAVE_FORMAT_OKI_ADPCM:
159 1.9 mrg case WAVE_FORMAT_IMA_ADPCM:
160 1.9 mrg case WAVE_FORMAT_DIGIFIX:
161 1.9 mrg case WAVE_FORMAT_DIGISTD:
162 1.1 mrg switch (getle16(fmt.bits_per_sample)) {
163 1.1 mrg case 8:
164 1.1 mrg newprec = 8;
165 1.1 mrg break;
166 1.1 mrg case 16:
167 1.1 mrg newprec = 16;
168 1.1 mrg break;
169 1.1 mrg case 24:
170 1.1 mrg newprec = 24;
171 1.1 mrg break;
172 1.1 mrg case 32:
173 1.1 mrg newprec = 32;
174 1.1 mrg break;
175 1.1 mrg default:
176 1.1 mrg return (AUDIO_EWAVBADPCM);
177 1.1 mrg }
178 1.1 mrg if (newprec == 8)
179 1.1 mrg newenc = AUDIO_ENCODING_ULINEAR_LE;
180 1.1 mrg else
181 1.1 mrg newenc = AUDIO_ENCODING_SLINEAR_LE;
182 1.1 mrg break;
183 1.1 mrg case WAVE_FORMAT_ALAW:
184 1.1 mrg newenc = AUDIO_ENCODING_ALAW;
185 1.1 mrg newprec = 8;
186 1.1 mrg break;
187 1.1 mrg case WAVE_FORMAT_MULAW:
188 1.1 mrg newenc = AUDIO_ENCODING_ULAW;
189 1.1 mrg newprec = 8;
190 1.1 mrg break;
191 1.1 mrg }
192 1.1 mrg
193 1.1 mrg do {
194 1.1 mrg memcpy(&part, where, sizeof part);
195 1.1 mrg owhere = where;
196 1.1 mrg where += (getle32(part.len) + 8);
197 1.2 mrg } while (where < end && strncmp(part.name, strdata, sizeof strdata));
198 1.1 mrg
199 1.1 mrg if ((where - getle32(part.len)) <= end) {
200 1.1 mrg if (channels)
201 1.7 mrg *channels = (u_int)getle16(fmt.channels);
202 1.1 mrg if (sample)
203 1.1 mrg *sample = getle32(fmt.sample_rate);
204 1.1 mrg if (enc)
205 1.1 mrg *enc = newenc;
206 1.1 mrg if (prec)
207 1.1 mrg *prec = newprec;
208 1.1 mrg if (datasize)
209 1.1 mrg *datasize = (size_t)getle32(part.len);
210 1.1 mrg return (owhere - (char *)hdr + 8);
211 1.1 mrg }
212 1.1 mrg return (AUDIO_EWAVNODATA);
213 1.1 mrg }
214 1.11 mrg
215 1.11 mrg
216 1.11 mrg /*
217 1.11 mrg * prepare a WAV header for writing; we fill in hdrp, lenp and leftp,
218 1.11 mrg * and expect our caller (wav_write_header()) to use them.
219 1.11 mrg */
220 1.11 mrg int
221 1.11 mrg wav_prepare_header(struct write_info *wi, void **hdrp, size_t *lenp, int *leftp)
222 1.11 mrg {
223 1.11 mrg /*
224 1.11 mrg * WAV header we write looks like this:
225 1.11 mrg *
226 1.11 mrg * bytes purpose
227 1.11 mrg * 0-3 "RIFF"
228 1.11 mrg * 4-7 file length (minus 8)
229 1.11 mrg * 8-15 "WAVEfmt "
230 1.11 mrg * 16-19 format size
231 1.11 mrg * 20-21 format tag
232 1.11 mrg * 22-23 number of channels
233 1.11 mrg * 24-27 sample rate
234 1.11 mrg * 28-31 average bytes per second
235 1.11 mrg * 32-33 block alignment
236 1.11 mrg * 34-35 bits per sample
237 1.11 mrg *
238 1.11 mrg * then for ULAW and ALAW outputs, we have an extended chunk size
239 1.11 mrg * and a WAV "fact" to add:
240 1.11 mrg *
241 1.11 mrg * 36-37 length of extension (== 0)
242 1.11 mrg * 38-41 "fact"
243 1.11 mrg * 42-45 fact size
244 1.11 mrg * 46-49 number of samples written
245 1.11 mrg * 50-53 "data"
246 1.11 mrg * 54-57 data length
247 1.11 mrg * 58- raw audio data
248 1.11 mrg *
249 1.11 mrg * for PCM outputs we have just the data remaining:
250 1.11 mrg *
251 1.11 mrg * 36-39 "data"
252 1.11 mrg * 40-43 data length
253 1.11 mrg * 44- raw audio data
254 1.11 mrg *
255 1.11 mrg * RIFF\^@^C^@WAVEfmt ^P^@^@^@^A^@^B^@D<AC>^@^@^P<B1>^B^@^D^@^P^@data^@^@^C^@^@^@^@^@^@^@^@^@^@
256 1.11 mrg */
257 1.11 mrg static char wavheaderbuf[64];
258 1.11 mrg char *p = wavheaderbuf;
259 1.11 mrg const char *riff = "RIFF",
260 1.11 mrg *wavefmt = "WAVEfmt ",
261 1.11 mrg *fact = "fact",
262 1.11 mrg *data = "data";
263 1.11 mrg u_int32_t filelen, fmtsz, sps, abps, factsz = 4, nsample, datalen;
264 1.12 christos u_int16_t fmttag, nchan, align, extln = 0;
265 1.11 mrg
266 1.11 mrg if (wi->header_info)
267 1.11 mrg warnx("header information not supported for WAV");
268 1.11 mrg *leftp = 0;
269 1.11 mrg
270 1.11 mrg switch (wi->precision) {
271 1.11 mrg case 8:
272 1.11 mrg break;
273 1.11 mrg case 16:
274 1.11 mrg break;
275 1.11 mrg case 32:
276 1.11 mrg break;
277 1.11 mrg default:
278 1.11 mrg {
279 1.11 mrg static int warned = 0;
280 1.11 mrg
281 1.11 mrg if (warned == 0) {
282 1.11 mrg warnx("can not support precision of %d", wi->precision);
283 1.11 mrg warned = 1;
284 1.11 mrg }
285 1.11 mrg }
286 1.11 mrg return (-1);
287 1.11 mrg }
288 1.11 mrg
289 1.11 mrg switch (wi->encoding) {
290 1.11 mrg case AUDIO_ENCODING_ULAW:
291 1.11 mrg fmttag = WAVE_FORMAT_MULAW;
292 1.11 mrg fmtsz = 18;
293 1.11 mrg align = wi->channels;
294 1.11 mrg break;
295 1.11 mrg
296 1.11 mrg case AUDIO_ENCODING_ALAW:
297 1.11 mrg fmttag = WAVE_FORMAT_ALAW;
298 1.11 mrg fmtsz = 18;
299 1.11 mrg align = wi->channels;
300 1.11 mrg break;
301 1.11 mrg
302 1.11 mrg /*
303 1.11 mrg * we could try to support RIFX but it seems to be more portable
304 1.11 mrg * to output little-endian data for WAV files.
305 1.11 mrg */
306 1.11 mrg case AUDIO_ENCODING_ULINEAR_BE:
307 1.11 mrg case AUDIO_ENCODING_SLINEAR_BE:
308 1.11 mrg case AUDIO_ENCODING_ULINEAR_LE:
309 1.11 mrg case AUDIO_ENCODING_SLINEAR_LE:
310 1.11 mrg case AUDIO_ENCODING_PCM16:
311 1.11 mrg
312 1.11 mrg #if BYTE_ORDER == LITTLE_ENDIAN
313 1.11 mrg case AUDIO_ENCODING_ULINEAR:
314 1.11 mrg case AUDIO_ENCODING_SLINEAR:
315 1.11 mrg #endif
316 1.11 mrg fmttag = WAVE_FORMAT_PCM;
317 1.11 mrg fmtsz = 16;
318 1.11 mrg align = wi->channels * (wi->precision / 8);
319 1.11 mrg break;
320 1.11 mrg
321 1.11 mrg default:
322 1.11 mrg #if 0 // move into record.c, and maybe merge.c
323 1.11 mrg {
324 1.11 mrg static int warned = 0;
325 1.11 mrg
326 1.11 mrg if (warned == 0) {
327 1.11 mrg const char *s = wav_enc_from_val(wi->encoding);
328 1.11 mrg
329 1.11 mrg if (s == NULL)
330 1.11 mrg warnx("can not support encoding of %s", s);
331 1.11 mrg else
332 1.11 mrg warnx("can not support encoding of %d", wi->encoding);
333 1.11 mrg warned = 1;
334 1.11 mrg }
335 1.11 mrg }
336 1.11 mrg #endif
337 1.11 mrg wi->format = AUDIO_FORMAT_NONE;
338 1.11 mrg return (-1);
339 1.11 mrg }
340 1.11 mrg
341 1.11 mrg nchan = wi->channels;
342 1.11 mrg sps = wi->sample_rate;
343 1.11 mrg
344 1.11 mrg /* data length */
345 1.11 mrg if (wi->outfd == STDOUT_FILENO)
346 1.11 mrg datalen = 0;
347 1.11 mrg else if (wi->total_size != -1)
348 1.11 mrg datalen = wi->total_size;
349 1.11 mrg else
350 1.11 mrg datalen = 0;
351 1.11 mrg
352 1.11 mrg /* file length */
353 1.11 mrg filelen = 4 + (8 + fmtsz) + (8 + datalen);
354 1.11 mrg if (fmttag != WAVE_FORMAT_PCM)
355 1.11 mrg filelen += 8 + factsz;
356 1.11 mrg
357 1.11 mrg abps = (double)align*wi->sample_rate / (double)1 + 0.5;
358 1.11 mrg
359 1.11 mrg nsample = (datalen / wi->precision) / wi->sample_rate;
360 1.11 mrg
361 1.11 mrg /*
362 1.11 mrg * now we've calculated the info, write it out!
363 1.11 mrg */
364 1.11 mrg #define put32(x) do { \
365 1.11 mrg u_int32_t _f; \
366 1.11 mrg putle32(_f, (x)); \
367 1.11 mrg memcpy(p, &_f, 4); \
368 1.11 mrg } while (0)
369 1.11 mrg #define put16(x) do { \
370 1.11 mrg u_int16_t _f; \
371 1.11 mrg putle16(_f, (x)); \
372 1.11 mrg memcpy(p, &_f, 2); \
373 1.11 mrg } while (0)
374 1.11 mrg memcpy(p, riff, 4);
375 1.11 mrg p += 4; /* 4 */
376 1.11 mrg put32(filelen);
377 1.11 mrg p += 4; /* 8 */
378 1.11 mrg memcpy(p, wavefmt, 8);
379 1.11 mrg p += 8; /* 16 */
380 1.11 mrg put32(fmtsz);
381 1.11 mrg p += 4; /* 20 */
382 1.11 mrg put16(fmttag);
383 1.11 mrg p += 2; /* 22 */
384 1.11 mrg put16(nchan);
385 1.11 mrg p += 2; /* 24 */
386 1.11 mrg put32(sps);
387 1.11 mrg p += 4; /* 28 */
388 1.11 mrg put32(abps);
389 1.11 mrg p += 4; /* 32 */
390 1.11 mrg put16(align);
391 1.11 mrg p += 2; /* 34 */
392 1.11 mrg put16(wi->precision);
393 1.11 mrg p += 2; /* 36 */
394 1.11 mrg /* NON PCM formats have an extended chunk; write it */
395 1.11 mrg if (fmttag != WAVE_FORMAT_PCM) {
396 1.11 mrg put16(extln);
397 1.11 mrg p += 2; /* 38 */
398 1.11 mrg memcpy(p, fact, 4);
399 1.11 mrg p += 4; /* 42 */
400 1.11 mrg put32(factsz);
401 1.11 mrg p += 4; /* 46 */
402 1.11 mrg put32(nsample);
403 1.11 mrg p += 4; /* 50 */
404 1.11 mrg }
405 1.11 mrg memcpy(p, data, 4);
406 1.11 mrg p += 4; /* 40/54 */
407 1.11 mrg put32(datalen);
408 1.11 mrg p += 4; /* 44/58 */
409 1.11 mrg #undef put32
410 1.11 mrg #undef put16
411 1.11 mrg
412 1.11 mrg *hdrp = wavheaderbuf;
413 1.11 mrg *lenp = (p - wavheaderbuf);
414 1.11 mrg
415 1.11 mrg return 0;
416 1.11 mrg }
417 1.11 mrg
418 1.11 mrg write_conv_func
419 1.11 mrg wav_write_get_conv_func(struct write_info *wi)
420 1.11 mrg {
421 1.11 mrg write_conv_func conv_func = NULL;
422 1.11 mrg
423 1.11 mrg switch (wi->encoding) {
424 1.11 mrg
425 1.11 mrg /*
426 1.11 mrg * we could try to support RIFX but it seems to be more portable
427 1.11 mrg * to output little-endian data for WAV files.
428 1.11 mrg */
429 1.11 mrg case AUDIO_ENCODING_ULINEAR_BE:
430 1.11 mrg #if BYTE_ORDER == BIG_ENDIAN
431 1.11 mrg case AUDIO_ENCODING_ULINEAR:
432 1.11 mrg #endif
433 1.11 mrg if (wi->precision == 16)
434 1.11 mrg conv_func = change_sign16_swap_bytes_be;
435 1.11 mrg else if (wi->precision == 32)
436 1.11 mrg conv_func = change_sign32_swap_bytes_be;
437 1.11 mrg break;
438 1.11 mrg
439 1.11 mrg case AUDIO_ENCODING_SLINEAR_BE:
440 1.11 mrg #if BYTE_ORDER == BIG_ENDIAN
441 1.11 mrg case AUDIO_ENCODING_SLINEAR:
442 1.11 mrg #endif
443 1.11 mrg if (wi->precision == 8)
444 1.11 mrg conv_func = change_sign8;
445 1.11 mrg else if (wi->precision == 16)
446 1.11 mrg conv_func = swap_bytes;
447 1.11 mrg else if (wi->precision == 32)
448 1.11 mrg conv_func = swap_bytes32;
449 1.11 mrg break;
450 1.11 mrg
451 1.11 mrg case AUDIO_ENCODING_ULINEAR_LE:
452 1.11 mrg #if BYTE_ORDER == LITTLE_ENDIAN
453 1.11 mrg case AUDIO_ENCODING_ULINEAR:
454 1.11 mrg #endif
455 1.11 mrg if (wi->precision == 16)
456 1.11 mrg conv_func = change_sign16_le;
457 1.11 mrg else if (wi->precision == 32)
458 1.11 mrg conv_func = change_sign32_le;
459 1.11 mrg break;
460 1.11 mrg
461 1.11 mrg case AUDIO_ENCODING_SLINEAR_LE:
462 1.11 mrg case AUDIO_ENCODING_PCM16:
463 1.11 mrg #if BYTE_ORDER == LITTLE_ENDIAN
464 1.11 mrg case AUDIO_ENCODING_SLINEAR:
465 1.11 mrg #endif
466 1.11 mrg if (wi->precision == 8)
467 1.11 mrg conv_func = change_sign8;
468 1.11 mrg break;
469 1.11 mrg
470 1.11 mrg default:
471 1.11 mrg wi->format = AUDIO_FORMAT_NONE;
472 1.11 mrg }
473 1.11 mrg
474 1.11 mrg return conv_func;
475 1.11 mrg }
476