• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 /*
2 ** Copyright (C) 2002-2017 Erik de Castro Lopo <erikd@mega-nerd.com>
3 **
4 ** This program is free software; you can redistribute it and/or modify
5 ** it under the terms of the GNU Lesser General Public License as published by
6 ** the Free Software Foundation; either version 2.1 of the License, or
7 ** (at your option) any later version.
8 **
9 ** This program is distributed in the hope that it will be useful,
10 ** but WITHOUT ANY WARRANTY; without even the implied warranty of
11 ** MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
12 ** GNU Lesser General Public License for more details.
13 **
14 ** You should have received a copy of the GNU Lesser General Public License
15 ** along with this program; if not, write to the Free Software
16 ** Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
17 */
18 
19 #include	"sfconfig.h"
20 
21 #include	<stdio.h>
22 #include	<fcntl.h>
23 #include	<string.h>
24 #include	<ctype.h>
25 
26 #include	"sndfile.h"
27 #include	"sfendian.h"
28 #include	"common.h"
29 
30 /*------------------------------------------------------------------------------
31 ** Macros to handle big/little endian issues.
32 */
33 
34 #define	SFE_HTK_BAD_FILE_LEN 	1666
35 #define	SFE_HTK_NOT_WAVEFORM	1667
36 
37 /*------------------------------------------------------------------------------
38 ** Private static functions.
39 */
40 
41 static	int		htk_close		(SF_PRIVATE *psf) ;
42 
43 static int		htk_write_header (SF_PRIVATE *psf, int calc_length) ;
44 static int		htk_read_header (SF_PRIVATE *psf) ;
45 
46 /*------------------------------------------------------------------------------
47 ** Public function.
48 */
49 
50 int
htk_open(SF_PRIVATE * psf)51 htk_open	(SF_PRIVATE *psf)
52 {	int		subformat ;
53 	int		error = 0 ;
54 
55 	if (psf->is_pipe)
56 		return SFE_HTK_NO_PIPE ;
57 
58 	if (psf->file.mode == SFM_READ || (psf->file.mode == SFM_RDWR && psf->filelength > 0))
59 	{	if ((error = htk_read_header (psf)))
60 			return error ;
61 		} ;
62 
63 	subformat = SF_CODEC (psf->sf.format) ;
64 
65 	if (psf->file.mode == SFM_WRITE || psf->file.mode == SFM_RDWR)
66 	{	if ((SF_CONTAINER (psf->sf.format)) != SF_FORMAT_HTK)
67 			return	SFE_BAD_OPEN_FORMAT ;
68 
69 		psf->endian = SF_ENDIAN_BIG ;
70 
71 		if (htk_write_header (psf, SF_FALSE))
72 			return psf->error ;
73 
74 		psf->write_header = htk_write_header ;
75 		} ;
76 
77 	psf->container_close = htk_close ;
78 
79 	psf->blockwidth = psf->bytewidth * psf->sf.channels ;
80 
81 	switch (subformat)
82 	{	case SF_FORMAT_PCM_16 :	/* 16-bit linear PCM. */
83 				error = pcm_init (psf) ;
84 				break ;
85 
86 		default : break ;
87 		} ;
88 
89 	return error ;
90 } /* htk_open */
91 
92 /*------------------------------------------------------------------------------
93 */
94 
95 static int
htk_close(SF_PRIVATE * psf)96 htk_close	(SF_PRIVATE *psf)
97 {
98 	if (psf->file.mode == SFM_WRITE || psf->file.mode == SFM_RDWR)
99 		htk_write_header (psf, SF_TRUE) ;
100 
101 	return 0 ;
102 } /* htk_close */
103 
104 static int
htk_write_header(SF_PRIVATE * psf,int calc_length)105 htk_write_header (SF_PRIVATE *psf, int calc_length)
106 {	sf_count_t	current ;
107 	int			sample_count, sample_period ;
108 
109 	current = psf_ftell (psf) ;
110 
111 	if (calc_length)
112 		psf->filelength = psf_get_filelen (psf) ;
113 
114 	/* Reset the current header length to zero. */
115 	psf->header.ptr [0] = 0 ;
116 	psf->header.indx = 0 ;
117 	psf_fseek (psf, 0, SEEK_SET) ;
118 
119 	if (psf->filelength > 12)
120 		sample_count = (psf->filelength - 12) / 2 ;
121 	else
122 		sample_count = 0 ;
123 
124 	sample_period = 10000000 / psf->sf.samplerate ;
125 
126 	psf_binheader_writef (psf, "E444", BHW4 (sample_count), BHW4 (sample_period), BHW4 (0x20000)) ;
127 
128 	/* Header construction complete so write it out. */
129 	psf_fwrite (psf->header.ptr, psf->header.indx, 1, psf) ;
130 
131 	if (psf->error)
132 		return psf->error ;
133 
134 	psf->dataoffset = psf->header.indx ;
135 
136 	if (current > 0)
137 		psf_fseek (psf, current, SEEK_SET) ;
138 
139 	return psf->error ;
140 } /* htk_write_header */
141 
142 /*
143 ** Found the following info in a comment block within Bill Schottstaedt's
144 ** sndlib library.
145 **
146 ** HTK format files consist of a contiguous sequence of samples preceded by a
147 ** header. Each sample is a vector of either 2-byte integers or 4-byte floats.
148 ** 2-byte integers are used for compressed forms as described below and for
149 ** vector quantised data as described later in section 5.11. HTK format data
150 ** files can also be used to store speech waveforms as described in section 5.8.
151 **
152 ** The HTK file format header is 12 bytes long and contains the following data
153 **   nSamples   -- number of samples in file (4-byte integer)
154 **   sampPeriod -- sample period in 100ns units (4-byte integer)
155 **   sampSize   -- number of bytes per sample (2-byte integer)
156 **   parmKind   -- a code indicating the sample kind (2-byte integer)
157 **
158 ** The parameter kind  consists of a 6 bit code representing the basic
159 ** parameter kind plus additional bits for each of the possible qualifiers.
160 ** The basic parameter kind codes are
161 **
162 **  0    WAVEFORM    sampled waveform
163 **  1    LPC         linear prediction filter coefficients
164 **  2    LPREFC      linear prediction reflection coefficients
165 **  3    LPCEPSTRA   LPC cepstral coefficients
166 **  4    LPDELCEP    LPC cepstra plus delta coefficients
167 **  5    IREFC       LPC reflection coef in 16 bit integer format
168 **  6    MFCC        mel-frequency cepstral coefficients
169 **  7    FBANK       log mel-filter bank channel outputs
170 **  8    MELSPEC     linear mel-filter bank channel outputs
171 **  9    USER        user defined sample kind
172 **  10   DISCRETE    vector quantised data
173 **
174 ** and the bit-encoding for the qualifiers (in octal) is
175 **   _E   000100      has energy
176 **   _N   000200      absolute energy suppressed
177 **   _D   000400      has delta coefficients
178 **   _A   001000      has acceleration coefficients
179 **   _C   002000      is compressed
180 **   _Z   004000      has zero mean static coef.
181 **   _K   010000      has CRC checksum
182 **   _O   020000      has 0'th cepstral coef.
183 */
184 
185 static int
htk_read_header(SF_PRIVATE * psf)186 htk_read_header (SF_PRIVATE *psf)
187 {	int		sample_count, sample_period, marker ;
188 
189 	psf_binheader_readf (psf, "pE444", 0, &sample_count, &sample_period, &marker) ;
190 
191 	if (2 * sample_count + 12 != psf->filelength)
192 		return SFE_HTK_BAD_FILE_LEN ;
193 
194 	if (marker != 0x20000)
195 		return SFE_HTK_NOT_WAVEFORM ;
196 
197 	psf->sf.channels = 1 ;
198 
199 	if (sample_period > 0)
200 	{	psf->sf.samplerate = 10000000 / sample_period ;
201 		psf_log_printf (psf, "HTK Waveform file\n  Sample Count  : %d\n  Sample Period : %d => %d Hz\n",
202 					sample_count, sample_period, psf->sf.samplerate) ;
203 		}
204 	else
205 	{	psf->sf.samplerate = 16000 ;
206 		psf_log_printf (psf, "HTK Waveform file\n  Sample Count  : %d\n  Sample Period : %d (should be > 0) => Guessed sample rate %d Hz\n",
207 					sample_count, sample_period, psf->sf.samplerate) ;
208 		} ;
209 
210 	psf->sf.format = SF_FORMAT_HTK | SF_FORMAT_PCM_16 ;
211 	psf->bytewidth = 2 ;
212 
213 	/* HTK always has a 12 byte header. */
214 	psf->dataoffset = 12 ;
215 	psf->endian = SF_ENDIAN_BIG ;
216 
217 	psf->datalength = psf->filelength - psf->dataoffset ;
218 
219 	psf->blockwidth = psf->sf.channels * psf->bytewidth ;
220 
221 	if (! psf->sf.frames && psf->blockwidth)
222 		psf->sf.frames = (psf->filelength - psf->dataoffset) / psf->blockwidth ;
223 
224 	return 0 ;
225 } /* htk_read_header */
226 
227