-
Notifications
You must be signed in to change notification settings - Fork 3
/
Copy pathenhance.c
executable file
·358 lines (287 loc) · 14.2 KB
/
enhance.c
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
/******************************************************
DEPARTMENT OF ELECTRICAL AND ELECTRONIC ENGINEERING
IMPERIAL COLLEGE LONDON
EE 3.19: Real Time Digital Signal Processing
Dr Paul Mitcheson and Daniel Harvey
PROJECT: Frame Processing
********* ENHANCE. C **********
Shell for speech enhancement
Demonstrates overlap-add frame processing (interrupt driven) on the DSK.
/*
* You should modify the code so that a speech enhancement project is built
* on top of this template.
*/
/**************************** Pre-processor statements ******************************/
// library required when using calloc
#include <stdlib.h>
// Included so program can make use of DSP/BIOS configuration tool.
#include "dsp_bios_cfg.h"
/* The file dsk6713.h must be included in every program that uses the BSL. This
example also includes dsk6713_aic23.h because it uses the
AIC23 codec module (audio interface). */
#include "dsk6713.h"
#include "dsk6713_aic23.h"
// math library (trig functions)
#include <math.h>
/* Some functions to help with Complex algebra and FFT. */
#include "cmplx.h"
#include "fft_functions.h"
// Some functions to help with writing/reading the audio ports when using interrupts.
#include <helper_functions_ISR.h>
#define WINCONST 0.85185 /* 0.46/0.54 for Hamming window */
#define FSAMP 8000.0 /* sample frequency, ensure this matches Config for AIC */
#define FFTLEN 256 /* fft length = frame length 256/8000 = 32 ms*/
#define NFREQ (1+FFTLEN/2) /* number of frequency bins from a real FFT */
#define OVERSAMP 4 /* oversampling ratio (2 or 4) */
#define FRAMEINC (FFTLEN/OVERSAMP) /* Frame increment */
#define CIRCBUF (FFTLEN+FRAMEINC) /* length of k/O buffers */
#define OUTGAIN 16000.0 /* Output gain for DAC */
#define INGAIN (1.0/16000.0) /* Input gain for ADC */
#define PI 3.141592653589793
#define TFRAME FRAMEINC/FSAMP /* time between calculation of each frame */
/******************************* Global declarations ********************************/
/* Audio port configuration settings: these values set registers in the AIC23 audio
interface to configure it. See TI doc SLWS106D 3-3 to 3-10 for more info. */
DSK6713_AIC23_Config Config = { \
/**********************************************************************/
/* REGISTER FUNCTION SETTINGS */
/**********************************************************************/\
0x0017, /* 0 LEFTINVOL Left line input channel volume 0dB */\
0x0017, /* 1 RIGHTINVOL Right line input channel volume 0dB */\
0x01f9, /* 2 LEFTHPVOL Left channel headphone volume 0dB */\
0x01f9, /* 3 RIGHTHPVOL Right channel headphone volume 0dB */\
0x0011, /* 4 ANAPATH Analog audio path control DAC on, Mic boost 20dB*/\
0x0000, /* 5 DIGPATH Digital audio path control All Filters off */\
0x0000, /* 6 DPOWERDOWN Power down control All Hardware on */\
0x0043, /* 7 DIGIF Digital audio interface format 16 bit */\
0x008d, /* 8 SAMPLERATE Sample rate control 8 KHZ-ensure matches FSAMP */\
0x0001 /* 9 DIGACT Digital interface activation On */\
/**********************************************************************/
};
// Codec handle:- a variable used to identify audio interface
DSK6713_AIC23_CodecHandle H_Codec;
float *inbuffer, *outbuffer; /* Input/output circular buffers */
float *inframe, *outframe; /* Input and output frames */
float *inwin, *outwin; /* Input and output windows */
/************* Array Declarations ************/
float *X_magnitude; /* Magnitude spectrum */
float *low_pass_noise,*low_pass_noise_prev; /* Low pass noise estimate array */
float *noise_estimate; /* Noise estimate array */
float *M1, *M2, *M3, *M4; /* 2.5 sec buffers to find minimum noise amp */
float *Pt_prev,*Pt; /* Low pass filtered input */
complex *intermediate; /* Complex array to perform FFT/IFFT calculations */
/**********************************************/
float ingain, outgain; /* ADC and DAC gains */
float cpufrac; /* Fraction of CPU time used */
/********** Constant Declarations *******************/
float g; /* Frequency dependent gain factor */
float kappa_4; /* Low pass filter constant */
float kappa_noise; /* constant for enhancement 3 */
float tau = 0.08; /* Time constant */
float alpha = 3.0; /* Alpha factor */
float lambda = 0.0003; /* Lambda value */
float tau_noise = 0.08; /* Time constant for enhancement 3*/
float ROTATE_TIME = 2; /* Parameter to control rotation of frames */
/*********************************************/
volatile int io_ptr=0; /* Input/ouput pointer for circular buffers */
volatile int frame_ptr=0; /* Frame pointer */
volatile int f_index=-1; /* Counts until 312 corresponding to 2.5 secs*/
/******************************* Function prototypes *******************************/
void init_hardware(void); /* Initialize codec */
void init_HWI(void); /* Initialize hardware interrupts */
void ISR_AIC(void); /* Interrupt service routine for codec */
void process_frame(void); /* Frame processing routine */
float find_min(float a, float b); /* Minimum function*/
float find_max(float a, float b); /* Maximum function*/
/********************************** Main routine ************************************/
void main()
{
int k; // used in various for loops
/* Initialize and zero fill arrays */
inbuffer = (float *) calloc(CIRCBUF, sizeof(float)); /* Input array */
outbuffer = (float *) calloc(CIRCBUF, sizeof(float)); /* Output array */
inframe = (float *) calloc(FFTLEN, sizeof(float)); /* Array for processing*/
outframe = (float *) calloc(FFTLEN, sizeof(float)); /* Array for processing*/
inwin = (float *) calloc(FFTLEN, sizeof(float)); /* Input window */
outwin = (float *) calloc(FFTLEN, sizeof(float)); /* Output window */
M1 = (float *) calloc(NFREQ, sizeof(float)); /* M1 */
M2 = (float *) calloc(NFREQ, sizeof(float)); /* M2 */
M3 = (float *) calloc(NFREQ, sizeof(float)); /* M3 */
M4 = (float *) calloc(NFREQ, sizeof(float)); /* M4 */
Pt = (float *) calloc(NFREQ, sizeof(float)); /* P(t) */
Pt_prev = (float *) calloc(NFREQ, sizeof(float)); /* P(t-1) */
X_magnitude = (float *) calloc(NFREQ, sizeof(float)); /* Magnitude spectrum */
noise_estimate = (float *) calloc(NFREQ, sizeof(float)); /* Noise estimate array */
low_pass_noise = (float *) calloc(NFREQ, sizeof(float)); /* Low pass noise estimate */
low_pass_noise_prev = (float *) calloc(NFREQ, sizeof(float)); /* Previous low pass noise estimate */
intermediate = (complex *) calloc(FFTLEN, sizeof(complex)); /* Complex buffer */
/* initialize board and the audio port */
init_hardware();
/* initialize hardware interrupts */
init_HWI();
/* initialize algorithm constants */
for (k=0;k<FFTLEN;k++)
{
inwin[k] = sqrt((1.0-WINCONST*cos(PI*(2*k+1)/FFTLEN))/OVERSAMP);
outwin[k] = inwin[k];
}
ingain=INGAIN;
outgain=OUTGAIN;
/* Calculate kappa constants */
kappa_4 = exp((double)(-(TFRAME)/tau));
kappa_noise = exp((double)(-(TFRAME)/tau_noise));
/* main loop, wait for interrupt */
while(1) process_frame();
}
/********************************** init_hardware() *********************************/
void init_hardware()
{
// Initialize the board support library, must be called first
DSK6713_init();
// Start the AIC23 codec using the settings defined above in config
H_Codec = DSK6713_AIC23_openCodec(0, &Config);
/* Function below sets the number of bits in word used by MSBSP (serial port) for
receives from AIC23 (audio port). We are using a 32 bit packet containing two
16 bit numbers hence 32BIT is set for receive */
MCBSP_FSETS(RCR1, RWDLEN1, 32BIT);
/* Configures interrupt to activate on each consecutive available 32 bits
from Audio port hence an interrupt is generated for each L & R sample pair */
MCBSP_FSETS(SPCR1, RINTM, FRM);
/* These commands do the same thing as above but applied to data transfers to the
audio port */
MCBSP_FSETS(XCR1, XWDLEN1, 32BIT);
MCBSP_FSETS(SPCR1, XINTM, FRM);
}
/********************************** init_HWI() **************************************/
void init_HWI(void)
{
IRQ_globalDisable(); // Globally disables interrupts
IRQ_nmiEnable(); // Enables the NMI interrupt (used by the debugger)
IRQ_map(IRQ_EVT_RINT1,4); // Maps an event to a physical interrupt
IRQ_enable(IRQ_EVT_RINT1); // Enables the event
IRQ_globalEnable(); // Globally enables interrupts
}
/******************************** process_frame() ***********************************/
void process_frame(void)
{
int k, m; /* used for loop counters */
int io_ptr0;
float *tmp_M4; /* used for buffer rotation */
float global_min; /* variable to hold the min out of all frames */
/* work out fraction of available CPU time used by algorithm */
cpufrac = ((float) (io_ptr & (FRAMEINC - 1)))/FRAMEINC;
/* wait until io_ptr is at the start of the current frame */
while((io_ptr/FRAMEINC) != frame_ptr);
/* then increment the framecount (wrapping if required) */
if (++frame_ptr >= (CIRCBUF/FRAMEINC)) frame_ptr=0;
/* Check for time condition and rotate buffers when necessary */
if (++f_index > (ROTATE_TIME/FRAMEINC*FSAMP)){
f_index = 0;
tmp_M4 = M4;
M4 = M3;
M3 = M2;
M2 = M1;
M1 = tmp_M4;
}
/* save a pointer to the position in the k/O buffers (inbuffer/outbuffer) where the
data should be read (inbuffer) and saved (outbuffer) for the purpose of processing */
io_ptr0=frame_ptr * FRAMEINC;
/* copy input data from inbuffer into inframe (starting from the pointer position) */
m=io_ptr0;
for (k=0;k<FFTLEN;k++)
{
inframe[k] = inbuffer[m] * inwin[k];
intermediate[k] = cmplx(inframe[k],0); /* store input to a complex form in order to calculate FFT */
if (++m >= CIRCBUF) m=0; /* wrap if required */
}
/************************* DO PROCESSING OF FRAME HERE **************************/
/* Perform FFT over the intermediate array */
fft(FFTLEN,intermediate);
/* Calculate the magnitude spectrum of the input signal |X(w)| */
/* loop over the number of frequency bins */
for (k = 0; k < NFREQ; k++)
{
X_magnitude[k] = cabs(intermediate[k]);
/* Enhancement 2: Low pass filtering in the power domain (Low pass filter version of X|(w)|^2) */
Pt[k] = sqrt(((1-kappa_4)*(X_magnitude[k]*X_magnitude[k]) + kappa_4*Pt_prev[k]*Pt_prev[k]));
}
/*Estimate the noise spectrum */
for (k = 0; k < NFREQ; k++)
{
if (f_index == 0){
M1[k] = Pt[k];
}
else{
M1[k] = find_min(M1[k], Pt[k]);
}
/* Find the minimum out of all Mi */
global_min = find_min( find_min(M1[k], M2[k]), find_min(M3[k], M4[k]) );
noise_estimate[k] = alpha*global_min; /* estimate the noise spectrum */
/* Enhancement 3: Low pass the calculated noise estimate */
low_pass_noise[k] = (1-kappa_noise)*noise_estimate[k] + kappa_noise*low_pass_noise_prev[k];
}
/* Subtract the noise spectrum */
for (k = 0; k < NFREQ; k++)
{
/* Enhancement 4 - Mode 3 */
g = find_max(lambda*(low_pass_noise[k]/Pt[k]), (1-(low_pass_noise[k]/Pt[k])));
/* Zero-phase filtering, subtract the noise spectrum */
intermediate[k] = rmul(g, intermediate[k]); /* Output NFREQ samples */
/* Symmetry of FFT to output rest/symmetrical samples */
intermediate[FFTLEN - k].r = intermediate[k].r;
intermediate[FFTLEN - k].i =- intermediate[k].i;
}
/* Update previous versions of arrays */
low_pass_noise_prev = low_pass_noise;
Pt_prev = Pt;
/* Perform inverse FFT */
ifft(FFTLEN,intermediate);
/* Write the filtered from noise signal to the output frame */
for (k = 0; k < FFTLEN; k++)
{
outframe[k]=intermediate[k].r;
}
/********************************************************************************/
/* multiply outframe by output window and overlap-add into output buffer */
m=io_ptr0;
/* this loop adds into outbuffer */
for (k=0;k<(FFTLEN-FRAMEINC);k++)
{
outbuffer[m] = outbuffer[m]+outframe[k]*outwin[k];
if (++m >= CIRCBUF) m=0; /* wrap if required */
}
/* this loop over-writes outbuffer */
for (;k<FFTLEN;k++)
{
outbuffer[m] = outframe[k]*outwin[k];
m++;
}
}
/*************************** INTERRUPT SERVICE ROUTINE *****************************/
/* Map this to the appropriate interrupt in the CDB file */
void ISR_AIC(void)
{
short sample;
/* Read and write the ADC and DAC using inbuffer and outbuffer */
sample = mono_read_16Bit();
inbuffer[io_ptr] = ((float)sample)*ingain;
/* write new output data */
mono_write_16Bit((int)(outbuffer[io_ptr]*outgain));
/* update io_ptr and check for buffer wraparound */
if (++io_ptr >= CIRCBUF) io_ptr=0;
}
/************************************************************************************/
/* Function to calculate the minimum between the two input arguments */
float find_min(float a, float b){
if (a > b)
return b;
else
return a;
}
/* Function to calculate the maximum between the two input arguments */
float find_max(float a, float b){
if (a > b)
return a;
else
return b;
}