forked from mjc14/beamforming
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathapply-delay-and-sum.cc
98 lines (80 loc) · 3.16 KB
/
apply-delay-and-sum.cc
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
/* Created on 2016-08-16
* Author: Zhang Binbin
*/
#include <stdio.h>
#include "wav.h"
#include "tdoa.h"
#include "ds.h"
#include "parse-option.h"
int main(int argc, char *argv[]) {
const char *usage = "Do delay and sum beamforming\n"
"Usage: apply-delay-and-sum multi_channel_file output_file\n";
ParseOptions po(usage);
int tdoa_window = 4000;
po.Register("tdoa-window", &tdoa_window,
"window size for estimated tdoa, in sample point");
int beam_window = 4000;
po.Register("beam-window", &beam_window,
"window size for delay and sum, less than tdoa-window, in sample point");
int margin = 16;
po.Register("margin", &margin,
"constraint for tdoa estimation");
po.Read(argc, argv);
if (po.NumArgs() != 2) {
po.PrintUsage();
exit(1);
}
std::string input_file = po.GetArg(1),
output_file = po.GetArg(2);
WavReader wav_reader(input_file.c_str());
printf("input file %s info: \n"
"sample_rate %d \n"
"channels %d \n"
"bits_per_sample_ %d \n",
input_file.c_str(),
wav_reader.SampleRate(),
wav_reader.NumChannel(),
wav_reader.BitsPerSample());
int num_channel = wav_reader.NumChannel();
int num_sample = wav_reader.NumSample();
const float *pcm = wav_reader.Data();
float *out_pcm = (float *)calloc(sizeof(float), num_sample);
int *tdoa = (int *)calloc(sizeof(int), num_channel);
for (int i = 0; i < num_sample; i += beam_window) {
int tdoa_window_size = (i + tdoa_window > num_sample) ?
num_sample - i : tdoa_window;
int beam_window_size = (i + beam_window > num_sample) ?
num_sample - i : beam_window;
assert(beam_window_size <= tdoa_window_size);
// rearrange channel data
float *data = (float *)calloc(sizeof(float),
tdoa_window_size * num_channel);
float *beam_data = (float *)calloc(sizeof(float),
beam_window_size * num_channel);
for (int j = 0; j < num_channel; j++) {
for (int k = 0; k < tdoa_window_size; k++) {
data[j * tdoa_window_size + k] = pcm[(i + k) * num_channel + j];
}
for (int k = 0; k < beam_window_size; k++) {
beam_data[j * beam_window_size + k] = pcm[(i + k) * num_channel + j];
}
}
// calc delay
int tao = margin < tdoa_window_size / 2 ? margin : tdoa_window_size / 2;
GccPhatTdoa(data, num_channel, tdoa_window_size, 0, tao, tdoa);
for (int j = 0; j < num_channel; j++) {
printf("%d ", tdoa[j]);
}
printf("\n");
DelayAndSum(beam_data, num_channel, beam_window_size, tdoa, out_pcm + i);
free(data);
free(beam_data);
}
// Write outfile
WavWriter wav_writer(out_pcm, num_sample, 1,
wav_reader.SampleRate(), wav_reader.BitsPerSample());
wav_writer.Write(output_file.c_str());
free(out_pcm);
free(tdoa);
return 0;
}