-
Notifications
You must be signed in to change notification settings - Fork 108
/
Copy pathaudio_convert.h
193 lines (185 loc) · 5.03 KB
/
audio_convert.h
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
#ifndef AUDIO_CONVERT_H
#define AUDIO_CONVERT_H
#include <string.h>
#include <string>
#include <stdlib.h>
#include <vorbis/codec.h>
#include <vorbis/vorbisenc.h>
#if HAVE_LIBSAMPLERATE
#include <samplerate.h>
#endif
#include "endian.h"
#include "bswap.h"
class cAudioConvert {
public:
enum eSrcDstType {
_src,
_dst
};
enum eFormatType {
_format_raw,
_format_wav,
_format_ogg
};
enum eResult {
_rslt_ok,
_rslt_write_failed,
_rslt_open_for_read_failed,
_rslt_open_for_write_failed,
_rslt_wav_read_header_failed,
_rslt_wav_bad_header,
_rslt_ogg_bad_ogg_file,
_rslt_ogg_bad_bitstream,
_rslt_ogg_bad_first_page,
_rslt_ogg_bad_initial_header_packet,
_rslt_ogg_missing_vorbis_audiodata,
_rslt_ogg_corrupt_secondary_header,
_rslt_ogg_missing_vorbis_headers,
_rslt_ogg_failed_encode_initialization,
_rslt_failed_libsamplerate_init,
_rslt_failed_libsamplerate_process,
_rslt_unknown_format,
_rslt_no_library_needed
};
struct sAudioInfo {
sAudioInfo() {
memset(this, 0, sizeof(*this));
}
u_int32_t sampleRate;
u_int16_t channels;
u_int16_t bitsPerSample;
} __attribute__((packed));
struct sWavHeader {
void null() {
memset(this, 0, sizeof(*this));
}
void init() {
#if __GNUC__ >= 8
#pragma GCC diagnostic push
#pragma GCC diagnostic ignored "-Wstringop-truncation"
#endif
strncpy(formatId1, "RIFF", 4);
chunkSize = 0;
strncpy(formatId2, "WAVEfmt ", 8);
lengthFormatData = 16;
format = 1;
strncpy(dataId, "data", 4);
dataSize = 0;
#if __GNUC__ >= 8
#pragma GCC diagnostic pop
#endif
}
void setFromAudioInfo(sAudioInfo *audioInfo) {
channels = audioInfo->channels;
sampleRate = audioInfo->sampleRate;
byteRate = audioInfo->sampleRate * audioInfo->channels * audioInfo->bitsPerSample / 8;
bytesPerSample = audioInfo->channels * audioInfo->bitsPerSample / 8;
bitsPerSampleChannel = audioInfo->bitsPerSample;
}
void setAudioInfo(sAudioInfo *audioInfo) {
audioInfo->channels = channels;
audioInfo->sampleRate = sampleRate;
audioInfo->bitsPerSample = bitsPerSampleChannel;
}
void setFileSize(long int fileSize) {
dataSize = fileSize - sizeof(sWavHeader);
chunkSize = fileSize - 8;
}
void prepareAfterRead() {
prepareEndian();
}
void prepareBeforeWrite() {
prepareEndian();
}
void prepareEndian();
bool checkHeader() {
return(!strncmp(formatId1, "RIFF", 4));
}
char formatId1[4];
u_int32_t chunkSize;
char formatId2[8];
u_int32_t lengthFormatData; // size of above
u_int16_t format; // 1 as PCM
u_int16_t channels;
u_int32_t sampleRate;
u_int32_t byteRate;
u_int16_t bytesPerSample;
u_int16_t bitsPerSampleChannel;
char dataId[4];
u_int32_t dataSize;
} __attribute__((packed));
struct sOgg {
sOgg() {
memset(this, 0, sizeof(*this));
}
~sOgg() {
ogg_stream_clear(&os);
vorbis_block_clear(&vb);
vorbis_dsp_clear(&vd);
vorbis_comment_clear(&vc);
vorbis_info_clear(&vi);
}
ogg_sync_state oy; /* sync and verify incoming physical bitstream */
ogg_stream_state os; /* take physical pages, weld into a logical stream of packets */
ogg_page og; /* one Ogg bitstream page. Vorbis packets are inside */
ogg_packet op; /* one raw packet of data for decode */
vorbis_info vi; /* struct that stores all the static vorbis bitstream settings */
vorbis_comment vc; /* struct that stores all the bitstream user comments */
vorbis_dsp_state vd; /* central working state for the packet->PCM decoder */
vorbis_block vb; /* local working space for packet->PCM decode */
int eos;
};
struct sOggDecode {
sOggDecode(unsigned sync_buffer_size) {
memset(this, 0, sizeof(*this));
this->sync_buffer_size = sync_buffer_size;
}
~sOggDecode() {
if(conv_buffer) {
delete [] conv_buffer;
}
}
unsigned sync_buffer_size;
char *sync_buffer;
ogg_int16_t *conv_buffer;
};
public:
cAudioConvert();
~cAudioConvert();
eResult getAudioInfo();
std::string jsonAudioInfo();
eResult readRaw(sAudioInfo *audioInfo);
eResult resampleRaw(sAudioInfo *audioInfo, const char *fileNameDst, unsigned sampleRateDst);
eResult readWav();
eResult loadWav(u_char **data, size_t *samples, bool pcm_float = false);
bool readWavHeader(sWavHeader *wavHeader);
eResult writeWavHeader(long int size = 0);
eResult writeWavData(u_char *data, unsigned datalen);
eResult writeWavEnd();
eResult readOgg();
eResult writeOggHeader();
eResult writeOggData(u_char *data, unsigned datalen);
eResult writeOggEnd();
eResult _writeOgg();
eResult write(u_char *data, unsigned datalen);
bool open();
bool open_for_write();
void close();
void linear_resample(int16_t* input, int16_t* output, int input_len, double ratio, int channels);
static std::string getRsltStr(eResult rslt);
void test();
public:
eSrcDstType srcDstType;
eFormatType formatType;
std::string fileName;
FILE *fileHandle;
cAudioConvert *destAudio;
sAudioInfo audioInfo;
float oggQuality;
std::string comment;
sOgg ogg;
bool headerIsWrited;
bool onlyGetAudioInfo;
unsigned resample_chunk_length;
};
#endif //AUDIO_CONVERT_H