-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathdecoder.cpp
185 lines (156 loc) · 5.08 KB
/
decoder.cpp
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
/*
* decoder.cpp
* read a file and compress using rangemapper by bits
*
Created by Zhiying Wang June 2014
Modified by Vida Ravanmehr Nov. 2016
*/
int decoder(char * argv[]) {
char FileName[400];//name of processed Wig file
char Type[40];
char T[40];
strcpy(FileName, argv[1]);
char tmpFileName[400];
//parameters that can be changed for testing
//the RANGE_SIZE_IN_BITS depends on your alphabet size
int alphabet_size;//256; //Please notice the size of the alphabet.
//int data_size;// = 39432012;
int RANGE_SIZE_IN_BITS=30;
//ranges_in_bits<32, it cannot be more than sizeof(int), which is 4 bytes=32 bits, otherwise makeRanges does not work
//range_in_bits is the number of bits used to represent the probabilities
// L=64-range_in_bits is the number of bits used to store the current range of low and high
//Need for any probability p of a symbol, p>= 1/2^(L-3). So L-3>=range_in_bits, or range_in_bits<=30
//int *data;
//double entropy;
//int expected_size;
//int cm_size;
int *cm;
//int actual_size;
//bool isOK;
//int i=0;
//int j=0;
//long int underflow; //count number of times low and high are too close
float totaltime=0;
//write to summary result file
FILE *fpResult=fopen("result","a");
if (fpResult == NULL) {
fprintf(stderr,"Can't open output result file!\n");
exit(1);
}
//start decoding
fprintf(fpResult,"====================\ndecoder.cpp start!\n");
for (int type=0; type<=2; type++){
if (type==0){
strcpy(Type,"DiffLocSeqMatlab1");
strcpy(T,"DiffLoc1");
//alphabet_size = 6134;
}
else if (type==1)
{
strcpy(Type,"DiffLocSeqMatlab2");
strcpy(T,"DiffLoc2");
//alphabet_size = 6134;
}
else
{
strcpy(Type,"DiffValSeqMatlab");
strcpy(T,"DiffVal");
//alphabet_size = 67955;
}
alphabet_size = 0;
//data_size=100000000;
//data = (int*)malloc(data_size * sizeof(int));
//decode
clock_t start_decoding = clock();
//read g_buffer from file
strcpy(tmpFileName,FileName);
strcat(tmpFileName,Type);
strcat(tmpFileName,"Code");
FILE *fpCode = fopen(tmpFileName, "rb");
if (fpCode == NULL) {
fprintf(stderr, "Can't open file %s!\n",tmpFileName);
exit(1);
}
//long int FileSize;
long int buffer_size;
fseek(fpCode, 0L, SEEK_END);
buffer_size = ftell(fpCode);
rewind(fpCode);
g_buffer = (unsigned char*)malloc(buffer_size);
if (g_buffer == NULL){
printf("Error! Allocation was not successful. \n");
exit(1);
}
fread(g_buffer,1,buffer_size,fpCode);
/*for (j=0; j<10; j++)
printf("%hhX ",g_buffer[j]);
printf("\nabove is g_buffer from file\n");
printf("actual_size %d and FileSize %ld\n", actual_size, FileSize);*/
//load count table file
strcpy(tmpFileName,FileName);
strcat(tmpFileName,T);
FILE *fpDiff = fopen(tmpFileName, "r");
if (fpDiff == NULL) {
fprintf(stderr, "Can't open file %s!\n",tmpFileName);
exit(1);
}
absize_txt(&alphabet_size, fpDiff);
cm = (int*)malloc((alphabet_size+2)*sizeof(int));
if (cm == NULL){
printf("Error! Allocation was not successful. \n");
exit(1);
}
makeRanges_txt(cm, alphabet_size, RANGE_SIZE_IN_BITS,fpDiff);
fclose(fpDiff);
//write index to a file
strcpy(tmpFileName,FileName);
strcat(tmpFileName,Type);
strcat(tmpFileName,"Decode");
FILE *fpDecode = fopen(tmpFileName, "w+");
if (fpDecode == NULL) {
fprintf(stderr, "Can't open file %s!\n",tmpFileName);
exit(1);
}
RangeMapper* rm_decode = new RangeMapper(RANGE_SIZE_IN_BITS);
current_byte = 0;
TMPREAD_COUNT = 0;
TMPREAD = 0x00;
rm_decode->init();
//printf("Begin to decode.\ndata[0]=%d,data[1]=%d,data[data_size-1]=%d\n",data[0],data[1],data[data_size-1]);
while (current_byte<buffer_size+1) {
int midpoint = rm_decode->getMidPoint();
//next is binary search algorithm that does not need having lookup array
int index = findInterval(cm, alphabet_size + 2, midpoint);
// printf("midpoint=%d,index=%d\n",midpoint,index);
if (index == alphabet_size){
/* ///////for test the tail of the code
int tmpbitcount=0;
printf("Finished! TMPWRITE_COUNT is %hhX\n",TMPWRITE_COUNT);
while (current_byte<actual_size){
readBit();
tmpbitcount++;
}
printf("tail bit number is %d\n",tmpbitcount);
///////for test the tail of the code
*/ break; //end of data marker
}
fprintf(fpDecode,"%d ",index);
rm_decode->decodeRange(cm[index], cm[index+1]);
}
delete rm_decode;
//if (lookup) free(lookup);
clock_t end_decoding = clock();
//end decoding
//write to summary result file
fprintf(fpResult,"\n\n//decoder.cpp//File is %s%s\n", FileName, Type);
fprintf(fpResult,"Time for decoding %2.3f sec.\n", (double)(end_decoding - start_decoding)/CLOCKS_PER_SEC);
totaltime =totaltime + (double)(end_decoding - start_decoding)/CLOCKS_PER_SEC;
free(g_buffer);
free(cm);
fclose(fpCode);
fclose(fpDecode);
}
fprintf(fpResult,"Total Time for decoding %2.3f sec.\n", totaltime);
fclose(fpResult);
return 1;
}