forked from parallella/pal
-
Notifications
You must be signed in to change notification settings - Fork 0
/
p_sort.c
100 lines (94 loc) · 2.16 KB
/
p_sort.c
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
#include <pal.h>
#include <stdlib.h>
/*
 * SIFTDOWN_FUNC(name, type)
 *
 * Expands to a static function
 *
 *     void name(type *a, uint32_t start, uint32_t end)
 *
 * that treats a[0..end] (end inclusive) as an implicit binary heap in which
 * the children of index i live at 2*i + 1 and 2*i + 2. Beginning at index
 * `start`, the element is repeatedly exchanged with its larger child (as
 * ordered by `<`) and the walk continues from that child's position. It
 * stops when neither child is larger than the element, or when the current
 * position has no child at an index <= end.
 */
#define SIFTDOWN_FUNC(name, type)                                           \
static void name (type *a, const uint32_t start, const uint32_t end)        \
{                                                                           \
    uint32_t parent = start;                                                \
                                                                            \
    while (2 * parent + 1 <= end) {                                         \
        const uint32_t left = 2 * parent + 1;                               \
        const uint32_t right = left + 1;                                    \
        uint32_t largest = parent;                                          \
                                                                            \
        if (a[largest] < a[left])                                           \
            largest = left;                                                 \
                                                                            \
        /* the right child only exists if it is still inside the heap */    \
        if (right <= end && a[largest] < a[right])                          \
            largest = right;                                                \
                                                                            \
        /* neither child is larger: nothing left to move */                 \
        if (largest == parent)                                              \
            return;                                                         \
                                                                            \
        type held = a[parent];                                              \
        a[parent] = a[largest];                                             \
        a[largest] = held;                                                  \
        parent = largest;                                                   \
    }                                                                       \
}
SIFTDOWN_FUNC(_sift_down_f32, float);
SIFTDOWN_FUNC(_sift_down_u32, uint32_t);
/*
 * SORT_FUNC(name, type, siftfunc)
 *
 * Expands to a static function
 *
 *     void name(const type *a, type *c, int n)
 *
 * that copies the n elements of `a` into `c` and then heapsorts `c` in
 * place into ascending order (as ordered by `<` through `siftfunc`).
 * `a` is only read. When n < 1 the function returns without touching `c`.
 *
 * `siftfunc` must have the signature
 *     void siftfunc(type *heap, uint32_t start, uint32_t end)
 * and sift heap[start] down within heap[0..end] (end inclusive).
 *
 * The element count is kept in a uint32_t so that it has the same type as
 * every index it is compared with or passed alongside. Because unsigned
 * arithmetic would wrap on `count - 2` for a single element, that case is
 * handled by an explicit early return instead of relying on signed
 * truncation of (1 - 2) / 2.
 */
#define SORT_FUNC(name, type, siftfunc)                                     \
static void name (const type *a, type *c, const int n)                      \
{                                                                           \
    if (n < 1)                                                              \
        return;                                                             \
                                                                            \
    const uint32_t count = (uint32_t) n;                                    \
                                                                            \
    /* copy to out */                                                       \
    for (uint32_t i = 0; i < count; i++)                                    \
        c[i] = a[i];                                                        \
                                                                            \
    /* a single element is already sorted */                                \
    if (count < 2)                                                          \
        return;                                                             \
                                                                            \
    /* heapify: the last parent sits at count / 2 - 1; walk back to 0 */    \
    for (uint32_t start = count / 2; start-- > 0; )                         \
        siftfunc(c, start, count - 1);                                      \
                                                                            \
    /* sort: move the current maximum behind the shrinking heap */          \
    for (uint32_t end = count - 1; end > 0; end--) {                        \
        type tmp = c[end];                                                  \
        c[end] = c[0];                                                      \
        c[0] = tmp;                                                         \
        siftfunc(c, 0, end - 1);                                            \
    }                                                                       \
}
SORT_FUNC(_heapsort_f32, float, _sift_down_f32);
SORT_FUNC(_heapsort_u32, uint32_t, _sift_down_u32);
/**
 *
 * Heapsort for float vectors: copies 'a' into 'c' and sorts 'c' into
 * ascending order. 'a' is only read. When n < 1 nothing is written.
 *
 * @param a     Pointer to input vector
 * @param c     Pointer to result vector
 * @param n     Number of elements in 'a' and 'c'
 * @param p     Number of processors to use (task parallelism); not used by
 *              this implementation
 * @param team  Team to work with; not used by this implementation
 *
 * @return      None
 *
 */
void p_sort_f32(float *a, float *c, int n, int p, p_team_t team)
{
    /* The sort runs on the calling thread only; the hints are ignored. */
    (void) p;
    (void) team;

    _heapsort_f32(a, c, n);
}
/**
 *
 * Heapsort for uint32_t vectors: copies 'a' into 'c' and sorts 'c' into
 * ascending order. 'a' is only read. When n < 1 nothing is written.
 *
 * @param a     Pointer to input vector
 * @param c     Pointer to result vector
 * @param n     Number of elements in 'a' and 'c'
 * @param p     Number of processors to use (task parallelism); not used by
 *              this implementation
 * @param team  Team to work with; not used by this implementation
 *
 * @return      None
 *
 */
void p_sort_u32(uint32_t *a, uint32_t *c, int n, int p, p_team_t team)
{
    /* The sort runs on the calling thread only; the hints are ignored. */
    (void) p;
    (void) team;

    _heapsort_u32(a, c, n);
}