-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathmorphology.cu
98 lines (88 loc) · 2.95 KB
/
morphology.cu
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
#include <cuda_runtime.h>
extern "C"
{
__global__ void dilation(int * src, int * dst, int p, int window_size, int n_window, int image_shape)
{
extern __shared__ int smem[];
int tx = threadIdx.x;
int ty = threadIdx.y;
int bx = blockIdx.x;
if (tx == 0)
{
for (int i = p - 1; i >= 0; i--)
{
if (i == p - 1)
smem[ty * p + i] = src[bx * p * n_window + ty * p + i];
else
smem[ty * p + i] = max(src[bx * p * n_window + ty * p + i], smem[ty * p + (i + 1)]);
}
}
else
{
for (int i = 0; i <= p - 1; i++)
{
if (i == 0)
smem[n_window * p + (ty * p) + i] = src[bx * p * n_window + ty * p + (i + p - 1)];
else
smem[n_window * p + (ty * p) + i] = max(src[bx * p *n_window + ty * p + (i + p - 1)],
smem[n_window * p + (ty * p) + (i - 1)]);
}
}
__syncthreads();
if (tx == 0)
{
for (int i = 0; i < p; i++)
{
// Skip first p-1 / 2 because of padding
int original_index = bx * p * n_window + ty * p + i + ((p - 1)/2);
if (original_index < image_shape)
{
dst[original_index] = max(smem[ty * p + i], smem[n_window * p + (ty * p) + i]);
}
}
}
}
}
extern "C"
{
__global__ void erosion(int * src, int * dst, int p, int window_size, int n_window, int image_shape)
{
extern __shared__ int smem[];
int tx = threadIdx.x;
int ty = threadIdx.y;
int bx = blockIdx.x;
if (tx == 0)
{
for (int i = p - 1; i >= 0; i--)
{
if (i == p - 1)
smem[ty * p + i] = src[bx * p * n_window + ty * p + i];
else
smem[ty * p + i] = min(src[bx * p * n_window + ty * p + i], smem[ty * p + (i + 1)]);
}
}
else
{
for (int i = 0; i <= p - 1; i++)
{
if (i == 0)
smem[n_window * p + (ty * p) + i] = src[bx * p * n_window + ty * p + (i + p - 1)];
else
smem[n_window * p + (ty * p) + i] = min(src[bx * p *n_window + ty * p + (i + p - 1)],
smem[n_window * p + (ty * p) + (i - 1)]);
}
}
__syncthreads();
if (tx == 0)
{
for (int i = 0; i < p; i++)
{
int original_index = bx * p * n_window + ty * p + i + ((p - 1)/2);
if (original_index < image_shape)
{
dst[original_index] = min(smem[ty * p + i], smem[n_window * p + (ty * p) + i]);
}
}
}
}
}