annotate fft_fixstart/main.cc @ 10:e38bef2012bc

fix sync bug. and NDrange option
author Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
date Mon, 11 Feb 2013 06:52:24 +0900
parents ed3d4a769bf3
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
3
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
1 #include <stdio.h>
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
2 #include <stdlib.h>
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
3 #include <math.h>
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
4 #include <sys/stat.h>
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
5 #include <fcntl.h>
4
8df0d3128672 add time measurement function
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 3
diff changeset
6 #include <sys/time.h>
3
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
7
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
8 #ifdef __APPLE__
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
9 #include <OpenCL/opencl.h>
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
10 #else
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
11 #include <CL/cl.h>
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
12 #endif
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
13
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
14 #include "pgm.h"
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
15
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
/* Approximation of pi used by the host code. */
#define PI 3.14159265358979

/* 0x100000 bytes (1 MiB). Presumably a cap on the kernel source size;
   it is not referenced in the visible part of this file -- TODO confirm. */
#define MAX_SOURCE_SIZE (0x100000)

/* Magnitude sqrt(a^2 + b^2) of the pair (a, b).
   Each argument is expanded twice, so avoid arguments with side effects. */
#define AMP(a, b) (sqrt((a)*(a)+(b)*(b)))
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
21
4
8df0d3128672 add time measurement function
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 3
diff changeset
22 static double st_time;
8df0d3128672 add time measurement function
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 3
diff changeset
23 static double ed_time;
10
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
24 int ndrange_flag;
4
8df0d3128672 add time measurement function
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 3
diff changeset
25
3
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
26 cl_device_id device_id = NULL;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
27 cl_context context = NULL;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
28 cl_command_queue queue = NULL;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
29 cl_program program = NULL;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
30 cl_device_type device_type = CL_DEVICE_TYPE_GPU;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
31
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
/* Transform direction passed to fftCore(). */
enum Mode {
    forward,    /* 0 */
    inverse     /* 1: fftCore() additionally runs the "norm" kernel */
};
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
36
4
8df0d3128672 add time measurement function
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 3
diff changeset
/*
 * Current time of day in seconds, as reported by gettimeofday(), with the
 * microsecond field folded in as the fractional part.
 */
static double
getTime()
{
    struct timeval now;
    double whole;
    double fraction;

    gettimeofday(&now, NULL);

    whole = now.tv_sec;
    fraction = (double)now.tv_usec * 1e-6;
    return whole + fraction;
}
8df0d3128672 add time measurement function
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 3
diff changeset
44
3
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
45 int setWorkSize(size_t* gws, size_t* lws, cl_int x, cl_int y)
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
46 {
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
47 switch(y) {
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
48 case 1:
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
49 gws[0] = x;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
50 gws[1] = 1;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
51 lws[0] = 1;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
52 lws[1] = 1;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
53 break;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
54 default:
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
55 gws[0] = x;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
56 gws[1] = y;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
57 lws[0] = 1;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
58 lws[1] = 1;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
59 break;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
60 }
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
61
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
62 return 0;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
63 }
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
64
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
65 int fftCore(cl_mem dst, cl_mem src, cl_mem spin, cl_int m, enum Mode direction)
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
66 {
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
67 cl_int ret;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
68
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
69 cl_int iter;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
70 cl_uint flag;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
71
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
72 cl_int n = 1<<m;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
73
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
74 cl_event kernelDone;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
75
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
76 cl_kernel brev = NULL;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
77 cl_kernel bfly = NULL;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
78 cl_kernel norm = NULL;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
79
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
80 brev = clCreateKernel(program, "bitReverse", &ret);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
81 bfly = clCreateKernel(program, "butterfly", &ret);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
82 norm = clCreateKernel(program, "norm", &ret);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
83
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
84 size_t gws[2];
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
85 size_t lws[2];
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
86
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
87 switch (direction) {
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
88 case forward:flag = 0x00000000; break;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
89 case inverse:flag = 0x80000000; break;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
90 }
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
91
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
92 ret = clSetKernelArg(brev, 0, sizeof(cl_mem), (void *)&dst);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
93 ret = clSetKernelArg(brev, 1, sizeof(cl_mem), (void *)&src);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
94 ret = clSetKernelArg(brev, 2, sizeof(cl_int), (void *)&m);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
95 ret = clSetKernelArg(brev, 3, sizeof(cl_int), (void *)&n);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
96
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
97 ret = clSetKernelArg(bfly, 0, sizeof(cl_mem), (void *)&dst);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
98 ret = clSetKernelArg(bfly, 1, sizeof(cl_mem), (void *)&spin);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
99 ret = clSetKernelArg(bfly, 2, sizeof(cl_int), (void *)&m);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
100 ret = clSetKernelArg(bfly, 3, sizeof(cl_int), (void *)&n);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
101 ret = clSetKernelArg(bfly, 5, sizeof(cl_uint), (void *)&flag);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
102
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
103 ret = clSetKernelArg(norm, 0, sizeof(cl_mem), (void *)&dst);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
104 ret = clSetKernelArg(norm, 1, sizeof(cl_int), (void *)&n);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
105
10
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
106 /* Reversee bit ordering */
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
107 if (ndrange_flag == 1) {
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
108 setWorkSize(gws, lws, n, n);
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
109 ret = clEnqueueNDRangeKernel(queue, brev, 2, NULL, gws, lws, 0, NULL, NULL);
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
110 } else {
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
111 ret = clEnqueueTask(queue, brev, 0, NULL, NULL);
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
112 }
3
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
113
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
114 /* Perform Butterfly Operations*/
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
115 setWorkSize(gws, lws, n/2, n);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
116 for (iter=1; iter <= m; iter++) {
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
117 ret = clSetKernelArg(bfly, 4, sizeof(cl_int), (void *)&iter);
10
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
118 if (ndrange_flag == 1) {
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
119 ret = clEnqueueNDRangeKernel(queue, bfly, 2, NULL, gws, lws, 0, NULL, &kernelDone);
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
120 } else {
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
121 ret = clEnqueueTask(queue, bfly, 0, NULL, &kernelDone);
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
122 }
3
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
123 ret = clWaitForEvents(1, &kernelDone);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
124 }
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
125
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
126 if (direction == inverse) {
10
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
127 if (ndrange_flag == 1) {
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
128 setWorkSize(gws, lws, n, n);
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
129 ret = clEnqueueNDRangeKernel(queue, norm, 2, NULL, gws, lws, 0, NULL, &kernelDone);
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
130 } else {
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
131 ret = clEnqueueTask(queue, norm, 0, NULL, &kernelDone);
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
132 }
3
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
133 ret = clWaitForEvents(1, &kernelDone);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
134 }
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
135
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
136 ret = clReleaseKernel(bfly);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
137 ret = clReleaseKernel(brev);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
138 ret = clReleaseKernel(norm);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
139
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
140 return 0;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
141 }
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
142
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
143 char *
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
144 init(int argc, char**argv){
8
1b8da19bb31c change time measure point
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 6
diff changeset
145
3
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
146 char *filename = 0;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
147
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
148 for (int i = 1; argv[i]; ++i) {
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
149 if (strcmp(argv[i], "-file") == 0) {
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
150 filename = argv[i+1];
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
151 } else if (strcmp(argv[i], "-cpu") == 0) {
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
152 device_type = CL_DEVICE_TYPE_CPU;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
153 } else if (strcmp(argv[i], "-gpu") == 0) {
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
154 device_type = CL_DEVICE_TYPE_GPU;
9
ed3d4a769bf3 add divice type all
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 8
diff changeset
155 } else if (strcmp(argv[i], "-all") == 0) {
ed3d4a769bf3 add divice type all
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 8
diff changeset
156 device_type = CL_DEVICE_TYPE_ALL;
10
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
157 } else if (strcmp(argv[i], "-nd") == 0 ) {
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
158 ndrange_flag = 1;
3
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
159 }
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
160 }
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
161 if ( (argc == 1)||(filename==0)) {
6
db074091ed0b minor change
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 5
diff changeset
162 printf("Usage: ./fft -file [image filename] -cpu or -gpu \n");
3
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
163 exit(-1);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
164 }
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
165
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
166 return filename;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
167 }
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
168
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
169 int main(int argc, char** argv) {
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
170 cl_mem xmobj = NULL;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
171 cl_mem rmobj = NULL;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
172 cl_mem wmobj = NULL;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
173 cl_kernel sfac = NULL;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
174 cl_kernel trns = NULL;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
175 cl_kernel hpfl = NULL;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
176
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
177 cl_platform_id platform_id = NULL;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
178
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
179 cl_uint ret_num_devices;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
180 cl_uint ret_num_platforms;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
181
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
182 cl_int ret;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
183
10
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
184
3
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
185 cl_float2 *xm;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
186 cl_float2 *rm;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
187 cl_float2 *wm;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
188
10
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
189 /*
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
190 * typedef union
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
191 * {
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
192 * cl_float CL_ALIGNED(8) s[2];
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
193 * #if defined( __GNUC__) && ! defined( __STRICT_ANSI__ )
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
194 * __extension__ struct{ cl_float x, y; };
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
195 * __extension__ struct{ cl_float s0, s1; };
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
196 * __extension__ struct{ cl_float lo, hi; };
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
197 * #endif
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
198 * #if defined( __CL_FLOAT2__)
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
199 * __cl_float2 v2;
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
200 * #endif
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
201 * }cl_float2;
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
202 */
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
203
3
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
204 pgm_t ipgm;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
205 pgm_t opgm;
8
1b8da19bb31c change time measure point
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 6
diff changeset
206
3
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
207 const char fileName[] = "./fft.cl";
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
208 size_t source_size;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
209 char *source_str;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
210 cl_int i, j;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
211 cl_int n;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
212 cl_int m;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
213
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
214 size_t gws[2];
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
215 size_t lws[2];
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
216
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
217 /* Load kernel source code */
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
218 int fd = open(fileName, O_RDONLY);
8
1b8da19bb31c change time measure point
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 6
diff changeset
219
3
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
220 if (fd<0) {
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
221 fprintf(stderr, "Failed to load kernel %s.\n",fileName);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
222 exit(1);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
223 }
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
224 struct stat stats;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
225 fstat(fd, &stats);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
226 off_t size = stats.st_size;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
227 if (size<=0) {
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
228 fprintf(stderr, "Failed to load kernel.\n");
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
229 exit(1);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
230 }
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
231 source_str = (char*)alloca(size);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
232 source_size = read(fd, source_str, size);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
233 close( fd );
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
234
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
235 char * pgm_file = init(argc,argv);
8
1b8da19bb31c change time measure point
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 6
diff changeset
236
3
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
237 /* Read image */
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
238 int err = readPGM(&ipgm, pgm_file);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
239 if (err<0) {
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
240 fprintf(stderr, "Failed to read image file.\n");
8
1b8da19bb31c change time measure point
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 6
diff changeset
241 exit(1);
3
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
242 }
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
243
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
244 n = ipgm.width;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
245 m = (cl_int)(log((double)n)/log(2.0));
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
246
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
247 xm = (cl_float2 *)malloc(n * n * sizeof(cl_float2));
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
248 rm = (cl_float2 *)malloc(n * n * sizeof(cl_float2));
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
249 wm = (cl_float2 *)malloc(n / 2 * sizeof(cl_float2));
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
250
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
251 for (i=0; i < n; i++) {
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
252 for (j=0; j < n; j++) {
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
253 ((float*)xm)[(2*n*j)+2*i+0] = (float)ipgm.buf[n*j+i];
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
254 ((float*)xm)[(2*n*j)+2*i+1] = (float)0;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
255 }
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
256 }
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
257
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
258 /* Get platform/device */
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
259 ret = clGetPlatformIDs(1, &platform_id, &ret_num_platforms);
5
3602b23914ad fix device type bug
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 4
diff changeset
260
3602b23914ad fix device type bug
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 4
diff changeset
261 ret = clGetDeviceIDs( platform_id, device_type, 1, &device_id, &ret_num_devices);
3
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
262
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
263 /* Create OpenCL context */
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
264 context = clCreateContext(NULL, 1, &device_id, NULL, NULL, &ret);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
265
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
266 /* Create Command queue */
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
267 queue = clCreateCommandQueue(context, device_id, 0, &ret);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
268
8
1b8da19bb31c change time measure point
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 6
diff changeset
269 st_time = getTime();
3
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
270 /* Create Buffer Objects */
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
271 xmobj = clCreateBuffer(context, CL_MEM_READ_WRITE, n*n*sizeof(cl_float2), NULL, &ret);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
272 rmobj = clCreateBuffer(context, CL_MEM_READ_WRITE, n*n*sizeof(cl_float2), NULL, &ret);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
273 wmobj = clCreateBuffer(context, CL_MEM_READ_WRITE, (n/2)*sizeof(cl_float2), NULL, &ret);
10
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
274
3
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
275 /* Transfer data to memory buffer */
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
276 ret = clEnqueueWriteBuffer(queue, xmobj, CL_TRUE, 0, n*n*sizeof(cl_float2), xm, 0, NULL, NULL);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
277
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
278 /* Create kernel program from source */
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
279 program = clCreateProgramWithSource(context, 1, (const char **)&source_str, (const size_t *)&source_size, &ret);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
280
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
281 /* Build kernel program */
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
282 ret = clBuildProgram(program, 1, &device_id, NULL, NULL, NULL);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
283
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
284 if (ret<0) {
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
285 size_t size;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
286 clGetProgramBuildInfo(program, device_id, CL_PROGRAM_BUILD_LOG, 0, NULL, &size);
8
1b8da19bb31c change time measure point
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 6
diff changeset
287
3
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
288 char *log = new char[size];
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
289 clGetProgramBuildInfo(program, device_id, CL_PROGRAM_BUILD_LOG, size, log, NULL);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
290 printf("%s ",log);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
291 exit (ret);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
292 }
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
293
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
294 /* Create OpenCL Kernel */
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
295 sfac = clCreateKernel(program, "spinFact", &ret);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
296 trns = clCreateKernel(program, "transpose", &ret);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
297 hpfl = clCreateKernel(program, "highPassFilter", &ret);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
298
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
299 /* Create spin factor */
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
300 ret = clSetKernelArg(sfac, 0, sizeof(cl_mem), (void *)&wmobj);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
301 ret = clSetKernelArg(sfac, 1, sizeof(cl_int), (void *)&n);
10
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
302 if (ndrange_flag == 1) {
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
303 setWorkSize(gws, lws, n/2, 1);
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
304 ret = clEnqueueNDRangeKernel(queue, sfac, 1, NULL, gws, lws, 0, NULL, NULL);
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
305 } else {
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
306 ret = clEnqueueTask(queue, sfac, 0, NULL, NULL);
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
307 }
3
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
308
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
309 /* Butterfly Operation */
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
310 fftCore(rmobj, xmobj, wmobj, m, forward);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
311
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
312 /* Transpose matrix */
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
313 ret = clSetKernelArg(trns, 0, sizeof(cl_mem), (void *)&xmobj);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
314 ret = clSetKernelArg(trns, 1, sizeof(cl_mem), (void *)&rmobj);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
315 ret = clSetKernelArg(trns, 2, sizeof(cl_int), (void *)&n);
10
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
316 if (ndrange_flag == 1) {
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
317 setWorkSize(gws, lws, n, n);
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
318 ret = clEnqueueNDRangeKernel(queue, trns, 2, NULL, gws, lws, 0, NULL, NULL);
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
319 } else {
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
320 ret = clEnqueueTask(queue, trns, 0, NULL, NULL);
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
321 }
3
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
322
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
323 /* Butterfly Operation */
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
324 fftCore(rmobj, xmobj, wmobj, m, forward);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
325
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
326 /* Apply high-pass filter */
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
327 cl_int radius = n/8;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
328 ret = clSetKernelArg(hpfl, 0, sizeof(cl_mem), (void *)&rmobj);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
329 ret = clSetKernelArg(hpfl, 1, sizeof(cl_int), (void *)&n);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
330 ret = clSetKernelArg(hpfl, 2, sizeof(cl_int), (void *)&radius);
10
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
331 if (ndrange_flag == 1) {
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
332 setWorkSize(gws, lws, n, n);
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
333 ret = clEnqueueNDRangeKernel(queue, hpfl, 2, NULL, gws, lws, 0, NULL, NULL);
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
334 } else {
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
335 ret = clEnqueueTask(queue, hpfl, 0, NULL, NULL);
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
336 }
3
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
337
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
338 /* Inverse FFT */
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
339
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
340 /* Butterfly Operation */
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
341 fftCore(xmobj, rmobj, wmobj, m, inverse);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
342
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
343 /* Transpose matrix */
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
344 ret = clSetKernelArg(trns, 0, sizeof(cl_mem), (void *)&rmobj);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
345 ret = clSetKernelArg(trns, 1, sizeof(cl_mem), (void *)&xmobj);
10
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
346 if (ndrange_flag == 1) {
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
347 setWorkSize(gws, lws, n, n);
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
348 ret = clEnqueueNDRangeKernel(queue, trns, 2, NULL, gws, lws, 0, NULL, NULL);
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
349 } else {
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
350 ret = clEnqueueTask(queue, trns, 0, NULL, NULL);
e38bef2012bc fix sync bug. and NDrange option
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 9
diff changeset
351 }
3
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
352 /* Butterfly Operation */
8
1b8da19bb31c change time measure point
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 6
diff changeset
353
3
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
354 fftCore(xmobj, rmobj, wmobj, m, inverse);
8
1b8da19bb31c change time measure point
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 6
diff changeset
355
1b8da19bb31c change time measure point
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 6
diff changeset
356 /* Read data from memory buffer */
3
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
357 ret = clEnqueueReadBuffer(queue, xmobj, CL_TRUE, 0, n*n*sizeof(cl_float2), xm, 0, NULL, NULL);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
358
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
359 /* Reduce each complex element of xm to one float via AMP() and normalize the result into opgm */
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
360 float* ampd;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
361 ampd = (float*)malloc(n*n*sizeof(float));
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
362 for (i=0; i < n; i++) {
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
363 for (j=0; j < n; j++) {
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
364 ampd[n*((i))+((j))] = (AMP(((float*)xm)[(2*n*i)+2*j], ((float*)xm)[(2*n*i)+2*j+1]));
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
365 }
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
366 }
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
367 opgm.width = n;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
368 opgm.height = n;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
369 normalizeF2PGM(&opgm, ampd);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
370 free(ampd);
8
1b8da19bb31c change time measure point
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 6
diff changeset
371 ret = clFlush(queue);
1b8da19bb31c change time measure point
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 6
diff changeset
372 ret = clFinish(queue);
1b8da19bb31c change time measure point
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 6
diff changeset
373 ed_time = getTime();
3
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
374
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
375 /* Write out image */
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
376 writePGM(&opgm, "output.pgm");
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
377
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
378 /* Finalization: drain the command queue and release the OpenCL objects */
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
379 ret = clFlush(queue);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
380 ret = clFinish(queue);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
381 ret = clReleaseKernel(hpfl);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
382 ret = clReleaseKernel(trns);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
383 ret = clReleaseKernel(sfac);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
384 ret = clReleaseProgram(program);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
385 ret = clReleaseMemObject(xmobj);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
386 ret = clReleaseMemObject(rmobj);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
387 ret = clReleaseMemObject(wmobj);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
388 ret = clReleaseCommandQueue(queue);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
389 ret = clReleaseContext(context);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
390
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
391 destroyPGM(&ipgm);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
392 destroyPGM(&opgm);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
393
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
394 free(wm);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
395 free(rm);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
396 free(xm);
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
397
4
8df0d3128672 add time measurement function
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 3
diff changeset
398 fprintf(stdout, "image out put succeeded.\n");
8df0d3128672 add time measurement function
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents: 3
diff changeset
399 printf("Time: %0.6f\n",ed_time-st_time);
3
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
400 return 0;
f3cfea46e585 add fft_fixstar sample
Yuhi TOMARI <yuhi@cr.ie.u-ryukyu.ac.jp>
parents:
diff changeset
401 }