-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathpma.c
127 lines (107 loc) · 3.29 KB
/
pma.c
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
/**
* pma.c
* Implementation of Poormans Memory Allocator in OpenCL
* Copyright (C) 2013-2014 Roy Spliet, Delft University of Technology
*
* This library is free software; you can redistribute it and/or
* modify it under the terms of the GNU Lesser General Public
* License as published by the Free Software Foundation; either
* version 2.1 of the License, or (at your option) any later version.
*
* This library is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
* Lesser General Public License for more details.
*
* You should have received a copy of the GNU Lesser General Public
* License along with this library; if not, write to the Free Software
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301
* USA
*/
#include <CL/opencl.h>
#include <stddef.h>
#include <stdio.h>
#include <stdlib.h>
#include <sys/stat.h>
#include "pma.h"
/* XXX: Only works on true 64 bit arch */
cl_mem
_pma_create_64(cl_context ctx, cl_command_queue cq, unsigned int sblocks) {
cl_mem gQ;
cl_int error;
struct pma_heap_64 localHeap;
localHeap.bytes = sblocks + sizeof(struct pma_heap_64);
gQ = clCreateBuffer(ctx, CL_MEM_READ_WRITE, localHeap.bytes, NULL, &error);
if(error != CL_SUCCESS) {
printf("PMA: Could not allocate heap on-device\n");
return (cl_mem) 0;
}
error = clEnqueueWriteBuffer(cq, gQ, 0, 0, sizeof(struct pma_heap_64), &localHeap, 0, NULL, NULL);
if(error != CL_SUCCESS) {
printf("PMA: Could not setup heap on device\n");
return (cl_mem) 0;
}
clFinish(cq);
return gQ;
}
cl_mem
_pma_create_32(cl_context ctx, cl_command_queue cq, unsigned int sblocks) {
cl_mem gQ;
cl_int error;
struct pma_heap_32 localHeap;
localHeap.bytes = sblocks + sizeof(struct pma_heap_32);
gQ = clCreateBuffer(ctx, CL_MEM_READ_WRITE, localHeap.bytes, NULL, &error);
if(error != CL_SUCCESS) {
printf("PMA: Could not allocate heap on-device\n");
return (cl_mem) 0;
}
error = clEnqueueWriteBuffer(cq, gQ, 0, 0, sizeof(struct pma_heap_32), &localHeap, 0, NULL, NULL);
if(error != CL_SUCCESS) {
printf("PMA: Could not setup heap on device\n");
return (cl_mem) 0;
}
clFinish(cq);
return gQ;
}
cl_mem
pma_create(cl_device_id dev, cl_context ctx, cl_command_queue cq,
cl_program prg, unsigned int sblocks)
{
cl_int error;
cl_uint bits;
cl_mem q;
cl_kernel kernel;
const size_t threads = 1;
if(sblocks == 0)
return NULL;
error = clGetDeviceInfo(dev, CL_DEVICE_ADDRESS_BITS, sizeof(cl_uint),
&bits, NULL);
if(error) {
printf("PMA: could not discover device address space\n");
return NULL;
}
if(bits == 32) {
q = _pma_create_32(ctx, cq, sblocks);
} else {
q = _pma_create_64(ctx, cq, sblocks);
}
if(!q) {
printf("PMA: No heap!\n");
return NULL;
}
/* Initialise kernel */
kernel = clCreateKernel(prg, "clheap_init", &error);
if(error != CL_SUCCESS) {
printf("PMA: Could not create heap init kernel: %i\n", error);
return NULL;
}
clSetKernelArg(kernel, 0, sizeof(cl_mem), &q);
error = clEnqueueNDRangeKernel(cq, kernel, 1, NULL, &threads, NULL, 0, NULL, NULL);
error |= clFinish(cq);
if (error != CL_SUCCESS) {
printf("PMA: Could not execute heap init kernel: %i\n", error);
return NULL;
}
clReleaseKernel(kernel);
return q;
}