blob: 29199df665d3707d7ab7428b04c01e5ff43b0612 [file] [log] [blame]
//
// Copyright (c) 2017 The Khronos Group Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
//
#include "harness/compat.h"
#include <stdio.h>
#include <string.h>
#include <assert.h>
#include <sys/types.h>
#include <sys/stat.h>
#include "procs.h"
#include "harness/errorHelpers.h"
#define STRING_LENGTH 1024
void createKernelSourceCode(char *source, int num_pipes)
{
int i;
char str[256];
int str_length;
strcpy(source, "__kernel void test_multiple_pipe_write(__global int *src, ");
for(i = 0; i < num_pipes; i++) {
sprintf(str, "__write_only pipe int pipe%d, ", i);
strcat(source, str);
}
sprintf(str, "int num_pipes ) \n{\n int gid = get_global_id(0);\n reserve_id_t res_id;\n\n");
strcat(source, str);
sprintf(str, " if(gid < (get_global_size(0))/num_pipes)\n {\n res_id = reserve_write_pipe(pipe0, 1);\n if(is_valid_reserve_id(res_id))\n {\n");
strcat(source, str);
sprintf(str, " write_pipe(pipe0, res_id, 0, &src[gid]);\n commit_write_pipe(pipe0, res_id);\n }\n }\n");
strcat(source, str);
for(i = 1; i < num_pipes; i++){
sprintf(str, " else if(gid < (%d*get_global_size(0))/num_pipes)\n {\n res_id = reserve_write_pipe(pipe%d, 1);\n if(is_valid_reserve_id(res_id))\n {\n", i+1, i);
strcat(source, str);
sprintf(str, " write_pipe(pipe%d, res_id, 0, &src[gid]);\n commit_write_pipe(pipe%d, res_id);\n }\n }\n", i, i);
strcat(source, str);
}
strcat(source, "}\n\n__kernel void test_multiple_pipe_read(__global int *dst, ");
for(i = 0; i < num_pipes; i++) {
sprintf(str, "__read_only pipe int pipe%d, ", i);
strcat(source, str);
}
sprintf(str, "int num_pipes ) \n{\n int gid = get_global_id(0);\n reserve_id_t res_id;\n\n");
strcat(source, str);
sprintf(str, " if(gid < (get_global_size(0))/num_pipes)\n {\n res_id = reserve_read_pipe(pipe0, 1);\n if(is_valid_reserve_id(res_id))\n {\n");
strcat(source, str);
sprintf(str, " read_pipe(pipe0, res_id, 0, &dst[gid]);\n commit_read_pipe(pipe0, res_id);\n }\n }\n");
strcat(source, str);
for(i = 1; i < num_pipes; i++){
sprintf(str, " else if(gid < (%d*get_global_size(0))/num_pipes)\n {\n res_id = reserve_read_pipe(pipe%d, 1);\n if(is_valid_reserve_id(res_id))\n {\n", i+1, i);
strcat(source, str);
sprintf(str, " read_pipe(pipe%d, res_id, 0, &dst[gid]);\n commit_read_pipe(pipe%d, res_id);\n }\n }\n", i, i);
strcat(source, str);
}
strcat(source, "}");
str_length = strlen(source);
assert(str_length <= STRING_LENGTH*num_pipes);
}
static int verify_result(void *ptr1, void *ptr2, int n)
{
int i;
int sum_input = 0, sum_output = 0;
cl_char *inptr = (cl_char *)ptr1;
cl_char *outptr = (cl_char *)ptr2;
for(i = 0; i < n; i++)
{
sum_input += inptr[i];
sum_output += outptr[i];
}
if(sum_input != sum_output){
return -1;
}
return 0;
}
static int verify_result_int(void *ptr1, void *ptr2, int n)
{
int i;
int sum_input = 0, sum_output = 0;
cl_int *inptr = (cl_int *)ptr1;
cl_int *outptr = (cl_int *)ptr2;
for(i = 0; i < n; i++)
{
sum_input += inptr[i];
sum_output += outptr[i];
}
if(sum_input != sum_output){
return -1;
}
return 0;
}
int test_pipe_max_args(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements)
{
cl_mem pipes[1024];
cl_mem buffers[2];
void *outptr;
cl_int *inptr;
cl_program program;
cl_kernel kernel[2];
size_t global_work_size[3];
cl_int err;
cl_int size;
int num_pipe_elements = 1024;
int i, j;
int max_pipe_args;
char *source;
cl_event producer_sync_event = NULL;
cl_event consumer_sync_event = NULL;
MTdata d = init_genrand( gRandomSeed );
const char* kernelName[] = {"test_multiple_pipe_write", "test_multiple_pipe_read"};
size_t min_alignment = get_min_alignment(context);
err = clGetDeviceInfo(deviceID, CL_DEVICE_MAX_PIPE_ARGS, sizeof(max_pipe_args), (void*)&max_pipe_args, NULL);
if(err){
print_error(err, " clGetDeviceInfo failed\n");
return -1;
}
if(max_pipe_args < 16){
log_error("The device should support minimum 16 pipe objects that could be passed as arguments to the kernel");
return -1;
}
global_work_size[0] = (cl_uint)num_pipe_elements * max_pipe_args;
size = sizeof(int) * num_pipe_elements * max_pipe_args;
source = (char *)malloc(STRING_LENGTH * sizeof(char) * max_pipe_args);
inptr = (cl_int *)align_malloc(size, min_alignment);
for(i = 0; i < num_pipe_elements * max_pipe_args; i++){
inptr[i] = (int)genrand_int32(d);
}
buffers[0] = clCreateBuffer(context, CL_MEM_COPY_HOST_PTR, size, inptr, &err);
if(err){
clReleaseMemObject(buffers[0]);
free(source);
print_error(err, " clCreateBuffer failed\n");
return -1;
}
outptr = align_malloc(size, min_alignment);
buffers[1] = clCreateBuffer(context, CL_MEM_USE_HOST_PTR, size, outptr, &err);
if ( err ){
clReleaseMemObject(buffers[0]);
clReleaseMemObject(buffers[1]);
align_free( outptr );
free(source);
print_error(err, " clCreateBuffer failed\n" );
return -1;
}
for(i = 0; i < max_pipe_args; i++){
pipes[i] = clCreatePipe(context, CL_MEM_HOST_NO_ACCESS, sizeof(int), num_pipe_elements, NULL, &err);
if(err){
clReleaseMemObject(buffers[0]);
clReleaseMemObject(buffers[1]);
align_free( outptr );
free(source);
for(j = 0; j < i; j++) {
clReleaseMemObject(pipes[j]);
}
print_error(err, " clCreatePipe failed\n");
return -1;
}
}
createKernelSourceCode(source, max_pipe_args);
// Create producer kernel
err = create_single_kernel_helper_with_build_options(context, &program, &kernel[0], 1, (const char**)&source, kernelName[0], "-cl-std=CL2.0");
if(err){
clReleaseMemObject(buffers[0]);
clReleaseMemObject(buffers[1]);
for(j = 0; j < max_pipe_args; j++) {
clReleaseMemObject(pipes[j]);
}
align_free(outptr);
free(source);
print_error(err, "Error creating program\n");
return -1;
}
//Create consumer kernel
kernel[1] = clCreateKernel(program, kernelName[1], &err);
if( kernel[1] == NULL || err != CL_SUCCESS)
{
clReleaseMemObject(buffers[0]);
clReleaseMemObject(buffers[1]);
for(j = 0; j < max_pipe_args; j++) {
clReleaseMemObject(pipes[j]);
}
align_free(outptr);
free(source);
print_error(err, " Error creating kernel\n");
return -1;
}
err = clSetKernelArg(kernel[0], 0, sizeof(cl_mem), (void*)&buffers[0]);
for( i = 0; i < max_pipe_args; i++){
err |= clSetKernelArg(kernel[0], i+1, sizeof(cl_mem), (void*)&pipes[i]);
}
err |= clSetKernelArg(kernel[0], max_pipe_args + 1, sizeof(int), (void*)&max_pipe_args);
err |= clSetKernelArg(kernel[1], 0, sizeof(cl_mem), (void*)&buffers[1]);
for( i = 0; i < max_pipe_args; i++){
err |= clSetKernelArg(kernel[1], i+1, sizeof(cl_mem), (void*)&pipes[i]);
}
err |= clSetKernelArg(kernel[1], max_pipe_args + 1, sizeof(int), (void*)&max_pipe_args);
if ( err != CL_SUCCESS ){
clReleaseMemObject(buffers[0]);
clReleaseMemObject(buffers[1]);
for(j = 0; j < max_pipe_args; j++) {
clReleaseMemObject(pipes[j]);
}
clReleaseKernel(kernel[0]);
clReleaseKernel(kernel[1]);
clReleaseProgram(program);
align_free(outptr);
free(source);
print_error(err, " clSetKernelArg failed");
return -1;
}
// Launch Producer kernel
err = clEnqueueNDRangeKernel( queue, kernel[0], 1, NULL, global_work_size, NULL, 0, NULL, &producer_sync_event );
if ( err != CL_SUCCESS ){
print_error( err, " clEnqueueNDRangeKernel failed" );
clReleaseMemObject(buffers[0]);
clReleaseMemObject(buffers[1]);
for(j = 0; j < max_pipe_args; j++) {
clReleaseMemObject(pipes[j]);
}
clReleaseKernel(kernel[0]);
clReleaseKernel(kernel[1]);
clReleaseEvent(producer_sync_event);
clReleaseEvent(consumer_sync_event);
clReleaseProgram(program);
align_free(outptr);
free(source);
return -1;
}
// Launch Consumer kernel
err = clEnqueueNDRangeKernel( queue, kernel[1], 1, NULL, global_work_size, NULL, 1, &producer_sync_event, &consumer_sync_event );
if ( err != CL_SUCCESS ){
print_error( err, " clEnqueueNDRangeKernel failed" );
clReleaseMemObject(buffers[0]);
clReleaseMemObject(buffers[1]);
for(j = 0; j < max_pipe_args; j++) {
clReleaseMemObject(pipes[j]);
}
clReleaseKernel(kernel[0]);
clReleaseKernel(kernel[1]);
clReleaseEvent(producer_sync_event);
clReleaseEvent(consumer_sync_event);
clReleaseProgram(program);
align_free(outptr);
free(source);
return -1;
}
err = clEnqueueReadBuffer(queue, buffers[1], true, 0, size, outptr, 1, &consumer_sync_event, NULL);
if ( err != CL_SUCCESS ){
print_error( err, " clEnqueueReadBuffer failed" );
clReleaseMemObject(buffers[0]);
clReleaseMemObject(buffers[1]);
for(j = 0; j < max_pipe_args; j++) {
clReleaseMemObject(pipes[j]);
}
clReleaseKernel(kernel[0]);
clReleaseKernel(kernel[1]);
clReleaseEvent(producer_sync_event);
clReleaseEvent(consumer_sync_event);
clReleaseProgram(program);
align_free(outptr);
free(source);
return -1;
}
err = clWaitForEvents(1, &consumer_sync_event);
if ( err != CL_SUCCESS ){
print_error( err, " clWaitForEvents failed" );
clReleaseMemObject(buffers[0]);
clReleaseMemObject(buffers[1]);
for(j = 0; j < max_pipe_args; j++) {
clReleaseMemObject(pipes[j]);
}
clReleaseKernel(kernel[0]);
clReleaseKernel(kernel[1]);
clReleaseEvent(producer_sync_event);
clReleaseEvent(consumer_sync_event);
clReleaseProgram(program);
align_free(outptr);
free(source);
return -1;
}
if( verify_result( inptr, outptr, num_pipe_elements*sizeof(cl_int))){
log_error("test_pipe_max_args failed\n");
clReleaseMemObject(buffers[0]);
clReleaseMemObject(buffers[1]);
for(j = 0; j < max_pipe_args; j++) {
clReleaseMemObject(pipes[j]);
}
clReleaseKernel(kernel[0]);
clReleaseKernel(kernel[1]);
clReleaseEvent(producer_sync_event);
clReleaseEvent(consumer_sync_event);
clReleaseProgram(program);
align_free(outptr);
free(source);
return -1;
}
else {
log_info("test_pipe_max_args passed\n");
}
//cleanup
clReleaseMemObject(buffers[0]);
clReleaseMemObject(buffers[1]);
for(j = 0; j < max_pipe_args; j++) {
clReleaseMemObject(pipes[j]);
}
clReleaseKernel(kernel[0]);
clReleaseKernel(kernel[1]);
clReleaseEvent(producer_sync_event);
clReleaseEvent(consumer_sync_event);
clReleaseProgram(program);
align_free(outptr);
free(source);
return 0;
}
int test_pipe_max_packet_size(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements)
{
cl_mem pipe;
cl_mem buffers[2];
void *outptr;
cl_char *inptr;
cl_program program;
cl_kernel kernel[2];
size_t global_work_size[3];
cl_int err;
size_t size;
int num_pipe_elements = 1024;
int i;
cl_uint max_pipe_packet_size;
char *source;
char str[256];
int str_length;
cl_event producer_sync_event = NULL;
cl_event consumer_sync_event = NULL;
MTdata d = init_genrand( gRandomSeed );
const char* kernelName[] = {"test_pipe_max_packet_size_write", "test_pipe_max_packet_size_read"};
size_t min_alignment = get_min_alignment(context);
global_work_size[0] = (cl_uint)num_pipe_elements;
source = (char*)malloc(STRING_LENGTH*sizeof(char));
err = clGetDeviceInfo(deviceID, CL_DEVICE_PIPE_MAX_PACKET_SIZE, sizeof(max_pipe_packet_size), (void*)&max_pipe_packet_size, NULL);
if(err){
print_error(err, " clGetDeviceInfo failed\n");
return -1;
}
if(max_pipe_packet_size < 1024){
log_error("The device should support minimum packet size of 1024 bytes");
return -1;
}
if(max_pipe_packet_size > (32*1024*1024/num_pipe_elements))
{
max_pipe_packet_size = 32*1024*1024/num_pipe_elements;
}
size = max_pipe_packet_size * num_pipe_elements;
inptr = (cl_char *)align_malloc(size, min_alignment);
for(i = 0; i < size; i++){
inptr[i] = (char)genrand_int32(d);
}
buffers[0] = clCreateBuffer(context, CL_MEM_COPY_HOST_PTR, size, inptr, &err);
if(err){
clReleaseMemObject(buffers[0]);
free(source);
print_error(err, " clCreateBuffer failed\n");
return -1;
}
outptr = align_malloc(size, min_alignment);
buffers[1] = clCreateBuffer(context, CL_MEM_USE_HOST_PTR, size, outptr, &err);
if ( err ){
clReleaseMemObject(buffers[0]);
clReleaseMemObject(buffers[1]);
align_free( outptr );
free(source);
print_error(err, " clCreateBuffer failed\n" );
return -1;
}
pipe = clCreatePipe(context, CL_MEM_HOST_NO_ACCESS, max_pipe_packet_size, num_pipe_elements, NULL, &err);
if(err){
clReleaseMemObject(buffers[0]);
clReleaseMemObject(buffers[1]);
align_free( outptr );
free(source);
clReleaseMemObject(pipe);
print_error(err, " clCreatePipe failed\n");
return -1;
}
sprintf(str, "typedef struct{\n char a[%d];\n}TestStruct;\n\n__kernel void test_pipe_max_packet_size_write(__global TestStruct *src, __write_only pipe TestStruct out_pipe)\n{\n", max_pipe_packet_size);
strcpy(source,str);
strcat(source, " int gid = get_global_id(0);\n reserve_id_t res_id;\n\n");
sprintf(str, " res_id = reserve_write_pipe(out_pipe, 1);\n if(is_valid_reserve_id(res_id))\n {\n");
strcat(source, str);
sprintf(str, " write_pipe(out_pipe, res_id, 0, &src[gid]);\n commit_write_pipe(out_pipe, res_id);\n }\n}\n\n");
strcat(source, str);
sprintf(str, "__kernel void test_pipe_max_packet_size_read(__read_only pipe TestStruct in_pipe, __global TestStruct *dst)\n{\n");
strcat(source, str);
strcat(source, " int gid = get_global_id(0);\n reserve_id_t res_id;\n\n");
sprintf(str, " res_id = reserve_read_pipe(in_pipe, 1);\n if(is_valid_reserve_id(res_id))\n {\n");
strcat(source, str);
sprintf(str, " read_pipe(in_pipe, res_id, 0, &dst[gid]);\n commit_read_pipe(in_pipe, res_id);\n }\n}\n\n");
strcat(source, str);
str_length = strlen(source);
assert(str_length <= STRING_LENGTH);
// Create producer kernel
err = create_single_kernel_helper_with_build_options(context, &program, &kernel[0], 1, (const char**)&source, kernelName[0], "-cl-std=CL2.0");
if(err){
clReleaseMemObject(buffers[0]);
clReleaseMemObject(buffers[1]);
clReleaseMemObject(pipe);
align_free(outptr);
free(source);
print_error(err, "Error creating program\n");
return -1;
}
//Create consumer kernel
kernel[1] = clCreateKernel(program, kernelName[1], &err);
if( kernel[1] == NULL || err != CL_SUCCESS)
{
clReleaseMemObject(buffers[0]);
clReleaseMemObject(buffers[1]);
clReleaseMemObject(pipe);
align_free(outptr);
free(source);
print_error(err, "Error creating kernel\n");
return -1;
}
err = clSetKernelArg(kernel[0], 0, sizeof(cl_mem), (void*)&buffers[0]);
err |= clSetKernelArg(kernel[0], 1, sizeof(cl_mem), (void*)&pipe);
err |= clSetKernelArg(kernel[1], 0, sizeof(cl_mem), (void*)&pipe);
err |= clSetKernelArg(kernel[1], 1, sizeof(cl_mem), (void*)&buffers[1]);
if ( err != CL_SUCCESS ){
clReleaseMemObject(buffers[0]);
clReleaseMemObject(buffers[1]);
clReleaseMemObject(pipe);
clReleaseKernel(kernel[0]);
clReleaseKernel(kernel[1]);
clReleaseProgram(program);
align_free(outptr);
free(source);
print_error(err, " clSetKernelArg failed");
return -1;
}
// Launch Producer kernel
err = clEnqueueNDRangeKernel( queue, kernel[0], 1, NULL, global_work_size, NULL, 0, NULL, &producer_sync_event );
if ( err != CL_SUCCESS ){
print_error( err, " clEnqueueNDRangeKernel failed" );
clReleaseMemObject(buffers[0]);
clReleaseMemObject(buffers[1]);
clReleaseMemObject(pipe);
clReleaseKernel(kernel[0]);
clReleaseKernel(kernel[1]);
clReleaseEvent(producer_sync_event);
clReleaseEvent(consumer_sync_event);
clReleaseProgram(program);
align_free(outptr);
free(source);
return -1;
}
// Launch Consumer kernel
err = clEnqueueNDRangeKernel( queue, kernel[1], 1, NULL, global_work_size, NULL, 1, &producer_sync_event, &consumer_sync_event );
if ( err != CL_SUCCESS ){
print_error( err, " clEnqueueNDRangeKernel failed" );
clReleaseMemObject(buffers[0]);
clReleaseMemObject(buffers[1]);
clReleaseMemObject(pipe);
clReleaseKernel(kernel[0]);
clReleaseKernel(kernel[1]);
clReleaseEvent(producer_sync_event);
clReleaseEvent(consumer_sync_event);
clReleaseProgram(program);
align_free(outptr);
free(source);
return -1;
}
err = clEnqueueReadBuffer(queue, buffers[1], true, 0, size, outptr, 1, &consumer_sync_event, NULL);
if ( err != CL_SUCCESS ){
print_error( err, " clEnqueueReadBuffer failed" );
clReleaseMemObject(buffers[0]);
clReleaseMemObject(buffers[1]);
clReleaseMemObject(pipe);
clReleaseKernel(kernel[0]);
clReleaseKernel(kernel[1]);
clReleaseEvent(producer_sync_event);
clReleaseEvent(consumer_sync_event);
clReleaseProgram(program);
align_free(outptr);
free(source);
return -1;
}
if( verify_result( inptr, outptr, size)){
log_error("test_pipe_max_packet_size failed\n");
clReleaseMemObject(buffers[0]);
clReleaseMemObject(buffers[1]);
clReleaseMemObject(pipe);
clReleaseKernel(kernel[0]);
clReleaseKernel(kernel[1]);
clReleaseEvent(producer_sync_event);
clReleaseEvent(consumer_sync_event);
clReleaseProgram(program);
align_free(outptr);
free(source);
return -1;
}
else {
log_info("test_pipe_max_packet_size passed\n");
}
//cleanup
clReleaseMemObject(buffers[0]);
clReleaseMemObject(buffers[1]);
clReleaseMemObject(pipe);
clReleaseKernel(kernel[0]);
clReleaseKernel(kernel[1]);
clReleaseEvent(producer_sync_event);
clReleaseEvent(consumer_sync_event);
clReleaseProgram(program);
align_free(outptr);
free(source);
return 0;
}
int test_pipe_max_active_reservations(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements)
{
cl_mem pipe;
cl_mem buffers[2];
cl_mem buf_reservations;
cl_mem buf_status;
cl_mem buf_reserve_id_t_size;
cl_mem buf_reserve_id_t_size_aligned;
cl_int *inptr;
void *outptr;
int size, i;
cl_program program;
cl_kernel kernel[3];
size_t global_work_size[3];
cl_int err;
int status = 0;
cl_uint max_active_reservations = 0;
cl_ulong max_global_size = 0;
int reserve_id_t_size;
int temp;
char *source;
char str[256];
int str_length;
cl_event sync_event = NULL;
cl_event read_event = NULL;
MTdata d = init_genrand( gRandomSeed );
const char* kernelName[3] = {"test_pipe_max_active_reservations_write", "test_pipe_max_active_reservations_read", "pipe_get_reserve_id_t_size"};
size_t min_alignment = get_min_alignment(context);
source = (char*)malloc(2*STRING_LENGTH*sizeof(char));
global_work_size[0] = 1;
err = clGetDeviceInfo(deviceID, CL_DEVICE_PIPE_MAX_ACTIVE_RESERVATIONS, sizeof(max_active_reservations), (void*)&max_active_reservations, NULL);
if(err){
print_error(err, " clGetDeviceInfo failed\n");
return -1;
}
err = clGetDeviceInfo(deviceID, CL_DEVICE_GLOBAL_MEM_SIZE, sizeof(max_global_size), (void*)&max_global_size, NULL);
if(err){
print_error(err, " clGetDeviceInfo failed\n");
return -1;
}
max_active_reservations = (max_active_reservations > max_global_size) ? 1<<16 : max_active_reservations;
if(max_active_reservations < 1){
log_error("The device should support minimum active reservations of 1");
return -1;
}
// To get reserve_id_t size
buf_reserve_id_t_size = clCreateBuffer(context, CL_MEM_HOST_READ_ONLY, sizeof(reserve_id_t_size), NULL, &err);
if ( err ){
clReleaseMemObject(buf_reserve_id_t_size);
print_error(err, " clCreateBuffer failed\n" );
return -1;
}
sprintf(str, "__kernel void test_pipe_max_active_reservations_write(__global int *src, __write_only pipe int out_pipe, __global char *reserve_id, __global int *reserve_id_t_size_aligned, __global int *status)\n{\n");
strcpy(source,str);
sprintf(str, " __global reserve_id_t *res_id_ptr;\n int reserve_idx;\n int commit_idx;\n");
strcat(source, str);
sprintf(str, " for(reserve_idx = 0; reserve_idx < %d; reserve_idx++)\n {\n", max_active_reservations);
strcat(source, str);
sprintf(str, " res_id_ptr = (__global reserve_id_t*)(reserve_id + reserve_idx*reserve_id_t_size_aligned[0]);\n");
strcat(source, str);
sprintf(str, " *res_id_ptr = reserve_write_pipe(out_pipe, 1);\n");
strcat(source, str);
sprintf(str, " if(is_valid_reserve_id(res_id_ptr[0]))\n {\n write_pipe(out_pipe, res_id_ptr[0], 0, &src[reserve_idx]);\n }\n");
strcat(source, str);
sprintf(str, " else\n {\n *status = -1;\n return;\n }\n }\n");
strcat(source, str);
sprintf(str, " for(commit_idx = 0; commit_idx < %d; commit_idx++)\n {\n", max_active_reservations);
strcat(source, str);
sprintf(str, " res_id_ptr = (__global reserve_id_t*)(reserve_id + commit_idx*reserve_id_t_size_aligned[0]);\n");
strcat(source, str);
sprintf(str, " commit_write_pipe(out_pipe, res_id_ptr[0]);\n }\n}\n\n");
strcat(source, str);
sprintf(str, "__kernel void test_pipe_max_active_reservations_read(__read_only pipe int in_pipe, __global int *dst, __global char *reserve_id, __global int *reserve_id_t_size_aligned, __global int *status)\n{\n");
strcat(source, str);
sprintf(str, " __global reserve_id_t *res_id_ptr;\n int reserve_idx;\n int commit_idx;\n");
strcat(source, str);
sprintf(str, " for(reserve_idx = 0; reserve_idx < %d; reserve_idx++)\n {\n", max_active_reservations);
strcat(source, str);
sprintf(str, " res_id_ptr = (__global reserve_id_t*)(reserve_id + reserve_idx*reserve_id_t_size_aligned[0]);\n");
strcat(source, str);
sprintf(str, " *res_id_ptr = reserve_read_pipe(in_pipe, 1);\n");
strcat(source, str);
sprintf(str, " if(is_valid_reserve_id(res_id_ptr[0]))\n {\n read_pipe(in_pipe, res_id_ptr[0], 0, &dst[reserve_idx]);\n }\n");
strcat(source, str);
sprintf(str, " else\n {\n *status = -1;\n return;\n }\n }\n");
strcat(source, str);
sprintf(str, " for(commit_idx = 0; commit_idx < %d; commit_idx++)\n {\n", max_active_reservations);
strcat(source, str);
sprintf(str, " res_id_ptr = (__global reserve_id_t*)(reserve_id + commit_idx*reserve_id_t_size_aligned[0]);\n");
strcat(source, str);
sprintf(str, " commit_read_pipe(in_pipe, res_id_ptr[0]);\n }\n}\n\n");
strcat(source, str);
sprintf(str, "__kernel void pipe_get_reserve_id_t_size(__global int *reserve_id_t_size) \n");
strcat(source, str);
sprintf(str, "{\n *reserve_id_t_size = sizeof(reserve_id_t);\n}\n");
strcat(source, str);
str_length = strlen(source);
assert(str_length <= 2*STRING_LENGTH);
// Create producer kernel
err = create_single_kernel_helper_with_build_options(context, &program, &kernel[0], 1, (const char**)&source, kernelName[0], "-cl-std=CL2.0");
if(err){
clReleaseMemObject(buf_reserve_id_t_size);
print_error(err, "Error creating program\n");
return -1;
}
// Create consumer kernel
kernel[1] = clCreateKernel(program, kernelName[1], &err);
if( kernel[1] == NULL || err != CL_SUCCESS)
{
clReleaseMemObject(buf_reserve_id_t_size);
print_error(err, "Error creating kernel\n");
return -1;
}
// Create size query kernel for reserve_id_t
kernel[2] = clCreateKernel(program, kernelName[2], &err);
if( kernel[2] == NULL || err != CL_SUCCESS)
{
clReleaseMemObject(buf_reserve_id_t_size);
print_error(err, "Error creating kernel\n");
return -1;
}
err = clSetKernelArg(kernel[2], 0, sizeof(cl_mem), (void*)&buf_reserve_id_t_size);
if(err){
clReleaseMemObject(buf_reserve_id_t_size);
print_error(err, "Error creating program\n");
return -1;
}
//Launch size query kernel for reserve_id_t
err = clEnqueueNDRangeKernel( queue, kernel[2], 1, NULL, global_work_size, NULL, 0, NULL, &sync_event );
if ( err != CL_SUCCESS ){
print_error( err, " clEnqueueNDRangeKernel failed" );
clReleaseMemObject(buf_reserve_id_t_size);
clReleaseKernel(kernel[0]);
clReleaseKernel(kernel[1]);
clReleaseKernel(kernel[2]);
clReleaseEvent(sync_event);
clReleaseProgram(program);
return -1;
}
err = clEnqueueReadBuffer(queue, buf_reserve_id_t_size, true, 0, sizeof(reserve_id_t_size), &reserve_id_t_size, 1, &sync_event, &read_event);
if ( err != CL_SUCCESS ){
print_error( err, " clEnqueueReadBuffer failed" );
clReleaseMemObject(buf_reserve_id_t_size);
clReleaseKernel(kernel[0]);
clReleaseKernel(kernel[1]);
clReleaseKernel(kernel[2]);
clReleaseEvent(sync_event);
clReleaseProgram(program);
return -1;
}
err = clWaitForEvents(1, &read_event);
if ( err != CL_SUCCESS ){
print_error( err, " clWaitForEvents failed" );
clReleaseMemObject(buf_reserve_id_t_size);
clReleaseKernel(kernel[0]);
clReleaseKernel(kernel[1]);
clReleaseKernel(kernel[2]);
clReleaseEvent(sync_event);
clReleaseEvent(read_event);
clReleaseProgram(program);
return -1;
}
// Round reserve_id_t_size to the nearest power of 2
temp = 1;
while(temp < reserve_id_t_size)
temp *= 2;
reserve_id_t_size = temp;
size = sizeof(cl_int) * max_active_reservations;
inptr = (cl_int *)align_malloc(size, min_alignment);
for(i = 0; i < max_active_reservations; i++){
inptr[i] = (int)genrand_int32(d);
}
buffers[0] = clCreateBuffer(context, CL_MEM_COPY_HOST_PTR, size, inptr, &err);
if ( err ){
clReleaseMemObject(buf_reserve_id_t_size);
clReleaseMemObject(buffers[0]);
clReleaseKernel(kernel[0]);
clReleaseKernel(kernel[1]);
clReleaseKernel(kernel[2]);
clReleaseEvent(sync_event);
clReleaseEvent(read_event);
clReleaseProgram(program);
print_error(err, " clCreateBuffer failed\n" );
return -1;
}
outptr = align_malloc(size, min_alignment);
buffers[1] = clCreateBuffer(context, CL_MEM_HOST_READ_ONLY, size, NULL, &err);
if ( err ){
clReleaseMemObject(buf_reserve_id_t_size);
clReleaseMemObject(buffers[0]);
clReleaseMemObject(buffers[1]);
clReleaseKernel(kernel[0]);
clReleaseKernel(kernel[1]);
clReleaseKernel(kernel[2]);
clReleaseEvent(sync_event);
clReleaseEvent(read_event);
clReleaseProgram(program);
align_free(outptr);
print_error(err, " clCreateBuffer failed\n" );
return -1;
}
buf_reserve_id_t_size_aligned = clCreateBuffer(context, CL_MEM_COPY_HOST_PTR, sizeof(reserve_id_t_size), &reserve_id_t_size, &err);
if ( err ){
clReleaseMemObject(buf_reserve_id_t_size);
clReleaseMemObject(buf_reserve_id_t_size_aligned);
clReleaseMemObject(buffers[0]);
clReleaseMemObject(buffers[1]);
clReleaseKernel(kernel[0]);
clReleaseKernel(kernel[1]);
clReleaseKernel(kernel[2]);
clReleaseEvent(sync_event);
clReleaseEvent(read_event);
clReleaseProgram(program);
print_error(err, " clCreateBuffer failed\n" );
return -1;
}
//For error status
buf_status = clCreateBuffer(context, CL_MEM_COPY_HOST_PTR, sizeof(int), &status, &err);
if ( err ){
clReleaseMemObject(buf_status);
clReleaseMemObject(buf_reserve_id_t_size);
clReleaseMemObject(buf_reserve_id_t_size_aligned);
clReleaseMemObject(buffers[0]);
clReleaseMemObject(buffers[1]);
align_free(outptr);
clReleaseKernel(kernel[0]);
clReleaseKernel(kernel[1]);
clReleaseKernel(kernel[2]);
clReleaseEvent(sync_event);
clReleaseEvent(read_event);
clReleaseProgram(program);
print_error(err, " clCreateBuffer failed\n" );
return -1;
}
pipe = clCreatePipe(context, CL_MEM_HOST_NO_ACCESS, sizeof(int), max_active_reservations, NULL, &err);
if(err){
clReleaseMemObject(buf_status);
clReleaseMemObject(buf_reserve_id_t_size);
clReleaseMemObject(buf_reserve_id_t_size_aligned);
clReleaseMemObject(pipe);
clReleaseMemObject(buffers[0]);
clReleaseMemObject(buffers[1]);
align_free(outptr);
clReleaseKernel(kernel[0]);
clReleaseKernel(kernel[1]);
clReleaseKernel(kernel[2]);
clReleaseEvent(sync_event);
clReleaseEvent(read_event);
clReleaseProgram(program);
print_error(err, " clCreatePipe failed\n");
return -1;
}
// Global buffer to hold all active reservation ids
buf_reservations = clCreateBuffer(context, CL_MEM_HOST_NO_ACCESS, reserve_id_t_size*max_active_reservations, NULL, &err);
if ( err != CL_SUCCESS ){
print_error( err, " clCreateBuffer failed" );
clReleaseMemObject(buf_status);
clReleaseMemObject(buf_reserve_id_t_size);
clReleaseMemObject(buf_reserve_id_t_size_aligned);
clReleaseMemObject(buf_reservations);
clReleaseMemObject(pipe);
clReleaseMemObject(buffers[0]);
clReleaseMemObject(buffers[1]);
align_free(outptr);
clReleaseKernel(kernel[0]);
clReleaseKernel(kernel[1]);
clReleaseKernel(kernel[2]);
clReleaseEvent(sync_event);
clReleaseEvent(read_event);
clReleaseProgram(program);
return -1;
}
err = clSetKernelArg(kernel[0], 0, sizeof(cl_mem), (void*)&buffers[0]);
err |= clSetKernelArg(kernel[0], 1, sizeof(cl_mem), (void*)&pipe);
err |= clSetKernelArg(kernel[0], 2, sizeof(cl_mem), (void*)&buf_reservations);
err |= clSetKernelArg(kernel[0], 3, sizeof(cl_mem), (void*)&buf_reserve_id_t_size_aligned);
err |= clSetKernelArg(kernel[0], 4, sizeof(cl_mem), (void*)&buf_status);
if ( err != CL_SUCCESS ){
clReleaseMemObject(buf_status);
clReleaseMemObject(buf_reserve_id_t_size);
clReleaseMemObject(buf_reserve_id_t_size_aligned);
clReleaseMemObject(buf_reservations);
clReleaseMemObject(pipe);
clReleaseMemObject(buffers[0]);
clReleaseMemObject(buffers[1]);
align_free(outptr);
clReleaseKernel(kernel[0]);
clReleaseKernel(kernel[1]);
clReleaseKernel(kernel[2]);
clReleaseProgram(program);
print_error(err, " clSetKernelArg failed");
return -1;
}
err = clSetKernelArg(kernel[1], 0, sizeof(cl_mem), (void*)&pipe);
err |= clSetKernelArg(kernel[1], 1, sizeof(cl_mem), (void*)&buffers[1]);
err |= clSetKernelArg(kernel[1], 2, sizeof(cl_mem), (void*)&buf_reservations);
err |= clSetKernelArg(kernel[1], 3, sizeof(cl_mem), (void*)&buf_reserve_id_t_size_aligned);
err |= clSetKernelArg(kernel[1], 4, sizeof(cl_mem), (void*)&buf_status);
if ( err != CL_SUCCESS ){
clReleaseMemObject(buf_status);
clReleaseMemObject(buf_reserve_id_t_size);
clReleaseMemObject(buf_reserve_id_t_size_aligned);
clReleaseMemObject(buf_reservations);
clReleaseMemObject(pipe);
clReleaseMemObject(buffers[0]);
clReleaseMemObject(buffers[1]);
align_free(outptr);
clReleaseKernel(kernel[0]);
clReleaseKernel(kernel[1]);
clReleaseKernel(kernel[2]);
clReleaseProgram(program);
print_error(err, " clSetKernelArg failed");
return -1;
}
// Launch Producer kernel
err = clEnqueueNDRangeKernel(queue, kernel[0], 1, NULL, global_work_size, NULL, 0, NULL, &sync_event);
if ( err != CL_SUCCESS ){
print_error( err, " clEnqueueNDRangeKernel failed" );
clReleaseMemObject(buf_status);
clReleaseMemObject(buf_reserve_id_t_size);
clReleaseMemObject(buf_reserve_id_t_size_aligned);
clReleaseMemObject(buf_reservations);
clReleaseMemObject(pipe);
clReleaseMemObject(buffers[0]);
clReleaseMemObject(buffers[1]);
align_free(outptr);
clReleaseKernel(kernel[0]);
clReleaseKernel(kernel[1]);
clReleaseKernel(kernel[2]);
clReleaseEvent(sync_event);
clReleaseProgram(program);
return -1;
}
err = clEnqueueReadBuffer(queue, buf_status, true, 0, sizeof(int), &status, 1, &sync_event, NULL);
if ( err != CL_SUCCESS ){
print_error( err, " clEnqueueReadBuffer failed" );
clReleaseMemObject(buf_status);
clReleaseMemObject(buf_reserve_id_t_size);
clReleaseMemObject(buf_reserve_id_t_size_aligned);
clReleaseMemObject(buf_reservations);
clReleaseMemObject(pipe);
clReleaseMemObject(buffers[0]);
clReleaseMemObject(buffers[1]);
align_free(outptr);
clReleaseKernel(kernel[0]);
clReleaseKernel(kernel[1]);
clReleaseKernel(kernel[2]);
clReleaseEvent(sync_event);
clReleaseProgram(program);
return -1;
}
if(status != 0)
{
log_error("test_pipe_max_active_reservations failed\n");
clReleaseMemObject(buf_status);
clReleaseMemObject(buf_reserve_id_t_size);
clReleaseMemObject(buf_reserve_id_t_size_aligned);
clReleaseMemObject(buf_reservations);
clReleaseMemObject(pipe);
clReleaseMemObject(buffers[0]);
clReleaseMemObject(buffers[1]);
align_free(outptr);
clReleaseKernel(kernel[0]);
clReleaseKernel(kernel[1]);
clReleaseEvent(sync_event);
clReleaseProgram(program);
return -1;
}
// Launch Consumer kernel
err = clEnqueueNDRangeKernel(queue, kernel[1], 1, NULL, global_work_size, NULL, 0, NULL, &sync_event);
if ( err != CL_SUCCESS ){
print_error( err, " clEnqueueNDRangeKernel failed" );
clReleaseMemObject(buf_status);
clReleaseMemObject(buf_reserve_id_t_size);
clReleaseMemObject(buf_reserve_id_t_size_aligned);
clReleaseMemObject(buf_reservations);
clReleaseMemObject(pipe);
clReleaseMemObject(buffers[0]);
clReleaseMemObject(buffers[1]);
align_free(outptr);
clReleaseKernel(kernel[0]);
clReleaseKernel(kernel[1]);
clReleaseKernel(kernel[2]);
clReleaseEvent(sync_event);
clReleaseProgram(program);
return -1;
}
err = clEnqueueReadBuffer(queue, buf_status, true, 0, sizeof(int), &status, 1, &sync_event, NULL);
if ( err != CL_SUCCESS ){
print_error( err, " clEnqueueReadBuffer failed" );
clReleaseMemObject(buf_status);
clReleaseMemObject(buf_reserve_id_t_size);
clReleaseMemObject(buf_reserve_id_t_size_aligned);
clReleaseMemObject(buf_reservations);
clReleaseMemObject(pipe);
clReleaseMemObject(buffers[0]);
clReleaseMemObject(buffers[1]);
align_free(outptr);
clReleaseKernel(kernel[0]);
clReleaseKernel(kernel[1]);
clReleaseKernel(kernel[2]);
clReleaseEvent(sync_event);
clReleaseProgram(program);
return -1;
}
if(status != 0)
{
log_error("test_pipe_max_active_reservations failed\n");
clReleaseMemObject(buf_status);
clReleaseMemObject(buf_reserve_id_t_size);
clReleaseMemObject(buf_reserve_id_t_size_aligned);
clReleaseMemObject(buf_reservations);
clReleaseMemObject(pipe);
clReleaseMemObject(buffers[0]);
clReleaseMemObject(buffers[1]);
align_free(outptr);
clReleaseKernel(kernel[0]);
clReleaseKernel(kernel[1]);
clReleaseEvent(sync_event);
clReleaseProgram(program);
return -1;
}
err = clEnqueueReadBuffer(queue, buffers[1], true, 0, size, outptr, 1, &sync_event, NULL);
if ( err != CL_SUCCESS ){
print_error( err, " clEnqueueReadBuffer failed" );
clReleaseMemObject(buf_status);
clReleaseMemObject(buf_reserve_id_t_size);
clReleaseMemObject(buf_reserve_id_t_size_aligned);
clReleaseMemObject(buf_reservations);
clReleaseMemObject(pipe);
clReleaseMemObject(buffers[0]);
clReleaseMemObject(buffers[1]);
align_free(outptr);
clReleaseKernel(kernel[0]);
clReleaseKernel(kernel[1]);
clReleaseKernel(kernel[2]);
clReleaseEvent(sync_event);
clReleaseProgram(program);
return -1;
}
if( verify_result_int( inptr, outptr, max_active_reservations)){
log_error("test_pipe_max_active_reservations failed\n");
clReleaseMemObject(buf_status);
clReleaseMemObject(buf_reserve_id_t_size);
clReleaseMemObject(buf_reserve_id_t_size_aligned);
clReleaseMemObject(buf_reservations);
clReleaseMemObject(pipe);
clReleaseMemObject(buffers[0]);
clReleaseMemObject(buffers[1]);
align_free(outptr);
clReleaseKernel(kernel[0]);
clReleaseKernel(kernel[1]);
clReleaseKernel(kernel[2]);
clReleaseEvent(sync_event);
clReleaseProgram(program);
return -1;
}
else {
log_info("test_pipe_max_active_reservations passed\n");
}
//cleanup
clReleaseMemObject(buf_status);
clReleaseMemObject(buf_reserve_id_t_size);
clReleaseMemObject(buf_reserve_id_t_size_aligned);
clReleaseMemObject(buf_reservations);
clReleaseMemObject(pipe);
clReleaseMemObject(buffers[0]);
clReleaseMemObject(buffers[1]);
align_free(outptr);
clReleaseKernel(kernel[0]);
clReleaseKernel(kernel[1]);
clReleaseEvent(sync_event);
clReleaseProgram(program);
return 0;
}