test_conformance/basic/test_work_item_functions.cpp - external/github.com/KhronosGroup/OpenCL-CTS - Git at Google

 //
 // Copyright (c) 2017 The Khronos Group Inc.
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //    http://www.apache.org/licenses/LICENSE-2.0
 //
 // Unless required by applicable law or agreed to in writing, software
 // distributed under the License is distributed on an "AS IS" BASIS,
 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 // See the License for the specific language governing permissions and
 // limitations under the License.
 //
 #include "harness/compat.h"

 #include <stdio.h>
 #include <stdlib.h>
 #include <string.h>
 #include <sys/types.h>
 #include <sys/stat.h>


 #include "procs.h"
 #include "harness/conversions.h"
 #include "harness/typeWrappers.h"

 struct work_item_data
 {
     cl_uint workDim;
     cl_uint globalSize[ 3 ];
     cl_uint globalID[ 3 ];
     cl_uint localSize[ 3 ];
     cl_uint localID[ 3 ];
     cl_uint numGroups[ 3 ];
     cl_uint groupID[ 3 ];
 };

 static const char *workItemKernelCode =
 "typedef struct {\n"
 "    uint workDim;\n"
 "    uint globalSize[ 3 ];\n"
 "    uint globalID[ 3 ];\n"
 "    uint localSize[ 3 ];\n"
 "    uint localID[ 3 ];\n"
 "    uint numGroups[ 3 ];\n"
 "    uint groupID[ 3 ];\n"
 " } work_item_data;\n"
 "\n"
 "__kernel void sample_kernel( __global work_item_data *outData )\n"
 "{\n"
 "    int id = get_global_id(0);\n"
 "   outData[ id ].workDim = (uint)get_work_dim();\n"
 "    for( uint i = 0; i < get_work_dim(); i++ )\n"
 "   {\n"
 "       outData[ id ].globalSize[ i ] = (uint)get_global_size( i );\n"
 "       outData[ id ].globalID[ i ] = (uint)get_global_id( i );\n"
 "       outData[ id ].localSize[ i ] = (uint)get_local_size( i );\n"
 "       outData[ id ].localID[ i ] = (uint)get_local_id( i );\n"
 "       outData[ id ].numGroups[ i ] = (uint)get_num_groups( i );\n"
 "       outData[ id ].groupID[ i ] = (uint)get_group_id( i );\n"
 "   }\n"
 "}";

 #define NUM_TESTS 1

 int test_work_item_functions(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements)
 {
     int error;

     clProgramWrapper program;
     clKernelWrapper kernel;
     clMemWrapper outData;
     work_item_data    testData[ 10240 ];
     size_t threads[3], localThreads[3];
     MTdata d;


     error = create_single_kernel_helper( context, &program, &kernel, 1, &workItemKernelCode, "sample_kernel" );
     test_error( error, "Unable to create testing kernel" );

     outData = clCreateBuffer( context, CL_MEM_READ_WRITE, sizeof( testData ), NULL, &error );
     test_error( error, "Unable to create output buffer" );

     error = clSetKernelArg( kernel, 0, sizeof( outData ), &outData );
     test_error( error, "Unable to set kernel arg" );

     d = init_genrand( gRandomSeed );
     for( size_t dim = 1; dim <= 3; dim++ )
     {
         for( int i = 0; i < NUM_TESTS; i++  )
         {
             size_t numItems = 1;
             for( size_t j = 0; j < dim; j++ )
             {
                 // All of our thread sizes should be within the max local sizes, since they're all <= 20
                 threads[ j ] = (size_t)random_in_range( 1, 20, d );
                 localThreads[ j ] = threads[ j ] / (size_t)random_in_range( 1, (int)threads[ j ], d );
                 while( localThreads[ j ] > 1 && ( threads[ j ] % localThreads[ j ] != 0 ) )
                     localThreads[ j ]--;

                 numItems *= threads[ j ];

                 // Hack for now: localThreads > 1 are iffy
                 localThreads[ j ] = 1;
             }
             error = clEnqueueNDRangeKernel( queue, kernel, (cl_uint)dim, NULL, threads, localThreads, 0, NULL, NULL );
             test_error( error, "Unable to run kernel" );

             error = clEnqueueReadBuffer( queue, outData, CL_TRUE, 0, sizeof( testData ), testData, 0, NULL, NULL );
             test_error( error, "Unable to read results" );

             // Validate
             for( size_t q = 0; q < threads[0]; q++ )
             {
                 // We can't really validate the actual value of each one, but we can validate that they're within a sane range
                 if( testData[ q ].workDim != (cl_uint)dim )
                 {
                     log_error( "ERROR: get_work_dim() did not return proper value for %d dimensions (expected %d, got %d)\n", (int)dim, (int)dim, (int)testData[ q ].workDim );
                     free_mtdata(d);
                     return -1;
                 }
                 for( size_t j = 0; j < dim; j++ )
                 {
                     if( testData[ q ].globalSize[ j ] != (cl_uint)threads[ j ] )
                     {
                         log_error( "ERROR: get_global_size(%d) did not return proper value for %d dimensions (expected %d, got %d)\n",
                                     (int)j, (int)dim, (int)threads[ j ], (int)testData[ q ].globalSize[ j ] );
                         free_mtdata(d);
                         return -1;
                     }
                     if (testData[q].globalID[j] >= (cl_uint)threads[j])
                     {
                         log_error( "ERROR: get_global_id(%d) did not return proper value for %d dimensions (max %d, got %d)\n",
                                   (int)j, (int)dim, (int)threads[ j ], (int)testData[ q ].globalID[ j ] );
                         free_mtdata(d);
                         return -1;
                     }
                     if( testData[ q ].localSize[ j ] != (cl_uint)localThreads[ j ] )
                     {
                         log_error( "ERROR: get_local_size(%d) did not return proper value for %d dimensions (expected %d, got %d)\n",
                                   (int)j, (int)dim, (int)localThreads[ j ], (int)testData[ q ].localSize[ j ] );
                         free_mtdata(d);
                         return -1;
                     }
                     if (testData[q].localID[j] >= (cl_uint)localThreads[j])
                     {
                         log_error( "ERROR: get_local_id(%d) did not return proper value for %d dimensions (max %d, got %d)\n",
                                   (int)j, (int)dim, (int)localThreads[ j ], (int)testData[ q ].localID[ j ] );
                         free_mtdata(d);
                         return -1;
                     }
                     size_t groupCount = ( threads[ j ] + localThreads[ j ] - 1 ) / localThreads[ j ];
                     if( testData[ q ].numGroups[ j ] != (cl_uint)groupCount )
                     {
                         log_error( "ERROR: get_num_groups(%d) did not return proper value for %d dimensions (expected %d with global dim %d and local dim %d, got %d)\n",
                                   (int)j, (int)dim, (int)groupCount, (int)threads[ j ], (int)localThreads[ j ], (int)testData[ q ].numGroups[ j ] );
                         free_mtdata(d);
                         return -1;
                     }
                     if (testData[q].groupID[j] >= (cl_uint)groupCount)
                     {
                         log_error( "ERROR: get_group_id(%d) did not return proper value for %d dimensions (max %d, got %d)\n",
                                   (int)j, (int)dim, (int)groupCount, (int)testData[ q ].groupID[ j ] );
                         free_mtdata(d);
                         return -1;
                     }
                 }
             }
         }
     }

     free_mtdata(d);
     return 0;
 }
	//
	// Copyright (c) 2017 The Khronos Group Inc.
	//
	// Licensed under the Apache License, Version 2.0 (the "License");
	// you may not use this file except in compliance with the License.
	// You may obtain a copy of the License at
	//
	// http://www.apache.org/licenses/LICENSE-2.0
	//
	// Unless required by applicable law or agreed to in writing, software
	// distributed under the License is distributed on an "AS IS" BASIS,
	// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	// See the License for the specific language governing permissions and
	// limitations under the License.
	//
	#include "harness/compat.h"

	#include <stdio.h>
	#include <stdlib.h>
	#include <string.h>
	#include <sys/types.h>
	#include <sys/stat.h>


	#include "procs.h"
	#include "harness/conversions.h"
	#include "harness/typeWrappers.h"

	struct work_item_data
	{
	cl_uint workDim;
	cl_uint globalSize[ 3 ];
	cl_uint globalID[ 3 ];
	cl_uint localSize[ 3 ];
	cl_uint localID[ 3 ];
	cl_uint numGroups[ 3 ];
	cl_uint groupID[ 3 ];
	};

	static const char *workItemKernelCode =
	"typedef struct {\n"
	" uint workDim;\n"
	" uint globalSize[ 3 ];\n"
	" uint globalID[ 3 ];\n"
	" uint localSize[ 3 ];\n"
	" uint localID[ 3 ];\n"
	" uint numGroups[ 3 ];\n"
	" uint groupID[ 3 ];\n"
	" } work_item_data;\n"
	"\n"
	"__kernel void sample_kernel( __global work_item_data *outData )\n"
	"{\n"
	" int id = get_global_id(0);\n"
	" outData[ id ].workDim = (uint)get_work_dim();\n"
	" for( uint i = 0; i < get_work_dim(); i++ )\n"
	" {\n"
	" outData[ id ].globalSize[ i ] = (uint)get_global_size( i );\n"
	" outData[ id ].globalID[ i ] = (uint)get_global_id( i );\n"
	" outData[ id ].localSize[ i ] = (uint)get_local_size( i );\n"
	" outData[ id ].localID[ i ] = (uint)get_local_id( i );\n"
	" outData[ id ].numGroups[ i ] = (uint)get_num_groups( i );\n"
	" outData[ id ].groupID[ i ] = (uint)get_group_id( i );\n"
	" }\n"
	"}";

	#define NUM_TESTS 1

	int test_work_item_functions(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements)
	{
	int error;

	clProgramWrapper program;
	clKernelWrapper kernel;
	clMemWrapper outData;
	work_item_data testData[ 10240 ];
	size_t threads[3], localThreads[3];
	MTdata d;


	error = create_single_kernel_helper( context, &program, &kernel, 1, &workItemKernelCode, "sample_kernel" );
	test_error( error, "Unable to create testing kernel" );

	outData = clCreateBuffer( context, CL_MEM_READ_WRITE, sizeof( testData ), NULL, &error );
	test_error( error, "Unable to create output buffer" );

	error = clSetKernelArg( kernel, 0, sizeof( outData ), &outData );
	test_error( error, "Unable to set kernel arg" );

	d = init_genrand( gRandomSeed );
	for( size_t dim = 1; dim <= 3; dim++ )
	{
	for( int i = 0; i < NUM_TESTS; i++ )
	{
	size_t numItems = 1;
	for( size_t j = 0; j < dim; j++ )
	{
	// All of our thread sizes should be within the max local sizes, since they're all <= 20
	threads[ j ] = (size_t)random_in_range( 1, 20, d );
	localThreads[ j ] = threads[ j ] / (size_t)random_in_range( 1, (int)threads[ j ], d );
	while( localThreads[ j ] > 1 && ( threads[ j ] % localThreads[ j ] != 0 ) )
	localThreads[ j ]--;

	numItems *= threads[ j ];

	// Hack for now: localThreads > 1 are iffy
	localThreads[ j ] = 1;
	}
	error = clEnqueueNDRangeKernel( queue, kernel, (cl_uint)dim, NULL, threads, localThreads, 0, NULL, NULL );
	test_error( error, "Unable to run kernel" );

	error = clEnqueueReadBuffer( queue, outData, CL_TRUE, 0, sizeof( testData ), testData, 0, NULL, NULL );
	test_error( error, "Unable to read results" );

	// Validate
	for( size_t q = 0; q < threads[0]; q++ )
	{
	// We can't really validate the actual value of each one, but we can validate that they're within a sane range
	if( testData[ q ].workDim != (cl_uint)dim )
	{
	log_error( "ERROR: get_work_dim() did not return proper value for %d dimensions (expected %d, got %d)\n", (int)dim, (int)dim, (int)testData[ q ].workDim );
	free_mtdata(d);
	return -1;
	}
	for( size_t j = 0; j < dim; j++ )
	{
	if( testData[ q ].globalSize[ j ] != (cl_uint)threads[ j ] )
	{
	log_error( "ERROR: get_global_size(%d) did not return proper value for %d dimensions (expected %d, got %d)\n",
	(int)j, (int)dim, (int)threads[ j ], (int)testData[ q ].globalSize[ j ] );
	free_mtdata(d);
	return -1;
	}
	if (testData[q].globalID[j] >= (cl_uint)threads[j])
	{
	log_error( "ERROR: get_global_id(%d) did not return proper value for %d dimensions (max %d, got %d)\n",
	(int)j, (int)dim, (int)threads[ j ], (int)testData[ q ].globalID[ j ] );
	free_mtdata(d);
	return -1;
	}
	if( testData[ q ].localSize[ j ] != (cl_uint)localThreads[ j ] )
	{
	log_error( "ERROR: get_local_size(%d) did not return proper value for %d dimensions (expected %d, got %d)\n",
	(int)j, (int)dim, (int)localThreads[ j ], (int)testData[ q ].localSize[ j ] );
	free_mtdata(d);
	return -1;
	}
	if (testData[q].localID[j] >= (cl_uint)localThreads[j])
	{
	log_error( "ERROR: get_local_id(%d) did not return proper value for %d dimensions (max %d, got %d)\n",
	(int)j, (int)dim, (int)localThreads[ j ], (int)testData[ q ].localID[ j ] );
	free_mtdata(d);
	return -1;
	}
	size_t groupCount = ( threads[ j ] + localThreads[ j ] - 1 ) / localThreads[ j ];
	if( testData[ q ].numGroups[ j ] != (cl_uint)groupCount )
	{
	log_error( "ERROR: get_num_groups(%d) did not return proper value for %d dimensions (expected %d with global dim %d and local dim %d, got %d)\n",
	(int)j, (int)dim, (int)groupCount, (int)threads[ j ], (int)localThreads[ j ], (int)testData[ q ].numGroups[ j ] );
	free_mtdata(d);
	return -1;
	}
	if (testData[q].groupID[j] >= (cl_uint)groupCount)
	{
	log_error( "ERROR: get_group_id(%d) did not return proper value for %d dimensions (max %d, got %d)\n",
	(int)j, (int)dim, (int)groupCount, (int)testData[ q ].groupID[ j ] );
	free_mtdata(d);
	return -1;
	}
	}
	}
	}
	}

	free_mtdata(d);
	return 0;
	}