aboutsummaryrefslogtreecommitdiff
path: root/test_conformance/basic/test_vec_type_hint.cpp
blob: 33168b1369c57e7c33b64368fb65266559a9aa4b (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
//
// Copyright (c) 2017 The Khronos Group Inc.
// 
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//    http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
//
#include "harness/compat.h"

#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <sys/types.h>
#include <sys/stat.h>


#include "procs.h"
#include "harness/conversions.h"
#include "harness/typeWrappers.h"


// printf-style template for the OpenCL C kernel built by this test.
// Format arguments, in order:
//   1st %s - optional "#pragma OPENCL EXTENSION ..." line (may be empty)
//   2nd %s - scalar type name placed inside vec_type_hint(...)
//   3rd %s - vector width suffix appended to the type name ("" for scalar)
// The kernel body copies one int per work-item from src to dst.
static const char *sample_kernel =
    "%s\n"
    "__kernel __attribute__((vec_type_hint(%s%s))) "
    "void sample_test(__global int *src, __global int *dst)\n"
    "{\n"
    "    int  tid = get_global_id(0);\n"
    "     dst[tid] = src[tid];\n"
    "\n"
    "}\n";

// Checks that a kernel declared with __attribute__((vec_type_hint(<type>)))
// builds and executes for every scalar type in vecType combined with every
// vector width suffix in size_names.
//
// double is skipped when the device does not report cl_khr_fp64, and
// long/ulong are skipped when gHasLong is false.
//
// Parameters:
//   deviceID     - device queried for extension support
//   context      - context used to build programs and create buffers
//   queue        - command queue the kernels are enqueued on
//   num_elements - unused by this test
//
// Returns 0 when every combination passes, otherwise a non-zero error code
// from the first failing step.
int test_vec_type_hint(cl_device_id deviceID, cl_context context, cl_command_queue queue, int num_elements)
{
    int error;

    const ExplicitType vecType[] = { kChar, kUChar, kShort, kUShort, kInt, kUInt, kLong, kULong, kFloat, kDouble };
    const char *size_names[] = { "", "2", "4", "8", "16" };
    const size_t num_types = sizeof(vecType) / sizeof(vecType[0]);
    const size_t num_sizes = sizeof(size_names) / sizeof(size_names[0]);

    // The generated source is only a few hundred bytes, so a fixed-size stack
    // buffer is sufficient. Unlike a heap allocation it cannot fail and cannot
    // leak on the early returns below (the explicit ones, and presumably those
    // performed by the harness test_error macro on failure).
    char program_source[4096];
    const char *program_source_ptr = program_source;

    for (size_t vec_type_index = 0; vec_type_index < num_types; vec_type_index++) {
        const ExplicitType type = vecType[vec_type_index];

        if (type == kDouble) {
            if (!is_extension_available(deviceID, "cl_khr_fp64")) {
                log_info("Extension cl_khr_fp64 not supported; skipping double tests.\n");
                continue;
            }
            log_info("Testing doubles.\n");
        }

        if (type == kLong || type == kULong) {
            if (!gHasLong) {
                log_info("Extension cl_khr_int64 not supported; skipping long tests.\n");
                continue;
            }
        }

        for (size_t vec_size_index = 0; vec_size_index < num_sizes; vec_size_index++) {
            // Declared inside the loop so each iteration gets fresh wrapper
            // objects for its own program, kernel and buffers.
            clProgramWrapper program;
            clKernelWrapper kernel;
            clMemWrapper in, out;
            size_t global[] = { 1, 1, 1 };

            log_info("Testing __attribute__((vec_type_hint(%s%s)))...\n", get_explicit_type_name(type), size_names[vec_size_index]);

            // Double kernels need the fp64 pragma; other types get an empty
            // first line.
            int written = snprintf(program_source, sizeof(program_source), sample_kernel,
                                   (type == kDouble) ? "#pragma OPENCL EXTENSION cl_khr_fp64 : enable" : "",
                                   get_explicit_type_name(type), size_names[vec_size_index]);
            if (written < 0 || (size_t)written >= sizeof(program_source)) {
                log_info("ERROR: kernel source does not fit in the program source buffer.\n");
                return -1;
            }

            error = create_single_kernel_helper( context, &program, &kernel, 1, &program_source_ptr, "sample_test" );
            if( error != 0 )
                return error;

            in = clCreateBuffer(context, CL_MEM_READ_ONLY, sizeof(cl_int)*10, NULL, &error);
            test_error(error, "clCreateBuffer failed");
            out = clCreateBuffer(context, CL_MEM_WRITE_ONLY, sizeof(cl_int)*10, NULL, &error);
            test_error(error, "clCreateBuffer failed");

            error = clSetKernelArg(kernel, 0, sizeof(in), &in);
            test_error(error, "clSetKernelArg failed");
            error = clSetKernelArg(kernel, 1, sizeof(out), &out);
            test_error(error, "clSetKernelArg failed");

            // A single work-item in a 3-dimensional range; the results are not
            // read back, only the build/enqueue/finish status is checked.
            error = clEnqueueNDRangeKernel(queue, kernel, 3, NULL, global, NULL, 0, NULL, NULL);
            test_error(error, "clEnqueueNDRangeKernel failed");

            error = clFinish(queue);
            test_error(error, "clFinish failed");
        }
    }

    return 0;
}