aboutsummaryrefslogtreecommitdiff
path: root/test_conformance/SVM/test_shared_address_space_fine_grain.cpp
blob: a98a880c7d57fbedfc137390aa7ce789c26ec963 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
//
// Copyright (c) 2017 The Khronos Group Inc.
// 
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//    http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
//
#include "common.h"


// This tests that all devices and the host share a common address space using fine-grain mode with no buffers.
// This is done by creating a linked list on a device and then verifying the correctness of the list
// on another device or the host.  This basic test is performed for all combinations of devices and the host that exist within
// the platform.  The test passes only if every combination passes.
int test_svm_shared_address_space_fine_grain(cl_device_id deviceID, cl_context context2, cl_command_queue queue, int num_elements)
{
  clContextWrapper    context = NULL;
  clProgramWrapper    program = NULL;
  cl_uint     num_devices = 0;
  cl_int      error = CL_SUCCESS;
  clCommandQueueWrapper queues[MAXQ];

  error = create_cl_objects(deviceID, &linked_list_create_and_verify_kernels[0], &context, &program, &queues[0], &num_devices, CL_DEVICE_SVM_FINE_GRAIN_SYSTEM);
  if(error == 1) return 0; // no devices capable of requested SVM level, so don't execute but count test as passing.
  if(error < 0) return -1; // fail test.

  size_t numLists =  num_elements;
  cl_int ListLength = 32;

  clKernelWrapper kernel_create_lists = clCreateKernel(program, "create_linked_lists", &error);
  test_error(error, "clCreateKernel failed");

  clKernelWrapper kernel_verify_lists = clCreateKernel(program, "verify_linked_lists", &error);
  test_error(error, "clCreateKernel failed");

  // this allocation holds the linked list nodes.
  // FIXME: remove the alignment once prototype can handle it
  Node* pNodes = (Node*) align_malloc(numLists*ListLength*sizeof(Node),128);
  test_error2(error, pNodes, "malloc failed");

  // this allocation holds an index into the nodes buffer, it is used for node allocation
  size_t* pAllocator = (size_t*) align_malloc(sizeof(cl_int), 128);
  test_error2(error, pAllocator, "malloc failed");

  // this allocation holds the count of correct nodes, which is computed by the verify kernel.
  cl_int* pNum_correct = (cl_int*) align_malloc(sizeof(cl_int), 128);
  test_error2(error, pNum_correct, "malloc failed");


  error |= clSetKernelArgSVMPointer(kernel_create_lists, 0, pNodes);
  error |= clSetKernelArgSVMPointer(kernel_create_lists, 1, pAllocator);
  error |= clSetKernelArg(kernel_create_lists, 2, sizeof(cl_int),(void *) &ListLength);

  error |= clSetKernelArgSVMPointer(kernel_verify_lists, 0, pNodes);
  error |= clSetKernelArgSVMPointer(kernel_verify_lists, 1, pNum_correct);
  error |= clSetKernelArg(kernel_verify_lists, 2, sizeof(cl_int),   (void *) &ListLength);
  test_error(error, "clSetKernelArg failed");

  // Create linked list on one device and verify on another device (or the host).
  // Do this for all possible combinations of devices and host within the platform.
  for (int ci=0; ci<(int)num_devices+1; ci++)  // ci is CreationIndex, index of device/q to create linked list on
  {
    for (int vi=0; vi<(int)num_devices+1; vi++)  // vi is VerificationIndex, index of device/q to verify linked list on
    {
      if(ci == num_devices) // last device index represents the host, note the num_device+1 above.
      {
        log_info("creating linked list on host ");
        create_linked_lists(pNodes, numLists, ListLength);
      }
      else
      {
        error = create_linked_lists_on_device_no_map(ci, queues[ci], pAllocator, kernel_create_lists, numLists);
        if(error) return -1;
      }

      if(vi == num_devices)
      {
        error = verify_linked_lists(pNodes, numLists, ListLength);
        if(error) return -1;
      }
      else
      {
        error = verify_linked_lists_on_device_no_map(vi, queues[vi], pNum_correct, kernel_verify_lists, ListLength, numLists);
        if(error) return -1;
      }
    }
  }

  align_free(pNodes);
  align_free(pAllocator);
  align_free(pNum_correct);
  return 0;
}