Hardware Locality (hwloc)  1.11.8
opencl.h
1 /*
2  * Copyright © 2012-2017 Inria. All rights reserved.
3  * Copyright © 2013 Université Bordeaux. All rights reserved.
4  * See COPYING in top-level directory.
5  */
6 
14 #ifndef HWLOC_OPENCL_H
15 #define HWLOC_OPENCL_H
16 
17 #include <hwloc.h>
18 #include <hwloc/autogen/config.h>
19 #include <hwloc/helper.h>
20 #ifdef HWLOC_LINUX_SYS
21 #include <hwloc/linux.h>
22 #endif
23 
24 #include <CL/cl.h>
25 #include <CL/cl_ext.h>
26 
27 #include <stdio.h>
28 
29 
30 #ifdef __cplusplus
31 extern "C" {
32 #endif
33 
34 
63 static __hwloc_inline int
64 hwloc_opencl_get_device_cpuset(hwloc_topology_t topology __hwloc_attribute_unused,
65  cl_device_id device __hwloc_attribute_unused,
66  hwloc_cpuset_t set)
67 {
68 #if (defined HWLOC_LINUX_SYS) && (defined CL_DEVICE_TOPOLOGY_AMD)
69  /* If we're on Linux + AMD OpenCL, use the AMD extension + the sysfs mechanism to get the local cpus */
70 #define HWLOC_OPENCL_DEVICE_SYSFS_PATH_MAX 128
71  char path[HWLOC_OPENCL_DEVICE_SYSFS_PATH_MAX];
72  FILE *sysfile = NULL;
73  cl_device_topology_amd amdtopo;
74  cl_int clret;
75 
76  if (!hwloc_topology_is_thissystem(topology)) {
77  errno = EINVAL;
78  return -1;
79  }
80 
81  clret = clGetDeviceInfo(device, CL_DEVICE_TOPOLOGY_AMD, sizeof(amdtopo), &amdtopo, NULL);
82  if (CL_SUCCESS != clret) {
84  return 0;
85  }
86  if (CL_DEVICE_TOPOLOGY_TYPE_PCIE_AMD != amdtopo.raw.type) {
88  return 0;
89  }
90 
91  sprintf(path, "/sys/bus/pci/devices/0000:%02x:%02x.%01x/local_cpus",
92  (unsigned) amdtopo.pcie.bus, (unsigned) amdtopo.pcie.device, (unsigned) amdtopo.pcie.function);
93  sysfile = fopen(path, "r");
94  if (!sysfile)
95  return -1;
96 
97  if (hwloc_linux_parse_cpumap_file(sysfile, set) < 0
98  || hwloc_bitmap_iszero(set))
100 
101  fclose(sysfile);
102 #else
103  /* Non-Linux + AMD OpenCL systems simply get a full cpuset */
105 #endif
106  return 0;
107 }
108 
124 static __hwloc_inline hwloc_obj_t
126  unsigned platform_index, unsigned device_index)
127 {
128  unsigned x = (unsigned) -1, y = (unsigned) -1;
129  hwloc_obj_t osdev = NULL;
130  while ((osdev = hwloc_get_next_osdev(topology, osdev)) != NULL) {
131  if (HWLOC_OBJ_OSDEV_COPROC == osdev->attr->osdev.type
132  && osdev->name
133  && sscanf(osdev->name, "opencl%ud%u", &x, &y) == 2
134  && platform_index == x && device_index == y)
135  return osdev;
136  }
137  return NULL;
138 }
139 
153 static __hwloc_inline hwloc_obj_t
154 hwloc_opencl_get_device_osdev(hwloc_topology_t topology __hwloc_attribute_unused,
155  cl_device_id device __hwloc_attribute_unused)
156 {
157 #ifdef CL_DEVICE_TOPOLOGY_AMD
158  hwloc_obj_t osdev;
159  cl_device_topology_amd amdtopo;
160  cl_int clret;
161 
162  clret = clGetDeviceInfo(device, CL_DEVICE_TOPOLOGY_AMD, sizeof(amdtopo), &amdtopo, NULL);
163  if (CL_SUCCESS != clret) {
164  errno = EINVAL;
165  return NULL;
166  }
167  if (CL_DEVICE_TOPOLOGY_TYPE_PCIE_AMD != amdtopo.raw.type) {
168  errno = EINVAL;
169  return NULL;
170  }
171 
172  osdev = NULL;
173  while ((osdev = hwloc_get_next_osdev(topology, osdev)) != NULL) {
174  hwloc_obj_t pcidev = osdev->parent;
175  if (strncmp(osdev->name, "opencl", 6))
176  continue;
177  if (pcidev
178  && pcidev->type == HWLOC_OBJ_PCI_DEVICE
179  && pcidev->attr->pcidev.domain == 0
180  && pcidev->attr->pcidev.bus == amdtopo.pcie.bus
181  && pcidev->attr->pcidev.dev == amdtopo.pcie.device
182  && pcidev->attr->pcidev.func == amdtopo.pcie.function)
183  return osdev;
184  }
185 
186  return NULL;
187 #else
188  return NULL;
189 #endif
190 }
191 
195 #ifdef __cplusplus
196 } /* extern "C" */
197 #endif
198 
199 
200 #endif /* HWLOC_OPENCL_H */
static hwloc_obj_t hwloc_opencl_get_device_osdev_by_index(hwloc_topology_t topology, unsigned platform_index, unsigned device_index)
Get the hwloc OS device object corresponding to the OpenCL device for the given indexes.
Definition: opencl.h:125
static int hwloc_opencl_get_device_cpuset(hwloc_topology_t topology, cl_device_id device, hwloc_cpuset_t set)
Get the CPU set of logical processors that are physically close to OpenCL device device.
Definition: opencl.h:64
static hwloc_obj_t hwloc_opencl_get_device_osdev(hwloc_topology_t topology, cl_device_id device)
Get the hwloc OS device object corresponding to OpenCL device device.
Definition: opencl.h:154
int hwloc_bitmap_iszero(hwloc_const_bitmap_t bitmap)
Test whether bitmap bitmap is empty.
int hwloc_topology_is_thissystem(hwloc_topology_t restrict topology)
Does the topology context come from this system?
unsigned short domain
Definition: hwloc.h:527
static hwloc_obj_t hwloc_get_next_osdev(hwloc_topology_t topology, hwloc_obj_t prev)
Get the next OS device in the system.
Definition: helper.h:1252
union hwloc_obj_attr_u * attr
Object type-specific Attributes, may be NULL if no attribute value was found.
Definition: hwloc.h:368
PCI device. These objects have neither CPU sets nor node sets. They are not added to the topology unl...
Definition: hwloc.h:241
void hwloc_bitmap_copy(hwloc_bitmap_t dst, hwloc_const_bitmap_t src)
Copy the contents of bitmap src into the already allocated bitmap dst.
unsigned char func
Definition: hwloc.h:528
struct hwloc_obj_attr_u::hwloc_pcidev_attr_s pcidev
unsigned char bus
Definition: hwloc.h:528
struct hwloc_obj * parent
Parent, NULL if root (system object)
Definition: hwloc.h:388
static hwloc_const_cpuset_t hwloc_topology_get_complete_cpuset(hwloc_topology_t topology)
Get complete CPU set.
Definition: helper.h:803
unsigned char dev
Definition: hwloc.h:528
Structure of a topology object.
Definition: hwloc.h:353
int hwloc_linux_parse_cpumap_file(FILE *file, hwloc_cpuset_t set)
Convert a linux kernel cpumap file file into hwloc CPU set.
char * name
Object-specific name if any. Mostly used for identifying OS devices and Misc objects where a name str...
Definition: hwloc.h:361
hwloc_obj_type_t type
Type of object.
Definition: hwloc.h:355
struct hwloc_obj_attr_u::hwloc_osdev_attr_s osdev
struct hwloc_topology * hwloc_topology_t
Topology context.
Definition: hwloc.h:617
Operating system co-processor device. For instance "mic0" for a Xeon Phi (MIC) on Linux...
Definition: hwloc.h:292
hwloc_bitmap_t hwloc_cpuset_t
A CPU set is a bitmap whose bits are set according to CPU physical OS indexes.
Definition: hwloc.h:133
hwloc_obj_osdev_type_t type
Definition: hwloc.h:551