Hardware Locality (hwloc) 2.9.0
cudart.h
1/*
2 * Copyright © 2010-2021 Inria. All rights reserved.
3 * Copyright © 2010-2011 Université Bordeaux
4 * Copyright © 2011 Cisco Systems, Inc. All rights reserved.
5 * See COPYING in top-level directory.
6 */
7
16#ifndef HWLOC_CUDART_H
17#define HWLOC_CUDART_H
18
19#include "hwloc.h"
20#include "hwloc/autogen/config.h"
21#include "hwloc/helper.h"
22#ifdef HWLOC_LINUX_SYS
23#include "hwloc/linux.h"
24#endif
25
26#include <cuda.h> /* for CUDA_VERSION */
27#include <cuda_runtime_api.h>
28
29
30#ifdef __cplusplus
31extern "C" {
32#endif
33
34
47static __hwloc_inline int
48hwloc_cudart_get_device_pci_ids(hwloc_topology_t topology __hwloc_attribute_unused,
49 int idx, int *domain, int *bus, int *dev)
50{
51 cudaError_t cerr;
52 struct cudaDeviceProp prop;
53
54 cerr = cudaGetDeviceProperties(&prop, idx);
55 if (cerr) {
56 errno = ENOSYS;
57 return -1;
58 }
59
60#if CUDA_VERSION >= 4000
61 *domain = prop.pciDomainID;
62#else
63 *domain = 0;
64#endif
65
66 *bus = prop.pciBusID;
67 *dev = prop.pciDeviceID;
68
69 return 0;
70}
71
88static __hwloc_inline int
89hwloc_cudart_get_device_cpuset(hwloc_topology_t topology __hwloc_attribute_unused,
90 int idx, hwloc_cpuset_t set)
91{
92#ifdef HWLOC_LINUX_SYS
93 /* If we're on Linux, use the sysfs mechanism to get the local cpus */
94#define HWLOC_CUDART_DEVICE_SYSFS_PATH_MAX 128
95 char path[HWLOC_CUDART_DEVICE_SYSFS_PATH_MAX];
96 int domain, bus, dev;
97
98 if (hwloc_cudart_get_device_pci_ids(topology, idx, &domain, &bus, &dev))
99 return -1;
100
101 if (!hwloc_topology_is_thissystem(topology)) {
102 errno = EINVAL;
103 return -1;
104 }
105
106 sprintf(path, "/sys/bus/pci/devices/%04x:%02x:%02x.0/local_cpus", (unsigned) domain, (unsigned) bus, (unsigned) dev);
107 if (hwloc_linux_read_path_as_cpumask(path, set) < 0
108 || hwloc_bitmap_iszero(set))
110#else
111 /* Non-Linux systems simply get a full cpuset */
113#endif
114 return 0;
115}
116
127static __hwloc_inline hwloc_obj_t
129{
130 int domain, bus, dev;
131
132 if (hwloc_cudart_get_device_pci_ids(topology, idx, &domain, &bus, &dev))
133 return NULL;
134
135 return hwloc_get_pcidev_by_busid(topology, domain, bus, dev, 0);
136}
137
155static __hwloc_inline hwloc_obj_t
157{
158 hwloc_obj_t osdev = NULL;
159 while ((osdev = hwloc_get_next_osdev(topology, osdev)) != NULL) {
161 && osdev->name
162 && !strncmp("cuda", osdev->name, 4)
163 && atoi(osdev->name + 4) == (int) idx)
164 return osdev;
165 }
166 return NULL;
167}
168
172#ifdef __cplusplus
173} /* extern "C" */
174#endif
175
176
177#endif /* HWLOC_CUDART_H */
hwloc_bitmap_t hwloc_cpuset_t
A CPU set is a bitmap whose bits are set according to CPU physical OS indexes.
Definition hwloc.h:140
@ HWLOC_OBJ_OSDEV_COPROC
Operating system co-processor device. For instance "opencl0d0" for an OpenCL device, ...
Definition hwloc.h:353
struct hwloc_topology * hwloc_topology_t
Topology context.
Definition hwloc.h:692
int hwloc_topology_is_thissystem(hwloc_topology_t restrict topology)
Does the topology context come from this system?
hwloc_const_cpuset_t hwloc_topology_get_complete_cpuset(hwloc_topology_t topology)
Get complete CPU set.
static hwloc_obj_t hwloc_get_next_osdev(hwloc_topology_t topology, hwloc_obj_t prev)
Get the next OS device in the system.
Definition helper.h:1191
static hwloc_obj_t hwloc_get_pcidev_by_busid(hwloc_topology_t topology, unsigned domain, unsigned bus, unsigned dev, unsigned func)
Find the PCI device object matching the PCI bus id given by its domain, bus, device and function numbers.
Definition helper.h:1154
int hwloc_bitmap_iszero(hwloc_const_bitmap_t bitmap)
Test whether the bitmap `bitmap` is empty.
int hwloc_bitmap_copy(hwloc_bitmap_t dst, hwloc_const_bitmap_t src)
Copy the contents of bitmap src into the already allocated bitmap dst.
int hwloc_linux_read_path_as_cpumask(const char *path, hwloc_bitmap_t set)
Convert a linux kernel cpumask file path into a hwloc bitmap set.
static int hwloc_cudart_get_device_cpuset(hwloc_topology_t topology, int idx, hwloc_cpuset_t set)
Get the CPU set of processors that are physically close to device idx.
Definition cudart.h:89
static hwloc_obj_t hwloc_cudart_get_device_osdev_by_index(hwloc_topology_t topology, unsigned idx)
Get the hwloc OS device object corresponding to the CUDA device whose index is idx.
Definition cudart.h:156
static int hwloc_cudart_get_device_pci_ids(hwloc_topology_t topology, int idx, int *domain, int *bus, int *dev)
Return the domain, bus and device IDs of the CUDA device whose index is idx.
Definition cudart.h:48
static hwloc_obj_t hwloc_cudart_get_device_pcidev(hwloc_topology_t topology, int idx)
Get the hwloc PCI device object corresponding to the CUDA device whose index is idx.
Definition cudart.h:128
Structure of a topology object.
Definition hwloc.h:396
char * name
Object-specific name if any. Mostly used for identifying OS devices and Misc objects where a name str...
Definition hwloc.h:408
union hwloc_obj_attr_u * attr
Object type-specific Attributes, may be NULL if no attribute value was found.
Definition hwloc.h:415
struct hwloc_obj_attr_u::hwloc_osdev_attr_s osdev
hwloc_obj_osdev_type_t type
Definition hwloc.h:666