2022-05-09 13:18:59 -07:00
|
|
|
/*******************************************************************************
|
2023-10-17 09:25:29 -07:00
|
|
|
Copyright (c) 2016-2023 NVIDIA Corporation
|
2022-05-09 13:18:59 -07:00
|
|
|
|
|
|
|
Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
|
|
of this software and associated documentation files (the "Software"), to
|
|
|
|
deal in the Software without restriction, including without limitation the
|
|
|
|
rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
|
|
|
|
sell copies of the Software, and to permit persons to whom the Software is
|
|
|
|
furnished to do so, subject to the following conditions:
|
|
|
|
|
|
|
|
The above copyright notice and this permission notice shall be
|
|
|
|
included in all copies or substantial portions of the Software.
|
|
|
|
|
|
|
|
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
|
|
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
|
|
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
|
|
|
|
THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
|
|
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
|
|
|
|
FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
|
|
|
|
DEALINGS IN THE SOFTWARE.
|
|
|
|
|
|
|
|
*******************************************************************************/
|
|
|
|
|
|
|
|
#ifndef __UVM_PROCESSORS_H__
|
|
|
|
#define __UVM_PROCESSORS_H__
|
|
|
|
|
|
|
|
#include "uvm_linux.h"
|
|
|
|
#include "uvm_common.h"
|
2023-10-17 09:25:29 -07:00
|
|
|
#include <linux/numa.h>
|
2022-05-09 13:18:59 -07:00
|
|
|
|
|
|
|
// Processor identifiers
|
|
|
|
// =====================
|
|
|
|
//
|
|
|
|
// UVM uses its own identifiers to refer to the processors in the system. For
|
|
|
|
// simplicity (and performance), integers are used. However, in order to
|
2024-01-24 17:51:53 +01:00
|
|
|
// provide type safety, they are wrapped within the uvm_parent_processor_id_t
|
|
|
|
// struct.
|
2022-05-09 13:18:59 -07:00
|
|
|
// The range of valid identifiers needs to cover the maximum number of
|
|
|
|
// supported GPUs on a system plus the CPU. CPU is assigned value 0, and GPUs
|
2023-10-17 09:25:29 -07:00
|
|
|
// range: [1, UVM_PARENT_ID_MAX_GPUS].
|
2022-05-09 13:18:59 -07:00
|
|
|
//
|
|
|
|
// There are some functions that only expect GPU identifiers and, in order to
|
2023-10-17 09:25:29 -07:00
|
|
|
// make it clearer, the uvm_parent_gpu_id_t alias type is provided. However, as
|
2024-01-24 17:51:53 +01:00
|
|
|
// this type is just a typedef of uvm_parent_processor_id_t, there is no type
|
|
|
|
// checking performed by the compiler.
|
2022-05-09 13:18:59 -07:00
|
|
|
//
|
|
|
|
// Identifier value vs index
|
|
|
|
// -------------------------
|
|
|
|
//
|
|
|
|
// Although we can rely on helpers for most of the operations related to
|
|
|
|
// processor ids, there are some scenarios in which we need to obtain their
|
|
|
|
// numerical value. Notably:
|
|
|
|
// - Logging
|
|
|
|
// - Array indexing
|
|
|
|
//
|
|
|
|
// Therefore, a helper is provided to obtain this value. However, there is a
|
|
|
|
// special case for array indexing, as there are some arrays that only contain
|
|
|
|
// entries for GPUs. In that case, the array cannot be directly indexed with
|
|
|
|
// the identifier's value. Instead, we use a helper that provides the index of
|
|
|
|
// the GPU within the GPU id space (basically id - 1).
|
|
|
|
//
|
|
|
|
// In the diagram below, MAX_SUB is used to abbreviate
|
2023-10-17 09:25:29 -07:00
|
|
|
// UVM_PARENT_ID_MAX_SUB_PROCESSORS.
|
2022-05-09 13:18:59 -07:00
|
|
|
//
|
2024-01-24 17:51:53 +01:00
|
|
|
// |-------------------------- uvm_parent_processor_id_t ---------------------------------------------|
|
|
|
|
// | |
|
|
|
|
// | |----------------------- uvm_parent_gpu_id_t -----------------------------------------------||
|
|
|
|
// | | ||
|
|
|
|
// Proc type | CPU | GPU | ... | GPU | ... GPU ||
|
|
|
|
// | | | | | ||
|
|
|
|
// ID values | 0 | 1 | ... | i+1 | ... UVM_PARENT_ID_MAX_PROCESSORS-1 ||
|
|
|
|
// | | | | | ||
|
|
|
|
// GPU index | | 0 | ... | i | ... UVM_PARENT_ID_MAX_GPUS-1 ||
|
|
|
|
// | | | | | ||
|
|
|
|
// + + + + + ++
|
|
|
|
// | | |-------------| | |-----------------------------| ||
|
|
|
|
// | | | | | ||
|
|
|
|
// GPU index | | 0 ... MAX_SUB-1 | ... | i*MAX_SUB ... (i+1)*MAX_SUB-1 | ... UVM_ID_MAX_GPUS-1 ||
|
|
|
|
// | | | | | ||
|
|
|
|
// ID values | 0 | 1 ... MAX_SUB | ... | (i*MAX_SUB)+1 ... (i+1)*MAX_SUB | ... UVM_ID_MAX_PROCESSORS-1 ||
|
|
|
|
// | | | | | ||
|
|
|
|
// Proc type | CPU | GPU ... GPU | ... | GPU ... GPU | ... GPU ||
|
|
|
|
// | | ||
|
|
|
|
// | |-------------------------------------- uvm_gpu_id_t ---------------------------------------||
|
|
|
|
// | |
|
|
|
|
// |----------------------------------------- uvm_processor_id_t -------------------------------------|
|
2022-05-09 13:18:59 -07:00
|
|
|
//
|
|
|
|
// When SMC is enabled, each GPU partition gets its own uvm_gpu_t object.
|
|
|
|
|
|
|
|
#define UVM_PROCESSOR_MASK(mask_t, \
|
|
|
|
prefix_fn_mask, \
|
|
|
|
maxval, \
|
|
|
|
proc_id_t, \
|
|
|
|
proc_id_ctor) \
|
|
|
|
\
|
|
|
|
typedef struct \
|
|
|
|
{ \
|
|
|
|
DECLARE_BITMAP(bitmap, maxval); \
|
|
|
|
} mask_t; \
|
|
|
|
\
|
|
|
|
static bool prefix_fn_mask##_test(const mask_t *mask, proc_id_t id) \
|
|
|
|
{ \
|
|
|
|
UVM_ASSERT_MSG(id.val < (maxval), "id %u\n", id.val); \
|
|
|
|
\
|
|
|
|
return test_bit(id.val, mask->bitmap); \
|
|
|
|
} \
|
|
|
|
\
|
|
|
|
static void prefix_fn_mask##_set_atomic(mask_t *mask, proc_id_t id) \
|
|
|
|
{ \
|
|
|
|
UVM_ASSERT_MSG(id.val < (maxval), "id %u\n", id.val); \
|
|
|
|
\
|
|
|
|
set_bit(id.val, mask->bitmap); \
|
|
|
|
} \
|
|
|
|
\
|
|
|
|
static void prefix_fn_mask##_set(mask_t *mask, proc_id_t id) \
|
|
|
|
{ \
|
|
|
|
UVM_ASSERT_MSG(id.val < (maxval), "id %u\n", id.val); \
|
|
|
|
\
|
|
|
|
__set_bit(id.val, mask->bitmap); \
|
|
|
|
} \
|
|
|
|
\
|
|
|
|
static void prefix_fn_mask##_clear_atomic(mask_t *mask, proc_id_t id) \
|
|
|
|
{ \
|
|
|
|
UVM_ASSERT_MSG(id.val < (maxval), "id %u\n", id.val); \
|
|
|
|
\
|
|
|
|
clear_bit(id.val, mask->bitmap); \
|
|
|
|
} \
|
|
|
|
\
|
|
|
|
static void prefix_fn_mask##_clear(mask_t *mask, proc_id_t id) \
|
|
|
|
{ \
|
|
|
|
UVM_ASSERT_MSG(id.val < (maxval), "id %u\n", id.val); \
|
|
|
|
\
|
|
|
|
__clear_bit(id.val, mask->bitmap); \
|
|
|
|
} \
|
|
|
|
\
|
|
|
|
static bool prefix_fn_mask##_test_and_set_atomic(mask_t *mask, proc_id_t id) \
|
|
|
|
{ \
|
|
|
|
UVM_ASSERT_MSG(id.val < (maxval), "id %u\n", id.val); \
|
|
|
|
\
|
|
|
|
return test_and_set_bit(id.val, mask->bitmap); \
|
|
|
|
} \
|
|
|
|
\
|
|
|
|
static bool prefix_fn_mask##_test_and_set(mask_t *mask, proc_id_t id) \
|
|
|
|
{ \
|
|
|
|
UVM_ASSERT_MSG(id.val < (maxval), "id %u\n", id.val); \
|
|
|
|
\
|
|
|
|
return __test_and_set_bit(id.val, mask->bitmap); \
|
|
|
|
} \
|
|
|
|
\
|
|
|
|
static bool prefix_fn_mask##_test_and_clear_atomic(mask_t *mask, proc_id_t id) \
|
|
|
|
{ \
|
|
|
|
UVM_ASSERT_MSG(id.val < (maxval), "id %u\n", id.val); \
|
|
|
|
\
|
|
|
|
return test_and_clear_bit(id.val, mask->bitmap); \
|
|
|
|
} \
|
|
|
|
\
|
|
|
|
static bool prefix_fn_mask##_test_and_clear(mask_t *mask, proc_id_t id) \
|
|
|
|
{ \
|
|
|
|
UVM_ASSERT_MSG(id.val < (maxval), "id %u\n", id.val); \
|
|
|
|
\
|
|
|
|
return __test_and_clear_bit(id.val, mask->bitmap); \
|
|
|
|
} \
|
|
|
|
\
|
|
|
|
static void prefix_fn_mask##_zero(mask_t *mask) \
|
|
|
|
{ \
|
|
|
|
bitmap_zero(mask->bitmap, (maxval)); \
|
|
|
|
} \
|
|
|
|
\
|
|
|
|
static bool prefix_fn_mask##_empty(const mask_t *mask) \
|
|
|
|
{ \
|
|
|
|
return bitmap_empty(mask->bitmap, (maxval)); \
|
|
|
|
} \
|
|
|
|
\
|
|
|
|
static void prefix_fn_mask##_copy(mask_t *dst, const mask_t *src) \
|
|
|
|
{ \
|
|
|
|
bitmap_copy(dst->bitmap, src->bitmap, (maxval)); \
|
|
|
|
} \
|
|
|
|
\
|
|
|
|
static bool prefix_fn_mask##_and(mask_t *dst, const mask_t *src1, const mask_t *src2) \
|
|
|
|
{ \
|
|
|
|
return bitmap_and(dst->bitmap, src1->bitmap, src2->bitmap, (maxval)) != 0; \
|
|
|
|
} \
|
|
|
|
\
|
|
|
|
static void prefix_fn_mask##_or(mask_t *dst, const mask_t *src1, const mask_t *src2) \
|
|
|
|
{ \
|
|
|
|
bitmap_or(dst->bitmap, src1->bitmap, src2->bitmap, (maxval)); \
|
|
|
|
} \
|
|
|
|
\
|
|
|
|
static bool prefix_fn_mask##_andnot(mask_t *dst, const mask_t *src1, const mask_t *src2) \
|
|
|
|
{ \
|
|
|
|
return bitmap_andnot(dst->bitmap, src1->bitmap, src2->bitmap, (maxval)); \
|
|
|
|
} \
|
|
|
|
\
|
|
|
|
static void prefix_fn_mask##_xor(mask_t *dst, const mask_t *src1, const mask_t *src2) \
|
|
|
|
{ \
|
|
|
|
bitmap_xor(dst->bitmap, src1->bitmap, src2->bitmap, (maxval)); \
|
|
|
|
} \
|
|
|
|
\
|
|
|
|
static proc_id_t prefix_fn_mask##_find_first_id(const mask_t *mask) \
|
|
|
|
{ \
|
|
|
|
return proc_id_ctor(find_first_bit(mask->bitmap, (maxval))); \
|
|
|
|
} \
|
|
|
|
\
|
|
|
|
static proc_id_t prefix_fn_mask##_find_first_gpu_id(const mask_t *mask) \
|
|
|
|
{ \
|
2023-10-17 09:25:29 -07:00
|
|
|
return proc_id_ctor(find_next_bit(mask->bitmap, (maxval), UVM_PARENT_ID_GPU0_VALUE)); \
|
2022-05-09 13:18:59 -07:00
|
|
|
} \
|
|
|
|
\
|
|
|
|
static proc_id_t prefix_fn_mask##_find_next_id(const mask_t *mask, proc_id_t min_id) \
|
|
|
|
{ \
|
|
|
|
return proc_id_ctor(find_next_bit(mask->bitmap, (maxval), min_id.val)); \
|
|
|
|
} \
|
|
|
|
\
|
|
|
|
static proc_id_t prefix_fn_mask##_find_next_gpu_id(const mask_t *mask, proc_id_t min_gpu_id) \
|
|
|
|
{ \
|
|
|
|
return proc_id_ctor(find_next_bit(mask->bitmap, (maxval), min_gpu_id.val)); \
|
|
|
|
} \
|
|
|
|
\
|
|
|
|
static proc_id_t prefix_fn_mask##_find_first_unset_id(const mask_t *mask) \
|
|
|
|
{ \
|
|
|
|
return proc_id_ctor(find_first_zero_bit(mask->bitmap, (maxval))); \
|
|
|
|
} \
|
|
|
|
\
|
2024-01-24 17:51:53 +01:00
|
|
|
static proc_id_t prefix_fn_mask##_find_next_unset_id(const mask_t *mask, proc_id_t min_id) \
|
2022-05-09 13:18:59 -07:00
|
|
|
{ \
|
|
|
|
return proc_id_ctor(find_next_zero_bit(mask->bitmap, (maxval), min_id.val)); \
|
|
|
|
} \
|
|
|
|
\
|
|
|
|
static bool prefix_fn_mask##_equal(const mask_t *mask_in1, const mask_t *mask_in2) \
|
|
|
|
{ \
|
|
|
|
return bitmap_equal(mask_in1->bitmap, mask_in2->bitmap, (maxval)) != 0; \
|
|
|
|
} \
|
|
|
|
\
|
|
|
|
static bool prefix_fn_mask##_subset(const mask_t *subset, const mask_t *mask) \
|
|
|
|
{ \
|
|
|
|
return bitmap_subset(subset->bitmap, mask->bitmap, (maxval)) != 0; \
|
|
|
|
} \
|
|
|
|
\
|
|
|
|
static NvU32 prefix_fn_mask##_get_count(const mask_t *mask) \
|
|
|
|
{ \
|
|
|
|
return bitmap_weight(mask->bitmap, (maxval)); \
|
|
|
|
} \
|
|
|
|
\
|
|
|
|
static NvU32 prefix_fn_mask##_get_gpu_count(const mask_t *mask) \
|
|
|
|
{ \
|
|
|
|
NvU32 gpu_count = prefix_fn_mask##_get_count(mask); \
|
|
|
|
\
|
2023-10-17 09:25:29 -07:00
|
|
|
if (prefix_fn_mask##_test(mask, proc_id_ctor(UVM_PARENT_ID_CPU_VALUE))) \
|
2022-05-09 13:18:59 -07:00
|
|
|
--gpu_count; \
|
|
|
|
\
|
|
|
|
return gpu_count; \
|
|
|
|
}
|
|
|
|
|
|
|
|
typedef struct
|
|
|
|
{
|
|
|
|
NvU32 val;
|
2023-10-17 09:25:29 -07:00
|
|
|
} uvm_parent_processor_id_t;
|
2022-05-09 13:18:59 -07:00
|
|
|
|
|
|
|
typedef struct
|
|
|
|
{
|
|
|
|
NvU32 val;
|
2024-01-24 17:51:53 +01:00
|
|
|
} uvm_processor_id_t;
|
2022-05-09 13:18:59 -07:00
|
|
|
|
2023-10-17 09:25:29 -07:00
|
|
|
typedef uvm_parent_processor_id_t uvm_parent_gpu_id_t;
|
2024-01-24 17:51:53 +01:00
|
|
|
typedef uvm_processor_id_t uvm_gpu_id_t;
|
2022-05-09 13:18:59 -07:00
|
|
|
|
|
|
|
// Static value assigned to the CPU
|
2023-10-17 09:25:29 -07:00
|
|
|
#define UVM_PARENT_ID_CPU_VALUE 0
|
|
|
|
#define UVM_PARENT_ID_GPU0_VALUE (UVM_PARENT_ID_CPU_VALUE + 1)
|
2022-05-09 13:18:59 -07:00
|
|
|
|
|
|
|
// ID values for the CPU and first GPU, respectively; the values for both types
|
|
|
|
// of IDs must match to enable sharing of UVM_PROCESSOR_MASK().
|
2024-01-24 17:51:53 +01:00
|
|
|
#define UVM_ID_CPU_VALUE UVM_PARENT_ID_CPU_VALUE
|
|
|
|
#define UVM_ID_GPU0_VALUE UVM_PARENT_ID_GPU0_VALUE
|
2022-05-09 13:18:59 -07:00
|
|
|
|
|
|
|
// Maximum number of GPUs/processors that can be represented with the id types
|
2024-01-24 17:51:53 +01:00
|
|
|
#define UVM_PARENT_ID_MAX_GPUS NV_MAX_DEVICES
|
|
|
|
#define UVM_PARENT_ID_MAX_PROCESSORS (UVM_PARENT_ID_MAX_GPUS + 1)
|
2022-05-09 13:18:59 -07:00
|
|
|
|
2023-10-17 09:25:29 -07:00
|
|
|
#define UVM_PARENT_ID_MAX_SUB_PROCESSORS 8
|
2022-05-09 13:18:59 -07:00
|
|
|
|
2024-01-24 17:51:53 +01:00
|
|
|
#define UVM_ID_MAX_GPUS (UVM_PARENT_ID_MAX_GPUS * UVM_PARENT_ID_MAX_SUB_PROCESSORS)
|
|
|
|
#define UVM_ID_MAX_PROCESSORS (UVM_ID_MAX_GPUS + 1)
|
|
|
|
#define UVM_MAX_UNIQUE_GPU_PAIRS SUM_FROM_0_TO_N(UVM_ID_MAX_GPUS - 1)
|
2022-05-09 13:18:59 -07:00
|
|
|
|
2023-10-17 09:25:29 -07:00
|
|
|
#define UVM_PARENT_ID_CPU ((uvm_parent_processor_id_t) { .val = UVM_PARENT_ID_CPU_VALUE })
|
|
|
|
#define UVM_PARENT_ID_INVALID ((uvm_parent_processor_id_t) { .val = UVM_PARENT_ID_MAX_PROCESSORS })
|
2024-01-24 17:51:53 +01:00
|
|
|
#define UVM_ID_CPU ((uvm_processor_id_t) { .val = UVM_ID_CPU_VALUE })
|
|
|
|
#define UVM_ID_INVALID ((uvm_processor_id_t) { .val = UVM_ID_MAX_PROCESSORS })
|
2022-05-09 13:18:59 -07:00
|
|
|
|
2023-10-17 09:25:29 -07:00
|
|
|
#define UVM_PARENT_ID_CHECK_BOUNDS(id) UVM_ASSERT_MSG(id.val <= UVM_PARENT_ID_MAX_PROCESSORS, "id %u\n", id.val)
|
2022-05-09 13:18:59 -07:00
|
|
|
|
2024-01-24 17:51:53 +01:00
|
|
|
#define UVM_ID_CHECK_BOUNDS(id) UVM_ASSERT_MSG(id.val <= UVM_ID_MAX_PROCESSORS, "id %u\n", id.val)
|
2022-05-09 13:18:59 -07:00
|
|
|
|
2023-10-17 09:25:29 -07:00
|
|
|
static int uvm_parent_id_cmp(uvm_parent_processor_id_t id1, uvm_parent_processor_id_t id2)
|
2022-05-09 13:18:59 -07:00
|
|
|
{
|
2023-10-17 09:25:29 -07:00
|
|
|
UVM_PARENT_ID_CHECK_BOUNDS(id1);
|
|
|
|
UVM_PARENT_ID_CHECK_BOUNDS(id2);
|
2022-05-09 13:18:59 -07:00
|
|
|
|
|
|
|
return UVM_CMP_DEFAULT(id1.val, id2.val);
|
|
|
|
}
|
|
|
|
|
2023-10-17 09:25:29 -07:00
|
|
|
static bool uvm_parent_id_equal(uvm_parent_processor_id_t id1, uvm_parent_processor_id_t id2)
|
2022-05-09 13:18:59 -07:00
|
|
|
{
|
2023-10-17 09:25:29 -07:00
|
|
|
UVM_PARENT_ID_CHECK_BOUNDS(id1);
|
|
|
|
UVM_PARENT_ID_CHECK_BOUNDS(id2);
|
2022-05-09 13:18:59 -07:00
|
|
|
|
|
|
|
return id1.val == id2.val;
|
|
|
|
}
|
|
|
|
|
2024-01-24 17:51:53 +01:00
|
|
|
static int uvm_id_cmp(uvm_processor_id_t id1, uvm_processor_id_t id2)
|
2023-02-28 11:12:44 -08:00
|
|
|
{
|
2024-01-24 17:51:53 +01:00
|
|
|
UVM_ID_CHECK_BOUNDS(id1);
|
|
|
|
UVM_ID_CHECK_BOUNDS(id2);
|
2023-02-28 11:12:44 -08:00
|
|
|
|
|
|
|
return UVM_CMP_DEFAULT(id1.val, id2.val);
|
|
|
|
}
|
|
|
|
|
2024-01-24 17:51:53 +01:00
|
|
|
static bool uvm_id_equal(uvm_processor_id_t id1, uvm_processor_id_t id2)
|
2022-05-09 13:18:59 -07:00
|
|
|
{
|
2024-01-24 17:51:53 +01:00
|
|
|
UVM_ID_CHECK_BOUNDS(id1);
|
|
|
|
UVM_ID_CHECK_BOUNDS(id2);
|
2022-05-09 13:18:59 -07:00
|
|
|
|
|
|
|
return id1.val == id2.val;
|
|
|
|
}
|
|
|
|
|
2023-10-17 09:25:29 -07:00
|
|
|
#define UVM_PARENT_ID_IS_CPU(id) uvm_parent_id_equal(id, UVM_PARENT_ID_CPU)
|
|
|
|
#define UVM_PARENT_ID_IS_INVALID(id) uvm_parent_id_equal(id, UVM_PARENT_ID_INVALID)
|
|
|
|
#define UVM_PARENT_ID_IS_VALID(id) (!UVM_PARENT_ID_IS_INVALID(id))
|
|
|
|
#define UVM_PARENT_ID_IS_GPU(id) (!UVM_PARENT_ID_IS_CPU(id) && !UVM_PARENT_ID_IS_INVALID(id))
|
2022-05-09 13:18:59 -07:00
|
|
|
|
2024-01-24 17:51:53 +01:00
|
|
|
#define UVM_ID_IS_CPU(id) uvm_id_equal(id, UVM_ID_CPU)
|
|
|
|
#define UVM_ID_IS_INVALID(id) uvm_id_equal(id, UVM_ID_INVALID)
|
|
|
|
#define UVM_ID_IS_VALID(id) (!UVM_ID_IS_INVALID(id))
|
|
|
|
#define UVM_ID_IS_GPU(id) (!UVM_ID_IS_CPU(id) && !UVM_ID_IS_INVALID(id))
|
2022-05-09 13:18:59 -07:00
|
|
|
|
2023-10-17 09:25:29 -07:00
|
|
|
static uvm_parent_processor_id_t uvm_parent_id_from_value(NvU32 val)
|
2022-05-09 13:18:59 -07:00
|
|
|
{
|
2023-10-17 09:25:29 -07:00
|
|
|
uvm_parent_processor_id_t ret = { .val = val };
|
2022-05-09 13:18:59 -07:00
|
|
|
|
2023-10-17 09:25:29 -07:00
|
|
|
UVM_PARENT_ID_CHECK_BOUNDS(ret);
|
2022-05-09 13:18:59 -07:00
|
|
|
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
2023-10-17 09:25:29 -07:00
|
|
|
static uvm_parent_gpu_id_t uvm_parent_gpu_id_from_value(NvU32 val)
|
2022-05-09 13:18:59 -07:00
|
|
|
{
|
2023-10-17 09:25:29 -07:00
|
|
|
uvm_parent_gpu_id_t ret = uvm_parent_id_from_value(val);
|
2022-05-09 13:18:59 -07:00
|
|
|
|
2023-10-17 09:25:29 -07:00
|
|
|
UVM_ASSERT(!UVM_PARENT_ID_IS_CPU(ret));
|
2022-05-09 13:18:59 -07:00
|
|
|
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
2024-01-24 17:51:53 +01:00
|
|
|
static uvm_processor_id_t uvm_id_from_value(NvU32 val)
|
2022-05-09 13:18:59 -07:00
|
|
|
{
|
2024-01-24 17:51:53 +01:00
|
|
|
uvm_processor_id_t ret = { .val = val };
|
2022-05-09 13:18:59 -07:00
|
|
|
|
2024-01-24 17:51:53 +01:00
|
|
|
UVM_ID_CHECK_BOUNDS(ret);
|
2022-05-09 13:18:59 -07:00
|
|
|
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
2024-01-24 17:51:53 +01:00
|
|
|
static uvm_gpu_id_t uvm_gpu_id_from_value(NvU32 val)
|
2022-05-09 13:18:59 -07:00
|
|
|
{
|
2024-01-24 17:51:53 +01:00
|
|
|
uvm_gpu_id_t ret = uvm_id_from_value(val);
|
2022-05-09 13:18:59 -07:00
|
|
|
|
2024-01-24 17:51:53 +01:00
|
|
|
UVM_ASSERT(!UVM_ID_IS_CPU(ret));
|
2022-05-09 13:18:59 -07:00
|
|
|
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
2023-10-17 09:25:29 -07:00
|
|
|
// Create a parent GPU id from the given parent GPU id index (previously
|
|
|
|
// obtained via uvm_parent_id_gpu_index)
|
|
|
|
static uvm_parent_gpu_id_t uvm_parent_gpu_id_from_index(NvU32 index)
|
2022-05-09 13:18:59 -07:00
|
|
|
{
|
2023-10-17 09:25:29 -07:00
|
|
|
return uvm_parent_gpu_id_from_value(index + UVM_PARENT_ID_GPU0_VALUE);
|
2022-05-09 13:18:59 -07:00
|
|
|
}
|
|
|
|
|
2023-10-17 09:25:29 -07:00
|
|
|
static uvm_parent_processor_id_t uvm_parent_id_next(uvm_parent_processor_id_t id)
|
2022-05-09 13:18:59 -07:00
|
|
|
{
|
|
|
|
++id.val;
|
|
|
|
|
2023-10-17 09:25:29 -07:00
|
|
|
UVM_PARENT_ID_CHECK_BOUNDS(id);
|
2022-05-09 13:18:59 -07:00
|
|
|
|
|
|
|
return id;
|
|
|
|
}
|
|
|
|
|
2023-10-17 09:25:29 -07:00
|
|
|
static uvm_parent_gpu_id_t uvm_parent_gpu_id_next(uvm_parent_gpu_id_t id)
|
2022-05-09 13:18:59 -07:00
|
|
|
{
|
2023-10-17 09:25:29 -07:00
|
|
|
UVM_ASSERT(UVM_PARENT_ID_IS_GPU(id));
|
2022-05-09 13:18:59 -07:00
|
|
|
|
|
|
|
++id.val;
|
|
|
|
|
2023-10-17 09:25:29 -07:00
|
|
|
UVM_PARENT_ID_CHECK_BOUNDS(id);
|
2022-05-09 13:18:59 -07:00
|
|
|
|
|
|
|
return id;
|
|
|
|
}
|
|
|
|
|
2024-01-24 17:51:53 +01:00
|
|
|
// Same as uvm_parent_gpu_id_from_index but for uvm_processor_id_t
|
|
|
|
static uvm_gpu_id_t uvm_gpu_id_from_index(NvU32 index)
|
2022-05-09 13:18:59 -07:00
|
|
|
{
|
2024-01-24 17:51:53 +01:00
|
|
|
return uvm_gpu_id_from_value(index + UVM_ID_GPU0_VALUE);
|
2022-05-09 13:18:59 -07:00
|
|
|
}
|
|
|
|
|
2024-01-24 17:51:53 +01:00
|
|
|
static uvm_processor_id_t uvm_id_next(uvm_processor_id_t id)
|
2022-05-09 13:18:59 -07:00
|
|
|
{
|
|
|
|
++id.val;
|
|
|
|
|
2024-01-24 17:51:53 +01:00
|
|
|
UVM_ID_CHECK_BOUNDS(id);
|
2022-05-09 13:18:59 -07:00
|
|
|
|
|
|
|
return id;
|
|
|
|
}
|
|
|
|
|
2024-01-24 17:51:53 +01:00
|
|
|
static uvm_gpu_id_t uvm_gpu_id_next(uvm_gpu_id_t id)
|
2022-05-09 13:18:59 -07:00
|
|
|
{
|
2024-01-24 17:51:53 +01:00
|
|
|
UVM_ASSERT(UVM_ID_IS_GPU(id));
|
2022-05-09 13:18:59 -07:00
|
|
|
|
|
|
|
++id.val;
|
|
|
|
|
2024-01-24 17:51:53 +01:00
|
|
|
UVM_ID_CHECK_BOUNDS(id);
|
2022-05-09 13:18:59 -07:00
|
|
|
|
|
|
|
return id;
|
|
|
|
}
|
|
|
|
|
2023-10-17 09:25:29 -07:00
|
|
|
// This function returns the numerical value within
|
|
|
|
// [0, UVM_PARENT_ID_MAX_PROCESSORS) of the given parent processor id.
|
|
|
|
static NvU32 uvm_parent_id_value(uvm_parent_processor_id_t id)
|
2022-05-09 13:18:59 -07:00
|
|
|
{
|
2023-10-17 09:25:29 -07:00
|
|
|
UVM_ASSERT(UVM_PARENT_ID_IS_VALID(id));
|
2022-05-09 13:18:59 -07:00
|
|
|
|
|
|
|
return id.val;
|
|
|
|
}
|
|
|
|
|
|
|
|
// This function returns the numerical value within
|
2024-01-24 17:51:53 +01:00
|
|
|
// [0, UVM_ID_MAX_PROCESSORS) of the given processor id
|
|
|
|
static NvU32 uvm_id_value(uvm_processor_id_t id)
|
2022-05-09 13:18:59 -07:00
|
|
|
{
|
2024-01-24 17:51:53 +01:00
|
|
|
UVM_ASSERT(UVM_ID_IS_VALID(id));
|
2022-05-09 13:18:59 -07:00
|
|
|
|
|
|
|
return id.val;
|
|
|
|
}
|
|
|
|
|
|
|
|
// This function returns the index of the given GPU id within the GPU id space
|
2023-10-17 09:25:29 -07:00
|
|
|
// [0, UVM_PARENT_ID_MAX_GPUS)
|
|
|
|
static NvU32 uvm_parent_id_gpu_index(uvm_parent_gpu_id_t id)
|
2022-05-09 13:18:59 -07:00
|
|
|
{
|
2023-10-17 09:25:29 -07:00
|
|
|
UVM_ASSERT(UVM_PARENT_ID_IS_GPU(id));
|
2022-05-09 13:18:59 -07:00
|
|
|
|
2023-10-17 09:25:29 -07:00
|
|
|
return id.val - UVM_PARENT_ID_GPU0_VALUE;
|
2022-05-09 13:18:59 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
// This function returns the index of the given GPU id within the GPU id space
|
2024-01-24 17:51:53 +01:00
|
|
|
// [0, UVM_ID_MAX_GPUS)
|
|
|
|
static NvU32 uvm_id_gpu_index(const uvm_gpu_id_t id)
|
2022-05-09 13:18:59 -07:00
|
|
|
{
|
2024-01-24 17:51:53 +01:00
|
|
|
UVM_ASSERT(UVM_ID_IS_GPU(id));
|
2022-05-09 13:18:59 -07:00
|
|
|
|
2024-01-24 17:51:53 +01:00
|
|
|
return id.val - UVM_ID_GPU0_VALUE;
|
2022-05-09 13:18:59 -07:00
|
|
|
}
|
|
|
|
|
2024-01-24 17:51:53 +01:00
|
|
|
static NvU32 uvm_id_gpu_index_from_parent_gpu_id(const uvm_parent_gpu_id_t id)
|
2022-05-09 13:18:59 -07:00
|
|
|
{
|
2023-10-17 09:25:29 -07:00
|
|
|
UVM_ASSERT(UVM_PARENT_ID_IS_GPU(id));
|
2022-05-09 13:18:59 -07:00
|
|
|
|
2023-10-17 09:25:29 -07:00
|
|
|
return uvm_parent_id_gpu_index(id) * UVM_PARENT_ID_MAX_SUB_PROCESSORS;
|
2022-05-09 13:18:59 -07:00
|
|
|
}
|
|
|
|
|
2024-01-24 17:51:53 +01:00
|
|
|
// This function returns the numerical value of the parent processor ID from the
|
|
|
|
// given processor id.
|
|
|
|
static NvU32 uvm_parent_id_value_from_processor_id(const uvm_processor_id_t id)
|
2022-05-09 13:18:59 -07:00
|
|
|
{
|
2024-01-24 17:51:53 +01:00
|
|
|
if (UVM_ID_IS_CPU(id))
|
|
|
|
return UVM_PARENT_ID_CPU_VALUE;
|
2022-05-09 13:18:59 -07:00
|
|
|
|
2024-01-24 17:51:53 +01:00
|
|
|
return (uvm_id_gpu_index(id) / UVM_PARENT_ID_MAX_SUB_PROCESSORS) + UVM_PARENT_ID_GPU0_VALUE;
|
2022-05-09 13:18:59 -07:00
|
|
|
}
|
|
|
|
|
2024-01-24 17:51:53 +01:00
|
|
|
static NvU32 uvm_parent_id_gpu_index_from_gpu_id(const uvm_gpu_id_t id)
|
2022-05-09 13:18:59 -07:00
|
|
|
{
|
2024-01-24 17:51:53 +01:00
|
|
|
UVM_ASSERT(UVM_ID_IS_GPU(id));
|
2022-05-09 13:18:59 -07:00
|
|
|
|
2024-01-24 17:51:53 +01:00
|
|
|
return uvm_id_gpu_index(id) / UVM_PARENT_ID_MAX_SUB_PROCESSORS;
|
2022-05-09 13:18:59 -07:00
|
|
|
}
|
|
|
|
|
2024-01-24 17:51:53 +01:00
|
|
|
static uvm_gpu_id_t uvm_gpu_id_from_parent_gpu_id(const uvm_parent_gpu_id_t id)
|
2022-05-09 13:18:59 -07:00
|
|
|
{
|
2024-01-24 17:51:53 +01:00
|
|
|
UVM_ASSERT(UVM_PARENT_ID_IS_GPU(id));
|
2022-05-09 13:18:59 -07:00
|
|
|
|
2024-01-24 17:51:53 +01:00
|
|
|
return uvm_gpu_id_from_index(uvm_id_gpu_index_from_parent_gpu_id(id));
|
2022-05-09 13:18:59 -07:00
|
|
|
}
|
|
|
|
|
2024-01-24 17:51:53 +01:00
|
|
|
static uvm_gpu_id_t uvm_gpu_id_from_sub_processor_index(NvU32 index, NvU32 sub_index)
|
2022-05-09 13:18:59 -07:00
|
|
|
{
|
2024-01-24 17:51:53 +01:00
|
|
|
UVM_ASSERT(index < UVM_PARENT_ID_MAX_GPUS);
|
2023-10-17 09:25:29 -07:00
|
|
|
UVM_ASSERT(sub_index < UVM_PARENT_ID_MAX_SUB_PROCESSORS);
|
2022-05-09 13:18:59 -07:00
|
|
|
|
2024-01-24 17:51:53 +01:00
|
|
|
return uvm_gpu_id_from_index(index * UVM_PARENT_ID_MAX_SUB_PROCESSORS + sub_index);
|
2022-05-09 13:18:59 -07:00
|
|
|
}
|
|
|
|
|
2024-01-24 17:51:53 +01:00
|
|
|
static uvm_parent_gpu_id_t uvm_parent_gpu_id_from_gpu_id(const uvm_gpu_id_t id)
|
2022-05-09 13:18:59 -07:00
|
|
|
{
|
2024-01-24 17:51:53 +01:00
|
|
|
UVM_ASSERT(UVM_ID_IS_GPU(id));
|
2022-05-09 13:18:59 -07:00
|
|
|
|
2024-01-24 17:51:53 +01:00
|
|
|
return uvm_parent_gpu_id_from_index(uvm_parent_id_gpu_index_from_gpu_id(id));
|
2022-05-09 13:18:59 -07:00
|
|
|
}
|
|
|
|
|
2024-01-24 17:51:53 +01:00
|
|
|
static NvU32 uvm_id_sub_processor_index(const uvm_gpu_id_t id)
|
2022-05-09 13:18:59 -07:00
|
|
|
{
|
2024-01-24 17:51:53 +01:00
|
|
|
return uvm_id_gpu_index(id) % UVM_PARENT_ID_MAX_SUB_PROCESSORS;
|
2022-05-09 13:18:59 -07:00
|
|
|
}
|
|
|
|
|
2024-01-24 17:51:53 +01:00
|
|
|
UVM_PROCESSOR_MASK(uvm_parent_processor_mask_t, \
|
|
|
|
uvm_parent_processor_mask, \
|
2023-10-17 09:25:29 -07:00
|
|
|
UVM_PARENT_ID_MAX_PROCESSORS, \
|
|
|
|
uvm_parent_processor_id_t, \
|
|
|
|
uvm_parent_id_from_value)
|
2022-05-09 13:18:59 -07:00
|
|
|
|
2024-01-24 17:51:53 +01:00
|
|
|
UVM_PROCESSOR_MASK(uvm_processor_mask_t, \
|
|
|
|
uvm_processor_mask, \
|
|
|
|
UVM_ID_MAX_PROCESSORS, \
|
|
|
|
uvm_processor_id_t, \
|
|
|
|
uvm_id_from_value)
|
|
|
|
|
2024-02-23 16:37:56 +01:00
|
|
|
extern const uvm_processor_mask_t g_uvm_processor_mask_cpu;
|
|
|
|
extern const uvm_processor_mask_t g_uvm_processor_mask_empty;
|
|
|
|
|
2024-01-24 17:51:53 +01:00
|
|
|
// Like uvm_processor_mask_subset() but ignores the CPU in the subset mask.
|
|
|
|
// Returns whether the GPUs in subset are a subset of the GPUs in mask.
|
|
|
|
bool uvm_processor_mask_gpu_subset(const uvm_processor_mask_t *subset,
|
|
|
|
const uvm_processor_mask_t *mask);
|
|
|
|
|
|
|
|
// Compress a uvm_processor_mask_t down to a uvm_parent_processor_mask_t
|
|
|
|
// by only copying the first subprocessor bit and ignoring the CPU bit.
|
|
|
|
void uvm_parent_gpus_from_processor_mask(uvm_parent_processor_mask_t *parent_mask,
|
|
|
|
const uvm_processor_mask_t *mask);
|
|
|
|
|
|
|
|
#define for_each_parent_id_in_mask(id, mask) \
|
|
|
|
for ((id) = uvm_parent_processor_mask_find_first_id(mask); \
|
2023-10-17 09:25:29 -07:00
|
|
|
UVM_PARENT_ID_IS_VALID(id); \
|
2024-01-24 17:51:53 +01:00
|
|
|
(id) = uvm_parent_processor_mask_find_next_id((mask), uvm_parent_id_next(id)))
|
2022-05-09 13:18:59 -07:00
|
|
|
|
2024-01-24 17:51:53 +01:00
|
|
|
#define for_each_parent_gpu_id_in_mask(gpu_id, mask) \
|
|
|
|
for ((gpu_id) = uvm_parent_processor_mask_find_first_gpu_id((mask)); \
|
2023-10-17 09:25:29 -07:00
|
|
|
UVM_PARENT_ID_IS_VALID(gpu_id); \
|
2024-01-24 17:51:53 +01:00
|
|
|
(gpu_id) = uvm_parent_processor_mask_find_next_id((mask), uvm_parent_gpu_id_next(gpu_id)))
|
2022-05-09 13:18:59 -07:00
|
|
|
|
2024-01-24 17:51:53 +01:00
|
|
|
#define for_each_id_in_mask(id, mask) \
|
|
|
|
for ((id) = uvm_processor_mask_find_first_id(mask); \
|
|
|
|
UVM_ID_IS_VALID(id); \
|
|
|
|
(id) = uvm_processor_mask_find_next_id((mask), uvm_id_next(id)))
|
2022-05-09 13:18:59 -07:00
|
|
|
|
2024-01-24 17:51:53 +01:00
|
|
|
#define for_each_gpu_id_in_mask(gpu_id, mask) \
|
|
|
|
for ((gpu_id) = uvm_processor_mask_find_first_gpu_id((mask)); \
|
|
|
|
UVM_ID_IS_VALID(gpu_id); \
|
|
|
|
(gpu_id) = uvm_processor_mask_find_next_id((mask), uvm_gpu_id_next(gpu_id)))
|
2022-05-09 13:18:59 -07:00
|
|
|
|
2024-01-24 17:51:53 +01:00
|
|
|
// Helper to iterate over all valid parent gpu ids.
|
|
|
|
#define for_each_parent_gpu_id(i) \
|
2023-10-17 09:25:29 -07:00
|
|
|
for (i = uvm_parent_gpu_id_from_value(UVM_PARENT_ID_GPU0_VALUE); UVM_PARENT_ID_IS_VALID(i); i = uvm_parent_gpu_id_next(i))
|
2022-05-09 13:18:59 -07:00
|
|
|
|
2024-01-24 17:51:53 +01:00
|
|
|
// Helper to iterate over all valid gpu ids.
|
|
|
|
#define for_each_gpu_id(i) \
|
|
|
|
for (i = uvm_gpu_id_from_value(UVM_ID_GPU0_VALUE); UVM_ID_IS_VALID(i); i = uvm_gpu_id_next(i))
|
2022-05-09 13:18:59 -07:00
|
|
|
|
2024-01-24 17:51:53 +01:00
|
|
|
// Helper to iterate over all gpu ids in a given parent id.
|
|
|
|
#define for_each_sub_processor_id_in_parent_gpu(i, id) \
|
|
|
|
for (i = uvm_gpu_id_from_parent_gpu_id(id); \
|
|
|
|
UVM_ID_IS_VALID(i) && \
|
|
|
|
(uvm_id_value(i) < uvm_id_value(uvm_gpu_id_from_parent_gpu_id(id)) + UVM_PARENT_ID_MAX_SUB_PROCESSORS); \
|
|
|
|
i = uvm_gpu_id_next(i))
|
2022-05-09 13:18:59 -07:00
|
|
|
|
2024-02-23 16:37:56 +01:00
|
|
|
// Helper to iterate over all sub processor indexes.
|
|
|
|
#define for_each_sub_processor_index(i) \
|
|
|
|
for (i = 0; i < UVM_PARENT_ID_MAX_SUB_PROCESSORS; i++)
|
|
|
|
|
2024-01-24 17:51:53 +01:00
|
|
|
// Helper to iterate over all valid processor ids.
|
|
|
|
#define for_each_id(i) for (i = UVM_ID_CPU; UVM_ID_IS_VALID(i); i = uvm_id_next(i))
|
2022-05-09 13:18:59 -07:00
|
|
|
|
2023-10-17 09:25:29 -07:00
|
|
|
// Find the node in mask with the shorted distance (as returned by
|
|
|
|
// node_distance) for src.
|
|
|
|
// Note that the search is inclusive of src.
|
|
|
|
// If mask has no bits set, NUMA_NO_NODE is returned.
|
|
|
|
int uvm_find_closest_node_mask(int src, const nodemask_t *mask);
|
|
|
|
|
|
|
|
// Iterate over all nodes in mask with increasing distance from src.
|
|
|
|
// Note that this iterator is destructive of the mask.
|
|
|
|
#define for_each_closest_uvm_node(nid, src, mask) \
|
|
|
|
for ((nid) = uvm_find_closest_node_mask((src), &(mask)); \
|
|
|
|
(nid) != NUMA_NO_NODE; \
|
|
|
|
node_clear((nid), (mask)), (nid) = uvm_find_closest_node_mask((src), &(mask)))
|
|
|
|
|
|
|
|
#define for_each_possible_uvm_node(nid) for_each_node_mask((nid), node_possible_map)
|
|
|
|
|
2024-01-24 17:51:53 +01:00
|
|
|
// Compare two NUMA node IDs for equality.
|
|
|
|
// The main purpose of this helper is to correctly compare
|
|
|
|
// in situations when the system has only a single NUMA node
|
|
|
|
// (which is also the case when NUMA support is disabled).
|
|
|
|
bool uvm_numa_id_eq(int nid0, int nid1);
|
|
|
|
|
|
|
|
static bool uvm_uuid_eq(const NvProcessorUuid *uuid0, const NvProcessorUuid *uuid1)
|
2022-05-09 13:18:59 -07:00
|
|
|
{
|
2024-01-24 17:51:53 +01:00
|
|
|
return memcmp(uuid0, uuid1, sizeof(*uuid0)) == 0;
|
2022-05-09 13:18:59 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
// Copies a UUID from source (src) to destination (dst).
|
2024-01-24 17:51:53 +01:00
|
|
|
static void uvm_uuid_copy(NvProcessorUuid *dst, const NvProcessorUuid *src)
|
2022-05-09 13:18:59 -07:00
|
|
|
{
|
|
|
|
memcpy(dst, src, sizeof(*dst));
|
|
|
|
}
|
|
|
|
|
2024-01-24 17:51:53 +01:00
|
|
|
static inline NvBool uvm_uuid_is_cpu(const NvProcessorUuid *uuid)
|
2023-10-17 09:25:29 -07:00
|
|
|
{
|
2024-01-24 17:51:53 +01:00
|
|
|
return memcmp(uuid, &NV_PROCESSOR_UUID_CPU_DEFAULT, sizeof(*uuid)) == 0;
|
2023-10-17 09:25:29 -07:00
|
|
|
}
|
|
|
|
|
2024-01-24 17:51:53 +01:00
|
|
|
// Dynamic uvm_processor_mask_t object allocation/maintenance.
|
|
|
|
NV_STATUS uvm_processor_mask_cache_init(void);
|
|
|
|
void uvm_processor_mask_cache_exit(void);
|
|
|
|
uvm_processor_mask_t *uvm_processor_mask_cache_alloc(void);
|
|
|
|
void uvm_processor_mask_cache_free(uvm_processor_mask_t *mask);
|
2023-10-17 09:25:29 -07:00
|
|
|
|
2022-05-09 13:18:59 -07:00
|
|
|
#endif
|