Skip to content

Commit

Permalink
Intel(R) oneAPI Collective Communications Library (oneCCL) 2021.14 (#144
Browse files Browse the repository at this point in the history
)
  • Loading branch information
nikitaxgusev authored Nov 6, 2024
1 parent cc09ee2 commit 3afa1bb
Show file tree
Hide file tree
Showing 256 changed files with 9,624 additions and 3,089 deletions.
4 changes: 2 additions & 2 deletions CMakeLists.txt
Original file line number Diff line number Diff line change
Expand Up @@ -308,8 +308,8 @@ file(GLOB spv_kernels "${PROJECT_SOURCE_DIR}/src/kernels/kernels.spv")
endif()

set(CCL_MAJOR_VERSION "2021")
set(CCL_MINOR_VERSION "13")
set(CCL_UPDATE_VERSION "1")
set(CCL_MINOR_VERSION "14")
set(CCL_UPDATE_VERSION "0")
set(CCL_PRODUCT_STATUS "Gold")
# Record the configure-time timestamp in CCL_PRODUCT_BUILD_DATE.
# The format ends with a literal "Z" (the UTC designator), so UTC must be
# requested explicitly: without the UTC keyword string(TIMESTAMP) reports
# local time, which would then be mislabelled as UTC.
string(TIMESTAMP CCL_PRODUCT_BUILD_DATE "%Y-%m-%dT %H:%M:%SZ" UTC)
get_vcs_properties("git")
Expand Down
Binary file modified deps/hwloc/lib/libhwloc.a
Binary file not shown.
185 changes: 182 additions & 3 deletions deps/itt/include/ittnotify.h
Original file line number Diff line number Diff line change
Expand Up @@ -90,13 +90,19 @@ The same ID may not be reused for different instances, unless a previous
# define ITT_OS_FREEBSD 4
#endif /* ITT_OS_FREEBSD */

/* Numeric identifier for OpenBSD; a candidate value for ITT_OS.
 * Guarded so that a definition supplied before this point is kept. */
#ifndef ITT_OS_OPENBSD
# define ITT_OS_OPENBSD 5
#endif /* ITT_OS_OPENBSD */

#ifndef ITT_OS
# if defined WIN32 || defined _WIN32
# define ITT_OS ITT_OS_WIN
# elif defined( __APPLE__ ) && defined( __MACH__ )
# define ITT_OS ITT_OS_MAC
# elif defined( __FreeBSD__ )
# define ITT_OS ITT_OS_FREEBSD
# elif defined( __OpenBSD__)
# define ITT_OS ITT_OS_OPENBSD
# else
# define ITT_OS ITT_OS_LINUX
# endif
Expand All @@ -118,13 +124,19 @@ The same ID may not be reused for different instances, unless a previous
# define ITT_PLATFORM_FREEBSD 4
#endif /* ITT_PLATFORM_FREEBSD */

/* Numeric identifier for the OpenBSD platform; a candidate value for ITT_PLATFORM.
 * Guarded so that a definition supplied before this point is kept. */
#ifndef ITT_PLATFORM_OPENBSD
# define ITT_PLATFORM_OPENBSD 5
#endif /* ITT_PLATFORM_OPENBSD */

#ifndef ITT_PLATFORM
# if ITT_OS==ITT_OS_WIN
# define ITT_PLATFORM ITT_PLATFORM_WIN
# elif ITT_OS==ITT_OS_MAC
# define ITT_PLATFORM ITT_PLATFORM_MAC
# elif ITT_OS==ITT_OS_FREEBSD
# define ITT_PLATFORM ITT_PLATFORM_FREEBSD
# elif ITT_OS==ITT_OS_OPENBSD
# define ITT_PLATFORM ITT_PLATFORM_OPENBSD
# else
# define ITT_PLATFORM ITT_PLATFORM_POSIX
# endif
Expand Down Expand Up @@ -294,7 +306,7 @@ extern "C" {
* only pauses tracing and analyzing memory access.
* It does not pause tracing or analyzing threading APIs.
* .
* - Intel(R) Parallel Amplifier and Intel(R) VTune(TM) Amplifier XE:
* - Intel(R) VTune(TM) Profiler:
* - Does continue to record when new threads are started.
* .
* - Other effects:
Expand Down Expand Up @@ -613,12 +625,12 @@ typedef enum __itt_suppress_mode {

/**
* @enum __itt_collection_state
* @brief Enumerator for collection state. All non-work states have negative values.
* @brief Enumerator for collection state.
*/
typedef enum {
__itt_collection_uninitialized = 0, /* uninitialized */
__itt_collection_init_fail = 1, /* failed to init */
__itt_collection_collector_absent = 2, /* non work state collector exists */
__itt_collection_collector_absent = 2, /* non work state collector is absent */
__itt_collection_collector_exists = 3, /* work state collector exists */
__itt_collection_init_successful = 4 /* success to init */
} __itt_collection_state;
Expand Down Expand Up @@ -4021,6 +4033,173 @@ __itt_collection_state __itt_get_collection_state(void);
void __itt_release_resources(void);
/** @endcond */

/**
 * @brief Create a typed counter with given domain pointer, string name and counter type
 * @param[in] domain Pointer to the domain passed for the new counter.
 * @param[in] name   Counter name: a char string, or a wchar_t string for the
 *                   W variant declared on Windows.
 * @param[in] type   Counter type, given as an __itt_metadata_type value.
 * @return An __itt_counter value.
 *
 * On Windows both an A (char) and a W (wchar_t) variant are declared, and
 * __itt_counter_create_v3 / __itt_counter_create_v3_ptr are aliased to the W
 * names when UNICODE or _UNICODE is defined and to the A names otherwise.
 * On every other platform a single char-based function is declared.
 */
#if ITT_PLATFORM==ITT_PLATFORM_WIN
__itt_counter ITTAPI __itt_counter_createA_v3(const __itt_domain* domain, const char* name, __itt_metadata_type type);
__itt_counter ITTAPI __itt_counter_createW_v3(const __itt_domain* domain, const wchar_t* name, __itt_metadata_type type);
#if defined(UNICODE) || defined(_UNICODE)
# define __itt_counter_create_v3 __itt_counter_createW_v3
# define __itt_counter_create_v3_ptr __itt_counter_createW_v3_ptr
#else /* UNICODE */
# define __itt_counter_create_v3 __itt_counter_createA_v3
# define __itt_counter_create_v3_ptr __itt_counter_createA_v3_ptr
#endif /* UNICODE */
#else /* ITT_PLATFORM==ITT_PLATFORM_WIN */
__itt_counter ITTAPI __itt_counter_create_v3(const __itt_domain* domain, const char* name, __itt_metadata_type type);
#endif /* ITT_PLATFORM==ITT_PLATFORM_WIN */

/** @cond exclude_from_documentation */
/*
 * Stub and macro definitions for the counter_create_v3 entry points.
 *
 * - Default build: the stubs are declared through ITT_STUB and the public
 *   names are routed through ITTNOTIFY_DATA / ITTNOTIFY_NAME.
 * - INTEL_NO_ITTNOTIFY_API: calls expand to (__itt_counter)0 and every
 *   *_ptr name expands to 0.
 * - INTEL_NO_MACRO_BODY: only the *_ptr names are defined, as 0.
 */
#ifndef INTEL_NO_MACRO_BODY
#ifndef INTEL_NO_ITTNOTIFY_API
#if ITT_PLATFORM==ITT_PLATFORM_WIN
ITT_STUB(ITTAPI, __itt_counter, counter_createA_v3, (const __itt_domain* domain, const char* name, __itt_metadata_type type))
ITT_STUB(ITTAPI, __itt_counter, counter_createW_v3, (const __itt_domain* domain, const wchar_t* name, __itt_metadata_type type))
#else /* ITT_PLATFORM==ITT_PLATFORM_WIN */
ITT_STUB(ITTAPI, __itt_counter, counter_create_v3, (const __itt_domain* domain, const char* name, __itt_metadata_type type))
#endif /* ITT_PLATFORM==ITT_PLATFORM_WIN */
#if ITT_PLATFORM==ITT_PLATFORM_WIN
#define __itt_counter_createA_v3 ITTNOTIFY_DATA(counter_createA_v3)
#define __itt_counter_createA_v3_ptr ITTNOTIFY_NAME(counter_createA_v3)
#define __itt_counter_createW_v3 ITTNOTIFY_DATA(counter_createW_v3)
#define __itt_counter_createW_v3_ptr ITTNOTIFY_NAME(counter_createW_v3)
#else /* ITT_PLATFORM==ITT_PLATFORM_WIN */
#define __itt_counter_create_v3 ITTNOTIFY_DATA(counter_create_v3)
#define __itt_counter_create_v3_ptr ITTNOTIFY_NAME(counter_create_v3)
#endif /* ITT_PLATFORM==ITT_PLATFORM_WIN */
#else /* INTEL_NO_ITTNOTIFY_API */
#if ITT_PLATFORM==ITT_PLATFORM_WIN
#define __itt_counter_createA_v3(domain, name, type) (__itt_counter)0
#define __itt_counter_createA_v3_ptr 0
#define __itt_counter_createW_v3(domain, name, type) (__itt_counter)0
/* The W pointer name must be the _v3 one: it is what the UNICODE alias
 * __itt_counter_create_v3_ptr resolves to, and it mirrors the A variant
 * above. This line previously defined __itt_counter_create_typedW_ptr,
 * which left __itt_counter_createW_v3_ptr undefined in this configuration. */
#define __itt_counter_createW_v3_ptr 0
#else /* ITT_PLATFORM==ITT_PLATFORM_WIN */
#define __itt_counter_create_v3(domain, name, type) (__itt_counter)0
#define __itt_counter_create_v3_ptr 0
#endif /* ITT_PLATFORM==ITT_PLATFORM_WIN */
#endif /* INTEL_NO_ITTNOTIFY_API */
#else /* INTEL_NO_MACRO_BODY */
#if ITT_PLATFORM==ITT_PLATFORM_WIN
#define __itt_counter_createA_v3_ptr 0
#define __itt_counter_createW_v3_ptr 0
#else /* ITT_PLATFORM==ITT_PLATFORM_WIN */
#define __itt_counter_create_v3_ptr 0
#endif /* ITT_PLATFORM==ITT_PLATFORM_WIN */
#endif /* INTEL_NO_MACRO_BODY */
/** @endcond */

/**
 * @brief Set the counter value api
 * @param[in] counter   The counter whose value is being set.
 * @param[in] value_ptr Untyped pointer to the value to set.
 *                      NOTE(review): the pointee type presumably has to match
 *                      the type the counter was created with - confirm.
 */
void ITTAPI __itt_counter_set_value_v3(__itt_counter counter, void *value_ptr);

/** @cond exclude_from_documentation */
/* Stub/macro plumbing: with INTEL_NO_ITTNOTIFY_API the call expands to nothing
 * and the _ptr name to 0; with INTEL_NO_MACRO_BODY only the _ptr name is
 * defined (as 0). */
#ifndef INTEL_NO_MACRO_BODY
#ifndef INTEL_NO_ITTNOTIFY_API
ITT_STUBV(ITTAPI, void, counter_set_value_v3, (__itt_counter counter, void *value_ptr))
#define __itt_counter_set_value_v3 ITTNOTIFY_VOID(counter_set_value_v3)
#define __itt_counter_set_value_v3_ptr ITTNOTIFY_NAME(counter_set_value_v3)
#else /* INTEL_NO_ITTNOTIFY_API */
#define __itt_counter_set_value_v3(counter, value_ptr)
#define __itt_counter_set_value_v3_ptr 0
#endif /* INTEL_NO_ITTNOTIFY_API */
#else /* INTEL_NO_MACRO_BODY */
#define __itt_counter_set_value_v3_ptr 0
#endif /* INTEL_NO_MACRO_BODY */
/** @endcond */

/**
 * @brief Tag identifying which kind of context metadata a value carries.
 *
 * The numeric values are spelled out explicitly; they are the same values the
 * implicit numbering (starting at 0) would assign.
 */
typedef enum {
    __itt_context_unknown               = 0,  /*!< Undefined type */
    __itt_context_nameA                 = 1,  /*!< ASCII string char* type */
    __itt_context_nameW                 = 2,  /*!< Unicode string wchar_t* type */
    __itt_context_deviceA               = 3,  /*!< ASCII string char* type */
    __itt_context_deviceW               = 4,  /*!< Unicode string wchar_t* type */
    __itt_context_unitsA                = 5,  /*!< ASCII string char* type */
    __itt_context_unitsW                = 6,  /*!< Unicode string wchar_t* type */
    __itt_context_pci_addrA             = 7,  /*!< ASCII string char* type */
    __itt_context_pci_addrW             = 8,  /*!< Unicode string wchar_t* type */
    __itt_context_tid                   = 9,  /*!< Unsigned 64-bit integer type */
    __itt_context_max_val               = 10, /*!< Unsigned 64-bit integer type */
    __itt_context_bandwidth_flag        = 11, /*!< Unsigned 64-bit integer type */
    __itt_context_latency_flag          = 12, /*!< Unsigned 64-bit integer type */
    __itt_context_occupancy_flag        = 13, /*!< Unsigned 64-bit integer type */
    __itt_context_on_thread_flag        = 14, /*!< Unsigned 64-bit integer type */
    __itt_context_is_abs_val_flag       = 15, /*!< Unsigned 64-bit integer type */
    __itt_context_cpu_instructions_flag = 16, /*!< Unsigned 64-bit integer type */
    __itt_context_cpu_cycles_flag       = 17  /*!< Unsigned 64-bit integer type */
} __itt_context_type;

/* Character-set neutral aliases for the string-valued context types:
 * they map to the A enumerators by default and to the W enumerators when
 * UNICODE or _UNICODE is defined. */
#if !defined(UNICODE) && !defined(_UNICODE)
#define __itt_context_name     __itt_context_nameA
#define __itt_context_device   __itt_context_deviceA
#define __itt_context_units    __itt_context_unitsA
#define __itt_context_pci_addr __itt_context_pci_addrA
#else /* UNICODE || _UNICODE */
#define __itt_context_name     __itt_context_nameW
#define __itt_context_device   __itt_context_deviceW
#define __itt_context_units    __itt_context_unitsW
#define __itt_context_pci_addr __itt_context_pci_addrW
#endif /* !UNICODE && !_UNICODE */

/** @cond exclude_from_documentation */
#pragma pack(push, 8)

/* A single context metadata entry: a type tag paired with an untyped pointer
 * to the value. Declared under 8-byte packing. */
struct ___itt_context_metadata
{
    __itt_context_type type;  /*!< Type of the context metadata value */
    void*              value; /*!< Pointer to context metadata value itself */
};
typedef struct ___itt_context_metadata __itt_context_metadata;

#pragma pack(pop)
/** @endcond */

/** @cond exclude_from_documentation */
#pragma pack(push, 8)

/* Record tying one piece of context metadata to a counter. It is declared
 * under 8-byte packing and carries a pointer to another record of the same
 * type, so member order and types must not be changed. */
typedef struct ___itt_counter_metadata
{
__itt_counter counter; /*!< Associated context metadata counter */
__itt_context_type type; /*!< Type of the context metadata value */
const char* str_valueA; /*!< String context metadata value */
#if defined(UNICODE) || defined(_UNICODE)
const wchar_t* str_valueW; /*!< Wide-character string context metadata value */
#else /* UNICODE || _UNICODE */
void* str_valueW; /*!< Same member, declared as an untyped pointer when neither UNICODE nor _UNICODE is defined */
#endif /* UNICODE || _UNICODE */
unsigned long long value; /*!< Numeric context metadata value */
int extra1; /*!< Reserved to the runtime */
void* extra2; /*!< Reserved to the runtime */
struct ___itt_counter_metadata* next; /*!< Pointer to another record of this type (presumably the next node of a linked list - TODO confirm) */
} __itt_counter_metadata;

#pragma pack(pop)
/** @endcond */

/**
 * @brief Attach an array of context metadata entries to a counter instance
 * @param[in] counter  Pointer to the counter instance to which the context metadata is to be associated.
 * @param[in] length   The number of elements in context metadata array.
 * @param[in] metadata The context metadata itself.
 */
void ITTAPI __itt_bind_context_metadata_to_counter(__itt_counter counter, size_t length, __itt_context_metadata* metadata);

/** @cond exclude_from_documentation */
/* Three configurations:
 *  - INTEL_NO_MACRO_BODY:    only the _ptr name is defined (as 0);
 *  - INTEL_NO_ITTNOTIFY_API: the call expands to nothing, the _ptr name to 0;
 *  - default:                stub declared via ITT_STUBV, names routed through
 *                            ITTNOTIFY_VOID / ITTNOTIFY_NAME. */
#ifdef INTEL_NO_MACRO_BODY
#define __itt_bind_context_metadata_to_counter_ptr 0
#else /* !INTEL_NO_MACRO_BODY */
#ifdef INTEL_NO_ITTNOTIFY_API
#define __itt_bind_context_metadata_to_counter(counter, length, metadata)
#define __itt_bind_context_metadata_to_counter_ptr 0
#else /* !INTEL_NO_ITTNOTIFY_API */
ITT_STUBV(ITTAPI, void, bind_context_metadata_to_counter, (__itt_counter counter, size_t length, __itt_context_metadata* metadata))
#define __itt_bind_context_metadata_to_counter ITTNOTIFY_VOID(bind_context_metadata_to_counter)
#define __itt_bind_context_metadata_to_counter_ptr ITTNOTIFY_NAME(bind_context_metadata_to_counter)
#endif /* INTEL_NO_ITTNOTIFY_API */
#endif /* INTEL_NO_MACRO_BODY */
/** @endcond */

#ifdef __cplusplus
}
#endif /* __cplusplus */
Expand Down
Binary file modified deps/itt/lib64/libittnotify.a
Binary file not shown.
Binary file modified deps/itt/lib64/tracing_functions.so
Binary file not shown.
12 changes: 10 additions & 2 deletions deps/level_zero/include/ze_api.h
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,7 @@
* SPDX-License-Identifier: MIT
*
* @file ze_api.h
* @version v1.9-r1.9.1
* @version v1.9-r1.9.3
*
*/
#ifndef _ZE_API_H
Expand Down Expand Up @@ -1443,7 +1443,7 @@ typedef struct _ze_device_properties_t
///< structure (i.e. contains stype and pNext).
ze_device_type_t type; ///< [out] generic device type
uint32_t vendorId; ///< [out] vendor id from PCI configuration
uint32_t deviceId; ///< [out] device id from PCI configuration
uint32_t deviceId; ///< [out] device id from PCI configuration.
///< Note, the device id uses little-endian format.
ze_device_property_flags_t flags; ///< [out] 0 (none) or a valid combination of ::ze_device_property_flag_t
uint32_t subdeviceId; ///< [out] sub-device id. Only valid if ::ZE_DEVICE_PROPERTY_FLAG_SUBDEVICE
Expand Down Expand Up @@ -4697,6 +4697,9 @@ typedef enum _ze_image_format_layout_t
ZE_IMAGE_FORMAT_LAYOUT_444P = 40, ///< Media Format: 444P. Format type and swizzle is ignored for this.
ZE_IMAGE_FORMAT_LAYOUT_RGBP = 41, ///< Media Format: RGBP. Format type and swizzle is ignored for this.
ZE_IMAGE_FORMAT_LAYOUT_BRGP = 42, ///< Media Format: BRGP. Format type and swizzle is ignored for this.
ZE_IMAGE_FORMAT_LAYOUT_8_8_8 = 43, ///< 3-component 8-bit layout
ZE_IMAGE_FORMAT_LAYOUT_16_16_16 = 44, ///< 3-component 16-bit layout
ZE_IMAGE_FORMAT_LAYOUT_32_32_32 = 45, ///< 3-component 32-bit layout
ZE_IMAGE_FORMAT_LAYOUT_FORCE_UINT32 = 0x7fffffff

} ze_image_format_layout_t;
Expand Down Expand Up @@ -10545,6 +10548,9 @@ typedef enum _ze_image_bindless_exp_flag_t
{
ZE_IMAGE_BINDLESS_EXP_FLAG_BINDLESS = ZE_BIT(0), ///< Bindless images are created with ::zeImageCreate. The image handle
///< created with this flag is valid on both host and device.
ZE_IMAGE_BINDLESS_EXP_FLAG_SAMPLED_IMAGE = ZE_BIT(1), ///< Bindless sampled images are created with ::zeImageCreate by combining
///< BINDLESS and SAMPLED_IMAGE.
///< Create sampled image view from bindless unsampled image using SAMPLED_IMAGE.
ZE_IMAGE_BINDLESS_EXP_FLAG_FORCE_UINT32 = 0x7fffffff

} ze_image_bindless_exp_flag_t;
Expand All @@ -10564,6 +10570,8 @@ typedef struct _ze_image_bindless_exp_desc_t
///< When the flag is passed to ::zeImageCreate, then only the memory for
///< the image is allocated.
///< Additional image handles can be created with ::zeImageViewCreateExt.
///< When ::ZE_IMAGE_BINDLESS_EXP_FLAG_SAMPLED_IMAGE flag is passed,
///< ::ze_sampler_desc_t must be attached via pNext member of ::ze_image_bindless_exp_desc_t.

} ze_image_bindless_exp_desc_t;

Expand Down
2 changes: 1 addition & 1 deletion deps/level_zero/include/zes_api.h
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,7 @@
* SPDX-License-Identifier: MIT
*
* @file zes_api.h
* @version v1.9-r1.9.1
* @version v1.9-r1.9.3
*
*/
#ifndef _ZES_API_H
Expand Down
Binary file modified deps/mpi/bin/hydra_bstrap_proxy
Binary file not shown.
Binary file modified deps/mpi/bin/hydra_nameserver
Binary file not shown.
Binary file modified deps/mpi/bin/hydra_pmi_proxy
Binary file not shown.
1 change: 0 additions & 1 deletion deps/mpi/bin/mpicc
Original file line number Diff line number Diff line change
Expand Up @@ -42,7 +42,6 @@ for arg in "$@" ; do
done

compiler_short_name=`basename ${compiler_name:?}`
compiler_short_name="${compiler_short_name##*-}"

opt_args=""
if [ $# -eq 1 -a "$1" = "-v" ] ; then
Expand Down
1 change: 0 additions & 1 deletion deps/mpi/bin/mpicxx
Original file line number Diff line number Diff line change
Expand Up @@ -42,7 +42,6 @@ for arg in "$@" ; do
done

compiler_short_name=`basename ${compiler_name:?}`
compiler_short_name="${compiler_short_name##*-}"

opt_args=""
if [ $# -eq 1 -a "$1" = "-v" ] ; then
Expand Down
Binary file modified deps/mpi/bin/mpiexec
Binary file not shown.
Binary file modified deps/mpi/bin/mpiexec.hydra
Binary file not shown.
2 changes: 1 addition & 1 deletion deps/mpi/bin/mpigcc
Original file line number Diff line number Diff line change
Expand Up @@ -126,7 +126,7 @@ CC="gcc"
MPICH_VERSION="3.4a2"
CFLAGS=""
CPPFLAGS=""
MPIVERSION="2021.13"
MPIVERSION="2021.14"
MPILIBNAME="mpi"


Expand Down
2 changes: 1 addition & 1 deletion deps/mpi/bin/mpigxx
Original file line number Diff line number Diff line change
Expand Up @@ -123,7 +123,7 @@ fi
CXX="g++"
MPICH_VERSION="3.4a2"
CXXFLAGS=""
MPIVERSION="2021.13"
MPIVERSION="2021.14"
MPILIBNAME="mpi"
MPICXXLIBNAME="mpicxx"

Expand Down
2 changes: 1 addition & 1 deletion deps/mpi/bin/mpiicpx
Original file line number Diff line number Diff line change
Expand Up @@ -129,7 +129,7 @@ MPILIBNAME="mpi"
MPICXXLIBNAME="mpicxx"

# MPIVERSION is the version of the Intel(R) MPI Library that mpiicpx is intended for
MPIVERSION="@IMPI_OFFICIALVERSION@"
MPIVERSION="2021.14"

# Internal variables
# Show is set to echo to cause the compilation command to be echoed instead
Expand Down
2 changes: 1 addition & 1 deletion deps/mpi/bin/mpiicx
Original file line number Diff line number Diff line change
Expand Up @@ -131,7 +131,7 @@ LDFLAGS="-ldl"
MPILIBNAME="mpi"

# MPIVERSION is the version of the Intel(R) MPI Library that mpiicx is intended for
MPIVERSION="@IMPI_OFFICIALVERSION@"
MPIVERSION="2021.14"
#
# Internal variables
# Show is set to echo to cause the compilation command to be echoed instead
Expand Down
Binary file modified deps/mpi/lib/libmpi.so
Binary file not shown.
Binary file modified deps/mpi/lib/libmpi.so.12
Binary file not shown.
Binary file modified deps/mpi/lib/libmpi.so.12.0
Binary file not shown.
Binary file modified deps/mpi/lib/libmpi.so.12.0.0
Binary file not shown.
Binary file modified deps/mpi/lib/libmpifort.so
Binary file not shown.
Binary file modified deps/mpi/lib/libmpifort.so.12
Binary file not shown.
Binary file modified deps/mpi/lib/libmpifort.so.12.0
Binary file not shown.
Binary file modified deps/mpi/lib/libmpifort.so.12.0.0
Binary file not shown.
Binary file modified deps/mpi/opt/mpi/etc/tuning_clx-ap_shm-ofi.dat
Binary file not shown.
Binary file added deps/mpi/opt/mpi/etc/tuning_gnr_shm-ofi.dat
Binary file not shown.
Binary file added deps/mpi/opt/mpi/etc/tuning_gnr_shm.dat
Binary file not shown.
Binary file added deps/mpi/opt/mpi/etc/tuning_srf_shm-ofi.dat
Binary file not shown.
Binary file added deps/mpi/opt/mpi/etc/tuning_srf_shm.dat
Binary file not shown.
Binary file modified deps/ofi/bin/fi_info
Binary file not shown.
Loading

0 comments on commit 3afa1bb

Please sign in to comment.