From 5d0c0757bdf8160c290f93a4b1e826e36e5e3f78 Mon Sep 17 00:00:00 2001 From: Arun Karthik Date: Tue, 10 Dec 2024 23:28:35 +0000 Subject: [PATCH] Release v1.13.2-aws Signed-off-by: Arun Karthik --- RELEASENOTES.md | 29 +++++++++++++++++++++++++++++ configure.ac | 2 +- 2 files changed, 30 insertions(+), 1 deletion(-) diff --git a/RELEASENOTES.md b/RELEASENOTES.md index c4e0e0e58..926aae4b2 100644 --- a/RELEASENOTES.md +++ b/RELEASENOTES.md @@ -12,6 +12,35 @@ have unified the code into a single branch, and made the AWS-specific parts a compile-time option. When a feature (or entire release) only supports one of the two variants, we note that in the release notes. +# v1.13.2-aws (2024-12-06) + +This release is intended only for use on AWS P\* instances. A general release +that supports other libfabric networks may be made in the near future. + +With this release, building with platform-aws requires +[1.22.0amzn4.0](https://github.com/aws/libfabric/commits/1.22.0amzn4.0/) +or greater. AWS customers are generally recommended to track +[the latest-available EFA Installer](https://docs.aws.amazon.com/AWSEC2/latest/UserGuide/efa-verify.html) +for performance improvements and bug fixes. + +The 1.13.x release series supports +[NCCL 2.23.4-1](https://github.com/NVIDIA/nccl/releases/tag/v2.23.4-1) +while maintaining backward compatibility with older NCCL versions +([NCCL v2.17.1](https://github.com/NVIDIA/nccl/releases/tag/v2.17.1-1) and later). + +Bug Fixes: + + - Tuner Improvements: + - Fixed algorithm selection for larger ranks and message sizes. + - Re-calibrated the tuner for AllGather and ReduceScatter regions for 0x7 bitmask on P5en, + optimizing performance for larger messages. + - Added tuner support for AllGather and ReduceScatter regions for 0x0 bitmask on P5en. + + - Resolved a performance issue by preventing the eager protocol when RDMA writes are in flight, + improving small AllReduce collective performance. + +Note: dmabuf support is now turned off by default. Users can enable it explicitly using `OFI_NCCL_DISABLE_DMABUF=0` if needed. + # v1.13.1-aws (2024-11-25) This release is intended only for use on AWS P\* instances. A general release diff --git a/configure.ac b/configure.ac index df6310b5e..a888960b3 100644 --- a/configure.ac +++ b/configure.ac @@ -6,7 +6,7 @@ # # Initialization -AC_INIT([aws-ofi-nccl], [1.13.2a1-aws], [al-ofi-nccl-team@amazon.com], , [http://github.com/aws/aws-ofi-nccl]) +AC_INIT([aws-ofi-nccl], [1.13.2-aws], [al-ofi-nccl-team@amazon.com], , [http://github.com/aws/aws-ofi-nccl]) AC_PREREQ([2.69]) AC_CONFIG_SRCDIR([src/nccl_ofi_net.c]) AC_CONFIG_AUX_DIR([build-aux])