diff --git a/CHANGELOG.md b/CHANGELOG.md index 67c4cdf0..2a129995 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -3,7 +3,7 @@ Documentation for rocRAND is available at [https://rocm.docs.amd.com/projects/rocRAND/en/latest/](https://rocm.docs.amd.com/projects/rocRAND/en/latest/) -## (Unreleased) rocRAND 3.3.0 for ROCm 6.4 +## rocRAND 3.3.0 for ROCm 6.4 ### Added @@ -34,14 +34,15 @@ Documentation for rocRAND is available at ### Changed +* Updated the default value for the `-a` argument from `rmake.py` to `gfx906:xnack-,gfx1030,gfx1100,gfx1101,gfx1102,gfx1151,gfx1200,gfx1201`. * `rocrand_discrete` for MTGP32, LFSR113 and ThreeFry generators now uses the alias method, which is faster than binary search in CDF. ## rocRAND 3.1.1 for ROCm 6.2.4 ## Fixes -* Fixed " unknown extension ?>" issue in scripts/config-tuning/select_best_config.py - when using python version thats older than 3.11 +* Fixed an issue in `rmake.py` where the list storing cmake options would contain individual characters instead of a full string of options. +* Fixed " unknown extension ?>" issue in scripts/config-tuning/select_best_config.py when using python version that is older than 3.11 * Fixed low random sequence quality of `ROCRAND_RNG_PSEUDO_THREEFRY2_64_20` and `ROCRAND_RNG_PSEUDO_THREEFRY4_64_20`. ## rocRAND 3.1.0 for ROCm 6.2.0 @@ -118,7 +119,7 @@ Documentation for rocRAND is available at ### Known issues - SOBOL64 and SCRAMBLED_SOBOL64 generate poisson-distributed `unsigned long long int` numbers instead of `unsigned int`. This will be fixed in the next major release. 
-## (Unreleased) rocRAND-3.0.0 for ROCm 6.0.0 +## rocRAND-3.0.0 for ROCm 6.0.0 ### Additions diff --git a/CMakeLists.txt b/CMakeLists.txt index 47187067..9c7e98f9 100644 --- a/CMakeLists.txt +++ b/CMakeLists.txt @@ -123,7 +123,7 @@ if(GPU_TARGETS STREQUAL "all") if(BUILD_ADDRESS_SANITIZER) # ASAN builds require xnack rocm_check_target_ids(DEFAULT_AMDGPU_TARGETS - TARGETS "gfx908:xnack+;gfx90a:xnack+;gfx940:xnack+;gfx941:xnack+;gfx942:xnack+" + TARGETS "gfx908:xnack+;gfx90a:xnack+;gfx942:xnack+" ) else() rocm_check_target_ids(DEFAULT_AMDGPU_TARGETS diff --git a/cmake/Dependencies.cmake b/cmake/Dependencies.cmake index 09b7286a..23aa4108 100644 --- a/cmake/Dependencies.cmake +++ b/cmake/Dependencies.cmake @@ -94,14 +94,6 @@ if(BUILD_BENCHMARK) message(FATAL_ERROR "DownloadProject.cmake doesn't support multi-configuration generators.") endif() set(GOOGLEBENCHMARK_ROOT ${CMAKE_CURRENT_BINARY_DIR}/deps/googlebenchmark CACHE PATH "") - if(NOT (CMAKE_CXX_COMPILER_ID STREQUAL "GNU")) - # hip-clang cannot compile googlebenchmark for some reason - if(WIN32) - set(COMPILER_OVERRIDE "-DCMAKE_CXX_COMPILER=cl") - else() - set(COMPILER_OVERRIDE "-DCMAKE_CXX_COMPILER=g++") - endif() - endif() download_project( PROJ googlebenchmark diff --git a/rmake.py b/rmake.py index 27fefeed..90887d29 100644 --- a/rmake.py +++ b/rmake.py @@ -21,6 +21,9 @@ def parse_args(): parser = argparse.ArgumentParser(description=""" Checks build arguments """) + + default_gpus = 'gfx906:xnack-,gfx1030,gfx1100,gfx1101,gfx1102,gfx1151,gfx1200,gfx1201' + parser.add_argument('-g', '--debug', required=False, default=False, action='store_true', help='Generate Debug build (default: False)') parser.add_argument( '--build_dir', type=str, required=False, default="build", @@ -38,7 +41,7 @@ def parse_args(): help='Install after build (default: False)') parser.add_argument( '--cmake-darg', required=False, dest='cmake_dargs', action='append', default=[], help='List of additional cmake defines for builds (e.g. 
CMAKE_CXX_COMPILER_LAUNCHER=ccache)') - parser.add_argument('-a', '--architecture', dest='gpu_architecture', required=False, default="gfx906;gfx1030;gfx1100;gfx1101;gfx1102", #:sramecc+:xnack-" ) #gfx1030" ) #gfx906" ) # gfx1030" ) + parser.add_argument('-a', '--architecture', dest='gpu_architecture', required=False, default=default_gpus, #:sramecc+:xnack-" ) #gfx1030" ) #gfx906" ) # gfx1030" ) help='Set GPU architectures, e.g. all, gfx000, gfx803, gfx906:xnack-;gfx1030;gfx1100 (optional, default: all)') parser.add_argument('-v', '--verbose', required=False, default=False, action='store_true', help='Verbose build (default: False)')