diff --git a/.github/ISSUE_TEMPLATE/bug_report.yml b/.github/ISSUE_TEMPLATE/bug_report.yml
index a97636edc..30cf78080 100644
--- a/.github/ISSUE_TEMPLATE/bug_report.yml
+++ b/.github/ISSUE_TEMPLATE/bug_report.yml
@@ -48,7 +48,7 @@ body:
attributes:
label: CUDA Versions
description:
- placeholder: e.g. CUDA 11.0, CUDA 12.2
+ placeholder: e.g. CUDA 11.2, CUDA 12.2
validations:
required: false
- type: input
diff --git a/.github/workflows/CMake.yml b/.github/workflows/CMake.yml
index 9975a424e..75e27cc0b 100644
--- a/.github/workflows/CMake.yml
+++ b/.github/workflows/CMake.yml
@@ -26,7 +26,7 @@ jobs:
# Multiplicative build matrix
matrix:
cudacxx:
- - cuda: "11.0"
+ - cuda: "11.2"
cuda_arch: "35"
hostcxx: gcc-8
os: ubuntu-20.04
diff --git a/.github/workflows/Draft-Release.yml b/.github/workflows/Draft-Release.yml
index 984d609c5..4570d15db 100644
--- a/.github/workflows/Draft-Release.yml
+++ b/.github/workflows/Draft-Release.yml
@@ -49,7 +49,7 @@ jobs:
cuda_arch: "35-real;90-real;90-virtual"
hostcxx: gcc-9
os: ubuntu-20.04
- - cuda: "11.0"
+ - cuda: "11.2"
cuda_arch: "35-real;80-real;80-virtual"
hostcxx: gcc-8
os: ubuntu-20.04
@@ -202,7 +202,7 @@ jobs:
cuda_arch: "35-real;90-real;90-virtual"
hostcxx: "Visual Studio 16 2019"
os: windows-2019
- - cuda: "11.0.3"
+ - cuda: "11.2.2"
cuda_arch: "35-real;80-real;80-virtual"
hostcxx: "Visual Studio 16 2019"
os: windows-2019
diff --git a/.github/workflows/Ubuntu.yml b/.github/workflows/Ubuntu.yml
index 9e70d44d3..f19549283 100644
--- a/.github/workflows/Ubuntu.yml
+++ b/.github/workflows/Ubuntu.yml
@@ -37,7 +37,7 @@ jobs:
cuda_arch: "35"
hostcxx: gcc-11
os: ubuntu-22.04
- - cuda: "11.0"
+ - cuda: "11.2"
cuda_arch: "35"
hostcxx: gcc-8
os: ubuntu-20.04
@@ -56,7 +56,7 @@ jobs:
exclude:
# Exclude VIS=ON for oldest cuda.
- cudacxx:
- cuda: "11.0"
+ cuda: "11.2"
VISUALISATION: "ON"
# Exclude beltsoff builds for old cuda's
- cudacxx:
@@ -64,7 +64,7 @@ jobs:
config:
name: "Beltsoff"
- cudacxx:
- cuda: "11.0"
+ cuda: "11.2"
config:
name: "Beltsoff"
# Exclude beltsoff vis builds to keep the matrix lighter.
diff --git a/.github/workflows/Windows-Tests.yml b/.github/workflows/Windows-Tests.yml
index 4762c62e7..284976693 100644
--- a/.github/workflows/Windows-Tests.yml
+++ b/.github/workflows/Windows-Tests.yml
@@ -31,7 +31,7 @@ jobs:
cuda_arch: "35"
hostcxx: "Visual Studio 17 2022"
os: windows-2022
- - cuda: "11.0.3"
+ - cuda: "11.2.2"
cuda_arch: "35"
hostcxx: "Visual Studio 16 2019"
os: windows-2019
diff --git a/.github/workflows/Windows.yml b/.github/workflows/Windows.yml
index 303861e60..5f4bdcd02 100644
--- a/.github/workflows/Windows.yml
+++ b/.github/workflows/Windows.yml
@@ -37,7 +37,7 @@ jobs:
cuda_arch: "35"
hostcxx: "Visual Studio 17 2022"
os: windows-2022
- - cuda: "11.0.3"
+ - cuda: "11.2.2"
cuda_arch: "35"
hostcxx: "Visual Studio 16 2019"
os: windows-2019
@@ -56,7 +56,7 @@ jobs:
exclude:
# Exclude VIS=ON for oldest cuda.
- cudacxx:
- cuda: "11.0.3"
+ cuda: "11.2.2"
VISUALISATION: "ON"
# Exclude beltsoff builds for old cuda's
- cudacxx:
@@ -64,7 +64,7 @@ jobs:
config:
name: "Beltsoff"
- cudacxx:
- cuda: "11.0.3"
+ cuda: "11.2.2"
config:
name: "Beltsoff"
# Exclude beltsoff vis builds to keep the matrix lighter.
diff --git a/CMakeLists.txt b/CMakeLists.txt
index f634809aa..d004369bf 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -49,10 +49,15 @@ if(CMAKE_CUDA_COMPILER)
flamegpu_set_cuda_architectures()
endif()
-# Set the minimum supported version of CUDA for FLAME GPU, currently 11.0
-set(MINIMUM_SUPPORTED_CUDA_VERSION 11.0)
-# Set the minimum, usable, but deprecated CUDA version. Currently there are no deprecated versions
+# Set the minimum supported version of CUDA for FLAME GPU, currently 11.2
+set(MINIMUM_SUPPORTED_CUDA_VERSION 11.2)
+# Set the minimum, potentially usable, but unsupported CUDA version.
+# Currently 11.0 on linux and 11.1 on windows (due to CCCL support).
+# CUDA 11.1 is not supported to simplify python releases
set(MINIMUM_CUDA_VERSION 11.0)
+if(WIN32)
+ set(MINIMUM_CUDA_VERSION 11.1)
+endif()
# If the CUDA compiler is too old, trigger a docs only build.
if(CMAKE_CUDA_COMPILER_VERSION VERSION_LESS ${MINIMUM_CUDA_VERSION})
@@ -60,9 +65,9 @@ if(CMAKE_CUDA_COMPILER_VERSION VERSION_LESS ${MINIMUM_CUDA_VERSION})
message(STATUS "Documentation-only build: CUDA ${MINIMUM_SUPPORTED_CUDA_VERSION} or greater is required for compilation.")
endif()
-# If the CUDA compiler is atleast the minimum deprecated version, but less than the minimum actually supported version, issue a dev warning.
+# If the CUDA compiler is at least the minimum (unsupported) version, but less than the minimum actually supported version, issue a warning.
if(CMAKE_CUDA_COMPILER_VERSION VERSION_GREATER_EQUAL ${MINIMUM_CUDA_VERSION} AND CMAKE_CUDA_COMPILER_VERSION VERSION_LESS ${MINIMUM_SUPPORTED_CUDA_VERSION})
- message(DEPRECATION "Support for CUDA verisons <= ${MINIMUM_SUPPORTED_CUDA_VERSION} is deprecated and will be removed in a future release.")
+ message(WARNING "CUDA versions >= ${MINIMUM_CUDA_VERSION} && < ${MINIMUM_SUPPORTED_CUDA_VERSION} are unsupported buy may work on some platforms.")
endif()
# If CUDA is not available, or the minimum version is too low only build the docs.
@@ -78,7 +83,7 @@ endif()
# include for dependent modules
include(CMakeDependentOption)
-# Option to enable building all examples, defaults to ON if FLAMEPGU is the top level cmake, else OFF
+# Option to enable building all examples, defaults to ON if FLAMEGPU is the top level cmake, else OFF
cmake_dependent_option(FLAMEGPU_BUILD_ALL_EXAMPLES "Enable building all FLAMEGPU examples" ON "FLAMEGPU_PROJECT_IS_TOP_LEVEL" OFF)
# Options to enable building individual examples, if FLAMEGPU_BUILD_ALL_EXAMPLES is off.
diff --git a/README.md b/README.md
index 323e855f3..060144de9 100644
--- a/README.md
+++ b/README.md
@@ -63,7 +63,8 @@ Building FLAME GPU has the following requirements. There are also optional depen
+ [CMake](https://cmake.org/download/) `>= 3.18`
+ `>= 3.20` if building python bindings using a multi-config generator (Visual Studio, Eclipse or Ninja Multi-Config)
-+ [CUDA](https://developer.nvidia.com/cuda-downloads) `>= 11.0` and a [Compute Capability](https://developer.nvidia.com/cuda-gpus) `>= 3.5` NVIDIA GPU.
++ [CUDA](https://developer.nvidia.com/cuda-downloads) `>= 11.2` and a [Compute Capability](https://developer.nvidia.com/cuda-gpus) `>= 3.5` NVIDIA GPU.
+tab=readme-ov-file#cuda-toolkit-ctk-compatibility).
+ C++17 capable C++ compiler (host), compatible with the installed CUDA version
+ [Microsoft Visual Studio 2019 or 2022](https://visualstudio.microsoft.com/) (Windows)
+ *Note:* Visual Studio must be installed before the CUDA toolkit is installed. See the [CUDA installation guide for Windows](https://docs.nvidia.com/cuda/cuda-installation-guide-microsoft-windows/index.html) for more information.
@@ -242,7 +243,7 @@ Several environmental variables are used or required by FLAME GPU 2.
| Environment Variable | Description |
|--------------------------------------|-------------|
-| `CUDA_PATH` | Required when using RunTime Compilation (RTC), pointing to the root of the CUDA Toolkit where NVRTC resides.
i.e. `/usr/local/cuda-11.0/` or `C:/Program Files/NVIDIA GPU Computing Toolkit/CUDA/v11.0`.
Alternatively `CUDA_HOME` may be used if `CUDA_PATH` was not set. |
+| `CUDA_PATH` | Required when using RunTime Compilation (RTC), pointing to the root of the CUDA Toolkit where NVRTC resides.
i.e. `/usr/local/cuda-11.2/` or `C:/Program Files/NVIDIA GPU Computing Toolkit/CUDA/v11.2`.
Alternatively `CUDA_HOME` may be used if `CUDA_PATH` was not set. |
| `FLAMEGPU_INC_DIR` | When RTC compilation is required, if the location of the `include` directory cannot be found it must be specified using the `FLAMEGPU_INC_DIR` environment variable. |
| `FLAMEGPU_TMP_DIR` | FLAME GPU may cache some files to a temporary directory on the system, using the temporary directory returned by [`std::filesystem::temp_directory_path`](https://en.cppreference.com/w/cpp/filesystem/temp_directory_path). The location can optionally be overridden using the `FLAMEGPU_TMP_DIR` environment variable. |
| `FLAMEGPU_RTC_INCLUDE_DIRS` | A list of include directories that should be provided to the RTC compiler, these should be separated using `;` (Windows) or `:` (Linux). If this variable is not found, the working directory will be used as a default. |
@@ -362,6 +363,3 @@ For a full list of known issues pleases see the [Issue Tracker](https://github.c
+ Warnings and a loss of performance due to hash collisions in device code ([#356](https://github.com/FLAMEGPU/FLAMEGPU2/issues/356))
+ Multiple known areas where performance can be improved (e.g. [#449](https://github.com/FLAMEGPU/FLAMEGPU2/issues/449), [#402](https://github.com/FLAMEGPU/FLAMEGPU2/issues/402))
-+ Windows/MSVC builds using CUDA 11.0 may encounter errors when performing incremental builds if the static library has been recompiled. If this presents itself, re-save any `.cu` file in your executable producing project and re-trigger the build.
-+ Debug builds under linux with CUDA 11.0 may encounter cuda errors during `validateIDCollisions`. Consider using an alternate CUDA version if this is required ([#569](https://github.com/FLAMEGPU/FLAMEGPU2/issues/569)).
-+ CUDA 11.0 with GCC 9 may encounter a segmentation fault during compilation of the test suite. Consider using GCC 8 with CUDA 11.0.
\ No newline at end of file
diff --git a/cmake/CUDAArchitectures.cmake b/cmake/CUDAArchitectures.cmake
index 27963a332..84eea2418 100644
--- a/cmake/CUDAArchitectures.cmake
+++ b/cmake/CUDAArchitectures.cmake
@@ -215,7 +215,7 @@ function(flamegpu_set_cuda_architectures)
endif()
message(AUTHOR_WARNING
" ${CMAKE_CURRENT_FUNCTION} failed to parse NVCC --help output for default architecture generation\n"
- " Using ${default_archs} based on CUDA 11.0 to 11.8."
+ " Using ${default_archs} based on CUDA 11.2 to 11.8."
)
endif()
# We actually want real for each arch, then virtual for the final, but only for library-provided values, to only embed one arch worth of ptx.
diff --git a/cmake/common.cmake b/cmake/common.cmake
index f1ed88a17..408ac0a0d 100644
--- a/cmake/common.cmake
+++ b/cmake/common.cmake
@@ -134,22 +134,26 @@ if(FLAMEGPU_ENABLE_NVTX)
endif()
endif(FLAMEGPU_ENABLE_NVTX)
-# Set the minimum supported cuda version, if not already set. Currently duplicated due to docs only build logic.
-# CUDA 11.0 is current minimum cuda version, and the minimum supported
+# Set the minimum unsupported and minimum supported cuda version, if not already set.
+# Currently duplicated due to docs only build logic.
+# CUDA 11.0/11.1 is current minimum (unsupported but usable) cuda version
if(NOT DEFINED MINIMUM_CUDA_VERSION)
set(MINIMUM_CUDA_VERSION 11.0)
+ if(WIN32)
+ set(MINIMUM_CUDA_VERSION 11.1)
+ endif()
# Require a minimum cuda version
if(CMAKE_CUDA_COMPILER_VERSION VERSION_LESS ${MINIMUM_CUDA_VERSION})
message(FATAL_ERROR "CUDA version must be at least ${MINIMUM_CUDA_VERSION}")
endif()
endif()
-# CUDA 11.0 is the current minimum supported version.
+# CUDA 11.2 is the current minimum supported version.
if(NOT DEFINED MINIMUM_SUPPORTED_CUDA_VERSION)
- set(MINIMUM_SUPPORTED_CUDA_VERSION 11.0)
+ set(MINIMUM_SUPPORTED_CUDA_VERSION 11.2)
# Warn on deprecated cuda version.
# If the CUDA compiler is atleast the minimum deprecated version, but less than the minimum actually supported version, issue a dev warning.
if(CMAKE_CUDA_COMPILER_VERSION VERSION_GREATER_EQUAL ${MINIMUM_CUDA_VERSION} AND CMAKE_CUDA_COMPILER_VERSION VERSION_LESS ${MINIMUM_SUPPORTED_CUDA_VERSION})
- message(DEPRECATION "Support for CUDA verisons <= ${MINIMUM_SUPPORTED_CUDA_VERSION} is deprecated and will be removed in a future release.")
+ message(WARNING "CUDA versions >= ${MINIMUM_CUDA_VERSION} && < ${MINIMUM_SUPPORTED_CUDA_VERSION} are unsupported buy may work on some platforms.")
endif()
endif()
diff --git a/src/flamegpu/detail/compute_capability.cu b/src/flamegpu/detail/compute_capability.cu
index cfd8f3e12..2f38c69c1 100644
--- a/src/flamegpu/detail/compute_capability.cu
+++ b/src/flamegpu/detail/compute_capability.cu
@@ -71,8 +71,8 @@ std::vector compute_capability::getNVRTCSupportedComputeCapabilties() {
}
// If any of the above functions failed, we have no idea what arch's are supported, so assume none are?
return {};
-// Older CUDA's do not support this, but this is simple to hard-code for CUDA 11.0/11.1 (and our deprected CUDA 10.x).
-// CUDA 11.1 suports 35 to 86
+// Older CUDA's do not support this, but this is simple to hard-code for CUDA 11.0/11.1 (and our CUDA 10.x).
+// CUDA 11.1 supports 35 to 86
#elif (__CUDACC_VER_MAJOR__ == 11) && __CUDACC_VER_MINOR__ == 1
return {35, 37, 50, 52, 53, 60, 61, 62, 70, 72, 75, 80, 86};
// CUDA 11.0 supports 35 to 80