Skip to content

Commit 96aeb44

Browse files
authored
backend: build with CUDA compute 5.0 support by default (#3499)
Signed-off-by: Jared Van Bortel <[email protected]>
1 parent 29f2977 commit 96aeb44

File tree

3 files changed

+5
-4
lines changed

3 files changed

+5
-4
lines changed

.circleci/continue_config.yml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -1339,7 +1339,7 @@ jobs:
13391339
-DCMAKE_CXX_COMPILER_LAUNCHER=ccache \
13401340
-DCMAKE_CUDA_COMPILER_LAUNCHER=ccache \
13411341
-DKOMPUTE_OPT_DISABLE_VULKAN_VERSION_CHECK=ON \
1342-
-DCMAKE_CUDA_ARCHITECTURES='52-virtual;61-virtual;70-virtual;75-virtual'
1342+
-DCMAKE_CUDA_ARCHITECTURES='50-virtual;52-virtual;61-virtual;70-virtual;75-virtual'
13431343
cmake --build build -j$(nproc)
13441344
ccache -s
13451345
- run:
@@ -1458,7 +1458,7 @@ jobs:
14581458
-DCMAKE_CXX_COMPILER_LAUNCHER=ccache `
14591459
-DCMAKE_CUDA_COMPILER_LAUNCHER=ccache `
14601460
-DKOMPUTE_OPT_DISABLE_VULKAN_VERSION_CHECK=ON `
1461-
-DCMAKE_CUDA_ARCHITECTURES='52-virtual;61-virtual;70-virtual;75-virtual'
1461+
-DCMAKE_CUDA_ARCHITECTURES='50-virtual;52-virtual;61-virtual;70-virtual;75-virtual'
14621462
cmake --build build --parallel
14631463
ccache -s
14641464
- run:

gpt4all-backend/CMakeLists.txt

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -69,7 +69,7 @@ if (LLMODEL_CUDA)
6969
cmake_minimum_required(VERSION 3.18) # for CMAKE_CUDA_ARCHITECTURES
7070

7171
# Defaults must be set before enable_language(CUDA).
72-
# Keep this in sync with the arch list in ggml/src/CMakeLists.txt.
72+
# Keep this in sync with the arch list in ggml/src/CMakeLists.txt (plus 5.0 for non-F16 branch).
7373
if (NOT DEFINED CMAKE_CUDA_ARCHITECTURES)
7474
# 52 == lowest CUDA 12 standard
7575
# 60 == f16 CUDA intrinsics
@@ -78,7 +78,7 @@ if (LLMODEL_CUDA)
7878
if (GGML_CUDA_F16 OR GGML_CUDA_DMMV_F16)
7979
set(CMAKE_CUDA_ARCHITECTURES "60;61;70;75") # needed for f16 CUDA intrinsics
8080
else()
81-
set(CMAKE_CUDA_ARCHITECTURES "52;61;70;75") # lowest CUDA 12 standard + lowest for integer intrinsics
81+
set(CMAKE_CUDA_ARCHITECTURES "50;52;61;70;75") # lowest CUDA 12 standard + lowest for integer intrinsics
8282
#set(CMAKE_CUDA_ARCHITECTURES "OFF") # use this to compile much faster, but only F16 models work
8383
endif()
8484
endif()

gpt4all-chat/CHANGELOG.md

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -8,6 +8,7 @@ The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.1.0/).
88

99
### Added
1010
- Whitelist Granite (non-MoE) model architecture (by [@ThiloteE](https://github.com/ThiloteE) in [#3487](https://github.com/nomic-ai/gpt4all/pull/3487))
11+
- Add support for CUDA compute 5.0 GPUs such as the GTX 750 ([#3499](https://github.com/nomic-ai/gpt4all/pull/3499))
1112

1213
### Changed
1314
- Substitute prettier default templates for OLMoE 7B 0924/0125 and Granite 3.1 3B/8B (by [@ThiloteE](https://github.com/ThiloteE) in [#3471](https://github.com/nomic-ai/gpt4all/pull/3471))

0 commit comments

Comments
 (0)