Skip to content

Commit cf6d921

Browse files
committed
Use sm120a. Update vendored cutlass version to the same version DeepGEMM
is vendoring. Update .gitignore.
1 parent 61b05dc commit cf6d921

File tree

3 files changed

+11
-2
lines changed

3 files changed

+11
-2
lines changed

.gitignore

Lines changed: 9 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -42,12 +42,21 @@ lcov-report/
4242

4343
# Build Artifacts
4444

45+
llama.pc
46+
DartConfiguration.tcl
47+
CMakeCache.txt
4548
tags
4649
.build/
4750
build*
4851
release
4952
debug
5053
!build-info.cmake
54+
tests/CTestTestfile.cmake
55+
tests/cmake_install.cmake
56+
**/*.cmake
57+
tests/*.cmake
58+
**/Makefile
59+
**/CMakeFiles
5160
!build-info.cpp.in
5261
!build-info.sh
5362
!build.zig

ggml/src/ggml-cuda/CMakeLists.txt

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -81,7 +81,7 @@ if (CUDAToolkit_FOUND)
8181
)
8282
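# Compile this TU for SM120a (changed from SM100a in this commit). NOTE(review): the original rationale, "TCGen05 TMEM/WGMMA is only available on SM100/SM101/SM110", was written for the SM100a target and should be re-checked against SM120a.
8383
# NOTE(review): architecture-specific ("a") targets are not forward-compatible across compute capabilities, so the earlier claim that the binary "remains forward-compatible with SM120 GPUs" did not hold for SM100a; with "120a" the binary targets SM120 GPUs directly.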
84-
set_property(TARGET deepgemm_kernels PROPERTY CUDA_ARCHITECTURES "100a")
84+
set_property(TARGET deepgemm_kernels PROPERTY CUDA_ARCHITECTURES "120a")
8585
set_property(TARGET deepgemm_kernels PROPERTY POSITION_INDEPENDENT_CODE ON)
8686
target_include_directories(deepgemm_kernels PRIVATE
8787
${CMAKE_SOURCE_DIR}/ggml/include

ggml/src/ggml-cuda/vendors/cutlass

Submodule cutlass updated 221 files

0 commit comments

Comments
 (0)