From 27db0adfb8414eb91ea38c594d562d84a1d3981f Mon Sep 17 00:00:00 2001 From: Bernhard Merkle Date: Tue, 11 Nov 2025 03:29:14 +0100 Subject: [PATCH] Fix CUDA compiler flags in cuda_init.py - Option -O3 was passed twice, so I removed the duplicate. - Under Windows, the CUDA compiler reports this as a command-line option error, so this is actually a small bug. --- xlstm/blocks/slstm/src/cuda_init.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/xlstm/blocks/slstm/src/cuda_init.py b/xlstm/blocks/slstm/src/cuda_init.py index bc02065..1fea2d4 100644 --- a/xlstm/blocks/slstm/src/cuda_init.py +++ b/xlstm/blocks/slstm/src/cuda_init.py @@ -101,7 +101,7 @@ def load(*, name, sources, extra_cflags=(), extra_cuda_cflags=(), **kwargs): "-res-usage", "--use_fast_math", "-O3", - "-Xptxas -O3", + "-Xptxas", "--extra-device-vectorization", *extra_cflags, *extra_cuda_cflags,