Skip to content

Commit 49bcd9c

Browse files
committed
Add Windows build jobs to CI
1 parent e686d70 commit 49bcd9c

File tree

2 files changed

+18
-18
lines changed

2 files changed

+18
-18
lines changed

.github/workflows/build.yml

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -18,7 +18,7 @@ jobs:
1818
fail-fast: false
1919
matrix:
2020
os:
21-
["ubuntu-22.04"] # "windows-2025" # Disabled until solution/workaround for NVTX is present
21+
["ubuntu-22.04", "windows-2025"]
2222
# "ubuntu-24.04" # Postponed as long as testing against CUDA 12.1, needs 12.6+
2323
python: ["3.9", "3.10", "3.11", "3.12", "3.13"]
2424

@@ -55,9 +55,9 @@ jobs:
5555

5656
- name: Set up CUDA toolkit (Windows)
5757
if: runner.os == 'Windows'
58-
uses: Jimver/cuda-toolkit@master
58+
uses: Jimver/cuda-toolkit@v0.2.24 # https://github.com/Jimver/cuda-toolkit/issues/395
5959
with:
60-
cuda: "12.4.0"
60+
cuda: "12.8.1"
6161
method: "network"
6262

6363
- name: Install torch with CUDA support (Ubuntu)
@@ -66,7 +66,7 @@ jobs:
6666

6767
- name: Install torch with CUDA support (Windows)
6868
if: runner.os == 'Windows'
69-
run: python -m pip install torch --index-url https://download.pytorch.org/whl/cu124
69+
run: python -m pip install torch --index-url https://download.pytorch.org/whl/cu128
7070

7171
- name: Install torchhull
7272
run: python -m pip install --editable ".[dev]"

src/torchhull/_C/src/gaussian_blur_cuda.cu

Lines changed: 14 additions & 14 deletions
Original file line number | Diff line number | Diff line change
@@ -447,6 +447,20 @@ gaussian_blur_cuda_sparse(const torch::Tensor& images,
447447
dim3 grid_convolution;
448448
at::cuda::getApplyGrid(M, grid_convolution, images.device().index(), threads_per_block);
449449

450+
#define CASE_TILE_CONVOLUTION_KERNEL_SPECIALIZED(KERNEL_SIZE) \
451+
case KERNEL_SIZE: \
452+
{ \
453+
tile_convolution_kernel_specialized<KERNEL_SIZE><<<grid_convolution, threads, 0, stream>>>(tile_indices_, \
454+
M, \
455+
tile_size, \
456+
sigma, \
457+
images_, \
458+
blurred_images_); \
459+
DEFER(AT_CUDA_CHECK(cudaGetLastError());) \
460+
DEFER(AT_CUDA_CHECK(cudaStreamSynchronize(stream));) \
461+
} \
462+
break;
463+
450464
AT_DISPATCH_ALL_TYPES_AND(
451465
torch::ScalarType::Half,
452466
images.scalar_type(),
@@ -464,20 +478,6 @@ gaussian_blur_cuda_sparse(const torch::Tensor& images,
464478
auto blurred_images_ =
465479
blurred_images.packed_accessor64<scalar_t, 4, torch::RestrictPtrTraits>();
466480

467-
#define CASE_TILE_CONVOLUTION_KERNEL_SPECIALIZED(KERNEL_SIZE) \
468-
case KERNEL_SIZE: \
469-
{ \
470-
tile_convolution_kernel_specialized<KERNEL_SIZE><<<grid_convolution, threads, 0, stream>>>(tile_indices_, \
471-
M, \
472-
tile_size, \
473-
sigma, \
474-
images_, \
475-
blurred_images_); \
476-
DEFER(AT_CUDA_CHECK(cudaGetLastError());) \
477-
DEFER(AT_CUDA_CHECK(cudaStreamSynchronize(stream));) \
478-
} \
479-
break;
480-
481481
switch (kernel_size)
482482
{
483483
// Tested all possible values up to 21 for specialization.

0 commit comments

Comments
 (0)