Skip to content

Commit 22f36e5

Browse files
authored
make sure nvtx3 is used (#4937)
1 parent 0aebdbe commit 22f36e5

17 files changed: +17 -17 lines changed

src/cudadecoder/batched-threaded-nnet3-cuda-online-pipeline.cc

+1-1
Original file line numberDiff line numberDiff line change
@@ -26,7 +26,7 @@
2626

2727
#include "hipify.h"
2828
#else
29-
#include <nvToolsExt.h>
29+
#include <nvtx3/nvToolsExt.h>
3030
#endif
3131

3232
#include <mutex>

src/cudadecoder/batched-threaded-nnet3-cuda-pipeline.cc

+1-1
Original file line numberDiff line numberDiff line change
@@ -31,7 +31,7 @@
3131

3232
#include "hipify.h"
3333
#else
34-
#include <nvToolsExt.h>
34+
#include <nvtx3/nvToolsExt.h>
3535
#endif
3636

3737
#include "base/kaldi-utils.h"

src/cudadecoder/batched-threaded-nnet3-cuda-pipeline2.cc

+1-1
Original file line numberDiff line numberDiff line change
@@ -28,7 +28,7 @@
2828

2929
#include "hipify.h"
3030
#else
31-
#include <nvToolsExt.h>
31+
#include <nvtx3/nvToolsExt.h>
3232
#endif
3333

3434
namespace kaldi {

src/cudadecoder/cuda-decoder.cc

+1-1
Original file line numberDiff line numberDiff line change
@@ -44,7 +44,7 @@
4444
#include "hipify.h"
4545
#else
4646
#include <cuda_runtime_api.h>
47-
#include <nvToolsExt.h>
47+
#include <nvtx3/nvToolsExt.h>
4848
#endif
4949

5050
#include "base/kaldi-utils.h"

src/cudadecoder/cuda-fst.cc

+1-1
Original file line numberDiff line numberDiff line change
@@ -29,7 +29,7 @@
2929
#include "hipify.h"
3030
#else
3131
#include <cuda_runtime_api.h>
32-
#include <nvToolsExt.h>
32+
#include <nvtx3/nvToolsExt.h>
3333
#endif
3434

3535
namespace kaldi {

src/cudadecoderbin/batched-wav-nnet3-cuda-online.cc

+1-1
Original file line numberDiff line numberDiff line change
@@ -30,7 +30,7 @@
3030
#else
3131
#include <cuda.h>
3232
#include <cuda_profiler_api.h>
33-
#include <nvToolsExt.h>
33+
#include <nvtx3/nvToolsExt.h>
3434
#endif
3535

3636
#include <algorithm>

src/cudadecoderbin/batched-wav-nnet3-cuda.cc

+1-1
Original file line numberDiff line numberDiff line change
@@ -24,7 +24,7 @@
2424
#else
2525
#include <cuda.h>
2626
#include <cuda_profiler_api.h>
27-
#include <nvToolsExt.h>
27+
#include <nvtx3/nvToolsExt.h>
2828
#endif
2929
#include <sstream>
3030
#include "cudadecoder/batched-threaded-nnet3-cuda-pipeline.h"

src/cudadecoderbin/batched-wav-nnet3-cuda2.cc

+1-1
Original file line numberDiff line numberDiff line change
@@ -27,7 +27,7 @@
2727
#else
2828
#include <cuda.h>
2929
#include <cuda_profiler_api.h>
30-
#include <nvToolsExt.h>
30+
#include <nvtx3/nvToolsExt.h>
3131
#endif
3232

3333
#include <sstream>

src/cudafeat/feature-online-batched-spectral-cuda-kernels.cu

+1-1
Original file line numberDiff line numberDiff line change
@@ -25,7 +25,7 @@
2525
#include "hipify.h"
2626
#else
2727
#include <cub/cub.cuh>
28-
#include <nvToolsExt.h>
28+
#include <nvtx3/nvToolsExt.h>
2929
#endif
3030

3131
#include "cudafeat/lane-desc.h"

src/cudafeat/feature-spectral-cuda.cu

+1-1
Original file line numberDiff line numberDiff line change
@@ -24,7 +24,7 @@
2424

2525
#include "hipify.h"
2626
#else
27-
#include <nvToolsExt.h>
27+
#include <nvtx3/nvToolsExt.h>
2828
#include <cub/cub.cuh>
2929
#endif
3030

src/cudafeat/feature-window-cuda.cu

+1-1
Original file line numberDiff line numberDiff line change
@@ -22,7 +22,7 @@
2222

2323
#include "hipify.h"
2424
#else
25-
#include <nvToolsExt.h>
25+
#include <nvtx3/nvToolsExt.h>
2626
#endif
2727

2828
#include "matrix/matrix-functions.h"

src/cudafeat/online-batched-feature-pipeline-cuda.cc

+1-1
Original file line numberDiff line numberDiff line change
@@ -25,7 +25,7 @@
2525

2626
#include "hipify.h"
2727
#else
28-
#include <nvToolsExt.h>
28+
#include <nvtx3/nvToolsExt.h>
2929
#endif
3030

3131
namespace kaldi {

src/cudafeat/online-ivector-feature-cuda.cc

+1-1
Original file line numberDiff line numberDiff line change
@@ -26,7 +26,7 @@
2626
#endif
2727
#define CUBLAS_FILL_MODE_LOWER HIPSOLVER_FILL_MODE_LOWER
2828
#else
29-
#include <nvToolsExt.h>
29+
#include <nvtx3/nvToolsExt.h>
3030
#endif
3131
#endif
3232

src/cudafeatbin/compute-online-feats-batched-cuda.cc

+1-1
Original file line numberDiff line numberDiff line change
@@ -18,7 +18,7 @@
1818
#if HAVE_CUDA
1919
#ifndef __IS_HIP_COMPILE__
2020
#include <cuda_profiler_api.h>
21-
#include <nvToolsExt.h>
21+
#include <nvtx3/nvToolsExt.h>
2222
#endif
2323
#endif
2424

src/cudafeatbin/compute-online-feats-cuda.cc

+1-1
Original file line numberDiff line numberDiff line change
@@ -17,7 +17,7 @@
1717

1818
#if HAVE_CUDA == 1
1919
#ifndef __IS_HIP_COMPILE__
20-
#include <nvToolsExt.h>
20+
#include <nvtx3/nvToolsExt.h>
2121
#endif
2222
#endif
2323
#include "base/kaldi-common.h"

src/cudamatrix/cu-common.h

+1-1
Original file line numberDiff line numberDiff line change
@@ -44,7 +44,7 @@
4444
#include <cuda_runtime_api.h>
4545
#include <curand.h>
4646
#include <cusparse.h>
47-
#include <nvToolsExt.h>
47+
#include <nvtx3/nvToolsExt.h>
4848

4949
#define GPU_WARP_SIZE 32
5050
#define GPU_MAX_THREADS_PER_BLOCK 1024

src/makefiles/cuda_64bit.mk

+1-1
Original file line numberDiff line numberDiff line change
@@ -16,4 +16,4 @@ CUDA_FLAGS = --compiler-options -fPIC --machine 64 -DHAVE_CUDA -DOPENFST_VER=$(O
1616
CUDA_LDFLAGS += -L$(CUDATKDIR)/lib64/stubs -L$(CUDATKDIR)/lib64 -Wl,-rpath,$(CUDATKDIR)/lib64
1717
CUDA_LDFLAGS += -L$(CUDATKDIR)/lib/stubs -L$(CUDATKDIR)/lib -Wl,-rpath,$(CUDATKDIR)/lib
1818

19-
CUDA_LDLIBS += -lcuda -lcublas -lcusparse -lcusolver -lcudart -lcurand -lcufft -lnvToolsExt
19+
CUDA_LDLIBS += -lcuda -lcublas -lcusparse -lcusolver -lcudart -lcurand -lcufft

0 commit comments

Comments (0)