Skip to content

Commit

Permalink
make sure nvtx3 is used (#4937)
Browse files Browse the repository at this point in the history
  • Loading branch information
jtrmal authored Sep 16, 2024
1 parent 0aebdbe commit 22f36e5
Show file tree
Hide file tree
Showing 17 changed files with 17 additions and 17 deletions.
Original file line number Diff line number Diff line change
Expand Up @@ -26,7 +26,7 @@

#include "hipify.h"
#else
-#include <nvToolsExt.h>
+#include <nvtx3/nvToolsExt.h>
#endif

#include <mutex>
Expand Down
2 changes: 1 addition & 1 deletion src/cudadecoder/batched-threaded-nnet3-cuda-pipeline.cc
Original file line number Diff line number Diff line change
Expand Up @@ -31,7 +31,7 @@

#include "hipify.h"
#else
-#include <nvToolsExt.h>
+#include <nvtx3/nvToolsExt.h>
#endif

#include "base/kaldi-utils.h"
Expand Down
2 changes: 1 addition & 1 deletion src/cudadecoder/batched-threaded-nnet3-cuda-pipeline2.cc
Original file line number Diff line number Diff line change
Expand Up @@ -28,7 +28,7 @@

#include "hipify.h"
#else
-#include <nvToolsExt.h>
+#include <nvtx3/nvToolsExt.h>
#endif

namespace kaldi {
Expand Down
2 changes: 1 addition & 1 deletion src/cudadecoder/cuda-decoder.cc
Original file line number Diff line number Diff line change
Expand Up @@ -44,7 +44,7 @@
#include "hipify.h"
#else
#include <cuda_runtime_api.h>
-#include <nvToolsExt.h>
+#include <nvtx3/nvToolsExt.h>
#endif

#include "base/kaldi-utils.h"
Expand Down
2 changes: 1 addition & 1 deletion src/cudadecoder/cuda-fst.cc
Original file line number Diff line number Diff line change
Expand Up @@ -29,7 +29,7 @@
#include "hipify.h"
#else
#include <cuda_runtime_api.h>
-#include <nvToolsExt.h>
+#include <nvtx3/nvToolsExt.h>
#endif

namespace kaldi {
Expand Down
2 changes: 1 addition & 1 deletion src/cudadecoderbin/batched-wav-nnet3-cuda-online.cc
Original file line number Diff line number Diff line change
Expand Up @@ -30,7 +30,7 @@
#else
#include <cuda.h>
#include <cuda_profiler_api.h>
-#include <nvToolsExt.h>
+#include <nvtx3/nvToolsExt.h>
#endif

#include <algorithm>
Expand Down
2 changes: 1 addition & 1 deletion src/cudadecoderbin/batched-wav-nnet3-cuda.cc
Original file line number Diff line number Diff line change
Expand Up @@ -24,7 +24,7 @@
#else
#include <cuda.h>
#include <cuda_profiler_api.h>
-#include <nvToolsExt.h>
+#include <nvtx3/nvToolsExt.h>
#endif
#include <sstream>
#include "cudadecoder/batched-threaded-nnet3-cuda-pipeline.h"
Expand Down
2 changes: 1 addition & 1 deletion src/cudadecoderbin/batched-wav-nnet3-cuda2.cc
Original file line number Diff line number Diff line change
Expand Up @@ -27,7 +27,7 @@
#else
#include <cuda.h>
#include <cuda_profiler_api.h>
-#include <nvToolsExt.h>
+#include <nvtx3/nvToolsExt.h>
#endif

#include <sstream>
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -25,7 +25,7 @@
#include "hipify.h"
#else
#include <cub/cub.cuh>
-#include <nvToolsExt.h>
+#include <nvtx3/nvToolsExt.h>
#endif

#include "cudafeat/lane-desc.h"
Expand Down
2 changes: 1 addition & 1 deletion src/cudafeat/feature-spectral-cuda.cu
Original file line number Diff line number Diff line change
Expand Up @@ -24,7 +24,7 @@

#include "hipify.h"
#else
-#include <nvToolsExt.h>
+#include <nvtx3/nvToolsExt.h>
#include <cub/cub.cuh>
#endif

Expand Down
2 changes: 1 addition & 1 deletion src/cudafeat/feature-window-cuda.cu
Original file line number Diff line number Diff line change
Expand Up @@ -22,7 +22,7 @@

#include "hipify.h"
#else
-#include <nvToolsExt.h>
+#include <nvtx3/nvToolsExt.h>
#endif

#include "matrix/matrix-functions.h"
Expand Down
2 changes: 1 addition & 1 deletion src/cudafeat/online-batched-feature-pipeline-cuda.cc
Original file line number Diff line number Diff line change
Expand Up @@ -25,7 +25,7 @@

#include "hipify.h"
#else
-#include <nvToolsExt.h>
+#include <nvtx3/nvToolsExt.h>
#endif

namespace kaldi {
Expand Down
2 changes: 1 addition & 1 deletion src/cudafeat/online-ivector-feature-cuda.cc
Original file line number Diff line number Diff line change
Expand Up @@ -26,7 +26,7 @@
#endif
#define CUBLAS_FILL_MODE_LOWER HIPSOLVER_FILL_MODE_LOWER
#else
-#include <nvToolsExt.h>
+#include <nvtx3/nvToolsExt.h>
#endif
#endif

Expand Down
2 changes: 1 addition & 1 deletion src/cudafeatbin/compute-online-feats-batched-cuda.cc
Original file line number Diff line number Diff line change
Expand Up @@ -18,7 +18,7 @@
#if HAVE_CUDA
#ifndef __IS_HIP_COMPILE__
#include <cuda_profiler_api.h>
-#include <nvToolsExt.h>
+#include <nvtx3/nvToolsExt.h>
#endif
#endif

Expand Down
2 changes: 1 addition & 1 deletion src/cudafeatbin/compute-online-feats-cuda.cc
Original file line number Diff line number Diff line change
Expand Up @@ -17,7 +17,7 @@

#if HAVE_CUDA == 1
#ifndef __IS_HIP_COMPILE__
-#include <nvToolsExt.h>
+#include <nvtx3/nvToolsExt.h>
#endif
#endif
#include "base/kaldi-common.h"
Expand Down
2 changes: 1 addition & 1 deletion src/cudamatrix/cu-common.h
Original file line number Diff line number Diff line change
Expand Up @@ -44,7 +44,7 @@
#include <cuda_runtime_api.h>
#include <curand.h>
#include <cusparse.h>
-#include <nvToolsExt.h>
+#include <nvtx3/nvToolsExt.h>

#define GPU_WARP_SIZE 32
#define GPU_MAX_THREADS_PER_BLOCK 1024
Expand Down
2 changes: 1 addition & 1 deletion src/makefiles/cuda_64bit.mk
Original file line number Diff line number Diff line change
Expand Up @@ -16,4 +16,4 @@ CUDA_FLAGS = --compiler-options -fPIC --machine 64 -DHAVE_CUDA -DOPENFST_VER=$(O
CUDA_LDFLAGS += -L$(CUDATKDIR)/lib64/stubs -L$(CUDATKDIR)/lib64 -Wl,-rpath,$(CUDATKDIR)/lib64
CUDA_LDFLAGS += -L$(CUDATKDIR)/lib/stubs -L$(CUDATKDIR)/lib -Wl,-rpath,$(CUDATKDIR)/lib

-CUDA_LDLIBS += -lcuda -lcublas -lcusparse -lcusolver -lcudart -lcurand -lcufft -lnvToolsExt
+CUDA_LDLIBS += -lcuda -lcublas -lcusparse -lcusolver -lcudart -lcurand -lcufft

0 comments on commit 22f36e5

Please sign in to comment.