diff --git a/dali/kernels/signal/CMakeLists.txt b/dali/kernels/signal/CMakeLists.txt
index 431ae39629..74ca2e8970 100644
--- a/dali/kernels/signal/CMakeLists.txt
+++ b/dali/kernels/signal/CMakeLists.txt
@@ -17,6 +17,7 @@ add_subdirectory(decibel)
 if (BUILD_FFTS)
   add_subdirectory(fft)
 endif()
+add_subdirectory(wavelet)
 add_subdirectory(window)
 
 collect_headers(DALI_INST_HDRS PARENT_SCOPE)
diff --git a/dali/kernels/signal/wavelet/CMakeLists.txt b/dali/kernels/signal/wavelet/CMakeLists.txt
new file mode 100644
index 0000000000..f3a24faa7c
--- /dev/null
+++ b/dali/kernels/signal/wavelet/CMakeLists.txt
@@ -0,0 +1,17 @@
+# Copyright (c) 2023, NVIDIA CORPORATION. All rights reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+collect_headers(DALI_INST_HDRS PARENT_SCOPE)
+collect_sources(DALI_KERNEL_SRCS PARENT_SCOPE)
+collect_test_sources(DALI_KERNEL_TEST_SRCS PARENT_SCOPE)
\ No newline at end of file
diff --git a/dali/kernels/signal/wavelet/cwt_args.h b/dali/kernels/signal/wavelet/cwt_args.h
new file mode 100644
index 0000000000..9a38b8d006
--- /dev/null
+++ b/dali/kernels/signal/wavelet/cwt_args.h
@@ -0,0 +1,36 @@
+// Copyright (c) 2019, NVIDIA CORPORATION. All rights reserved.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#ifndef DALI_KERNELS_SIGNAL_WAVELET_CWT_ARGS_H_
+#define DALI_KERNELS_SIGNAL_WAVELET_CWT_ARGS_H_
+
+#include <vector>
+#include "dali/operators/signal/wavelet/wavelet_name.h"
+
+namespace dali {
+namespace kernels {
+namespace signal {
+
+template <typename T = float>
+struct CwtArgs {  // Argument bundle taken by CwtGpu<T>::Run.
+  std::vector<T> a;  // `a` values; presumably the wavelet scales - TODO confirm
+  dali::DALIWaveletName wavelet;  // identifies the wavelet to use
+  std::vector<T> wavelet_args;  // extra wavelet parameters; presumably specific to `wavelet`
+};
+
+}  // namespace signal
+}  // namespace kernels
+}  // namespace dali
+
+#endif  // DALI_KERNELS_SIGNAL_WAVELET_CWT_ARGS_H_
diff --git a/dali/kernels/signal/wavelet/cwt_gpu.cu b/dali/kernels/signal/wavelet/cwt_gpu.cu
new file mode 100644
index 0000000000..cfca159483
--- /dev/null
+++ b/dali/kernels/signal/wavelet/cwt_gpu.cu
@@ -0,0 +1,96 @@
+// Copyright (c) 2020-2021, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#include <cmath>
+#include <complex>
+#include <vector>
+#include "dali/core/common.h"
+#include "dali/core/error_handling.h"
+#include "dali/core/format.h"
+#include "dali/kernels/kernel.h"
+#include "dali/kernels/signal/wavelet/cwt_args.h"
+#include "dali/kernels/signal/wavelet/cwt_gpu.h"
+
+namespace dali {
+namespace kernels {
+namespace signal {
+
+// SampleDesc and CwtKernel are private to this translation unit. They live in an unnamed
+// namespace because another header in dali::kernels::signal defines a different struct that is
+// also named SampleDesc; sharing the qualified name would violate the one-definition rule.
+namespace {
+
+// Describes one sample processed by CwtKernel.
+template <typename T>
+struct SampleDesc {
+  const T *in = nullptr;  // input data
+  T *out = nullptr;       // output data, holds `size` elements
+  int64_t size = 0;       // number of elements in `in` and `out`
+};
+
+// Placeholder kernel: copies every input element of a sample to its output.
+// Launch layout: blockIdx.y selects the sample; the blocks along x cooperate on one sample and
+// stride over it, so any positive gridDim.x is valid. The block may be 1D or 2D.
+template <typename T>
+__global__ void CwtKernel(const SampleDesc<T> *sample_data) {
+  const int64_t block_size = blockDim.y * blockDim.x;
+  const int64_t stride = gridDim.x * block_size;
+  const auto sample = sample_data[blockIdx.y];
+  const int64_t tid = threadIdx.y * blockDim.x + threadIdx.x;
+
+  for (int64_t idx = block_size * blockIdx.x + tid; idx < sample.size; idx += stride) {
+    sample.out[idx] = sample.in[idx];
+  }
+}
+
+}  // namespace
+
+template <typename T>
+CwtGpu<T>::~CwtGpu() = default;  // out-of-line defaulted destructor
+
+// Reports the kernel requirements: the output has the same shape as the input, and scratch
+// space is reserved for one SampleDesc per sample both on the host and on the device.
+template <typename T>
+KernelRequirements CwtGpu<T>::Setup(KernelContext &context,
+                                    const InListGPU<T, DynamicDimensions> &in) {
+  const size_t sample_count = in.size();
+
+  ScratchpadEstimator estimator;
+  estimator.add<mm::memory_kind::host, SampleDesc<T>>(sample_count);
+  estimator.add<mm::memory_kind::device, SampleDesc<T>>(sample_count);
+
+  auto shape = in.shape;
+  KernelRequirements requirements;
+  requirements.scratch_sizes = estimator.sizes;
+  requirements.output_shapes = {shape};
+  return requirements;
+}
+
+// Runs the kernel on the stream in `context`. At present CwtKernel only copies each input
+// sample to the matching output sample; `args` is accepted but not used yet.
+// `out` must hold, for every sample, as many elements as `in` (checked by assert).
+template <typename T>
+void CwtGpu<T>::Run(KernelContext &context, const OutListGPU<T, DynamicDimensions> &out,
+                    const InListGPU<T, DynamicDimensions> &in, const CwtArgs<T> &args) {
+  auto num_samples = in.size();
+  // An empty batch has nothing to process; returning here also avoids the division by zero
+  // in the grid size computation and a launch with an empty grid.
+  if (num_samples == 0) {
+    return;
+  }
+  auto *sample_data = context.scratchpad->AllocateHost<SampleDesc<T>>(num_samples);
+
+  for (int i = 0; i < num_samples; i++) {
+    auto &sample = sample_data[i];
+    sample.out = out.tensor_data(i);
+    sample.in = in.tensor_data(i);
+    sample.size = volume(in.tensor_shape(i));
+    assert(sample.size == volume(out.tensor_shape(i)));
+  }
+
+  auto *sample_data_gpu = context.scratchpad->AllocateGPU<SampleDesc<T>>(num_samples);
+  CUDA_CALL(cudaMemcpyAsync(sample_data_gpu, sample_data, num_samples * sizeof(SampleDesc<T>),
+                            cudaMemcpyHostToDevice, context.gpu.stream));
+
+  // grid.x: blocks cooperating on one sample, grid.y: one row of blocks per sample
+  dim3 block(32, 32);
+  auto blocks_per_sample = std::max(32, 1024 / num_samples);
+  dim3 grid(blocks_per_sample, num_samples);
+  CwtKernel<T><<<grid, block, 0, context.gpu.stream>>>(sample_data_gpu);
+  // A kernel launch does not return a status; fetch configuration errors explicitly.
+  CUDA_CALL(cudaGetLastError());
+}
+
+template class CwtGpu<float>;
+template class CwtGpu<double>;
+
+}  // namespace signal
+}  // namespace kernels
+}  // namespace dali
diff --git a/dali/kernels/signal/wavelet/cwt_gpu.h b/dali/kernels/signal/wavelet/cwt_gpu.h
new file mode 100644
index 0000000000..35a494aca6
--- /dev/null
+++ b/dali/kernels/signal/wavelet/cwt_gpu.h
@@ -0,0 +1,48 @@
+// Copyright (c) 2020, NVIDIA CORPORATION. All rights reserved.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#ifndef DALI_KERNELS_SIGNAL_WAVELET_CWT_GPU_H_
+#define DALI_KERNELS_SIGNAL_WAVELET_CWT_GPU_H_
+
+#include <memory>
+#include "dali/core/common.h"
+#include "dali/core/error_handling.h"
+#include "dali/core/format.h"
+#include "dali/core/util.h"
+#include "dali/kernels/kernel.h"
+#include "dali/kernels/signal/wavelet/cwt_args.h"
+
+namespace dali {
+namespace kernels {
+namespace signal {
+
+template <typename T = float>
+class DLL_PUBLIC CwtGpu {  // GPU kernel class for the continuous wavelet transform (CWT)
+ public:
+  static_assert(std::is_floating_point<T>::value, "Only floating point types are supported");
+
+  DLL_PUBLIC ~CwtGpu();  // defined out of line
+
+  DLL_PUBLIC KernelRequirements Setup(KernelContext &context,  // returns the requirements for `in`
+                                      const InListGPU<T, DynamicDimensions> &in);
+
+  DLL_PUBLIC void Run(KernelContext &context, const OutListGPU<T, DynamicDimensions> &out,
+                      const InListGPU<T, DynamicDimensions> &in, const CwtArgs<T> &args);
+};
+
+}  // namespace signal
+}  // namespace kernels
+}  // namespace dali
+
+#endif  // DALI_KERNELS_SIGNAL_WAVELET_CWT_GPU_H_
diff --git a/dali/kernels/signal/wavelet/mother_wavelet.cu b/dali/kernels/signal/wavelet/mother_wavelet.cu
new file mode 100644
index 0000000000..232c183a0c
--- /dev/null
+++ b/dali/kernels/signal/wavelet/mother_wavelet.cu
@@ -0,0 +1,161 @@
+// Copyright (c) 2023, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#include <cmath>
+#include <vector>
+#include "dali/kernels/signal/wavelet/mother_wavelet.cuh"
+#include "dali/core/math_util.h"
+
+namespace dali {
+namespace kernels {
+namespace signal {
+
+// The Haar wavelet has no parameters, so a non-empty argument list is rejected
+// with std::invalid_argument.
+template <typename T>
+HaarWavelet<T>::HaarWavelet(const std::vector<T> &args) {
+  const bool has_arguments = !args.empty();
+  if (has_arguments)
+    throw std::invalid_argument("HaarWavelet doesn't accept any arguments.");
+}
+
+// Haar mother wavelet: 1 on [0, 0.5), -1 on [0.5, 1) and 0 everywhere else.
+template <typename T>
+__device__ T HaarWavelet<T>::operator()(const T &t) const {
+  const bool inside_support = 0.0 <= t && t < 1.0;
+  if (!inside_support) {
+    return 0.0;
+  }
+  return t < 0.5 ? 1.0 : -1.0;
+}
+
+template class HaarWavelet<float>;
+template class HaarWavelet<double>;
+
+// Builds a Gaussian wavelet from a single argument n, which selects one of the eight
+// formulas implemented by operator().
+// Throws std::invalid_argument when the argument count is not 1 or when n is not an
+// integer value from [1, 8].
+template <typename T>
+GaussianWavelet<T>::GaussianWavelet(const std::vector<T> &args) {
+  if (args.size() != 1) {
+    throw std::invalid_argument("GaussianWavelet accepts exactly one argument - n.");
+  }
+  const T order = args[0];
+  // The range test is written in its positive form so that NaN (for which every comparison
+  // is false) is rejected too; the floor test rejects fractional values such as 2.5.
+  const bool in_range = order >= 1.0 && order <= 8.0;
+  if (!in_range || std::floor(order) != order) {
+    throw std::invalid_argument(
+      "GaussianWavelet's argument n should be integer from range [1,8].");
+  }
+  this->n = order;
+}
+
+// Evaluates the Gaussian wavelet selected by n (1..8) at t: a polynomial in t multiplied by
+// exp(-t^2) and divided by a per-order normalization constant.
+// All arithmetic is done in T, so the float instantiation does not fall back to double math.
+// The polynomials are evaluated in Horner form in t^2. For an n outside 1..8 (which the
+// validating constructor never produces) the result is 0.
+template <typename T>
+__device__ T GaussianWavelet<T>::operator()(const T &t) const {
+  const T t2 = t * t;
+  const T expTerm = std::exp(-t2);
+  const T sqrtTerm = T(1.2533141373155001);  // std::sqrt(M_PI/2.0)
+  switch (static_cast<int>(n)) {
+  case 1:
+    return T(-2) * t * expTerm / std::sqrt(sqrtTerm);
+  case 2:
+    return (T(-4) * t2 + T(2)) * expTerm / std::sqrt(T(3) * sqrtTerm);
+  case 3:
+    return (T(8) * t2 - T(12)) * t * expTerm / std::sqrt(T(15) * sqrtTerm);
+  case 4:
+    return ((T(16) * t2 - T(48)) * t2 + T(12)) * expTerm / std::sqrt(T(105) * sqrtTerm);
+  case 5:
+    return ((T(-32) * t2 + T(160)) * t2 - T(120)) * t *
+              expTerm / std::sqrt(T(945) * sqrtTerm);
+  case 6:
+    return (((T(-64) * t2 + T(480)) * t2 - T(720)) * t2 + T(120)) *
+              expTerm / std::sqrt(T(10395) * sqrtTerm);
+  case 7:
+    return (((T(128) * t2 - T(1344)) * t2 + T(3360)) * t2 - T(1680)) * t *
+              expTerm / std::sqrt(T(135135) * sqrtTerm);
+  case 8:
+    return ((((T(256) * t2 - T(3584)) * t2 + T(13440)) * t2 - T(13440)) * t2 + T(1680)) *
+              expTerm / std::sqrt(T(2027025) * sqrtTerm);
+  default:
+    // Without this branch control would flow off the end of a non-void function.
+    return T(0);
+  }
+}
+
+template class GaussianWavelet<float>;
+template class GaussianWavelet<double>;
+
+// Builds a Mexican hat wavelet from a single argument sigma.
+// Throws std::invalid_argument when the argument count is not 1 or when sigma is not
+// positive: operator() divides by sigma and takes sqrt(3 * sigma), so zero, negative or NaN
+// values would only produce NaN/inf output.
+template <typename T>
+MexicanHatWavelet<T>::MexicanHatWavelet(const std::vector<T> &args) {
+  if (args.size() != 1) {
+    throw std::invalid_argument("MexicanHatWavelet accepts exactly one argument - sigma.");
+  }
+  // positive-form test, so NaN is rejected as well
+  if (!(args[0] > 0.0)) {
+    throw std::invalid_argument("MexicanHatWavelet's argument sigma should be positive.");
+  }
+  this->sigma = args[0];
+}
+
+// Evaluates 2 / (sqrt(3 * sigma) * pi^(1/4)) * (1 - (t/sigma)^2) * exp(-t^2 / (2 * sigma^2)).
+// All arithmetic is done in T, so the float instantiation does not fall back to double math.
+template <typename T>
+__device__ T MexicanHatWavelet<T>::operator()(const T &t) const {
+  const T u = t / sigma;
+  const T u2 = u * u;
+  // pi^(1/4) computed as two nested square roots
+  const T norm = T(2) / (std::sqrt(T(3) * sigma) * std::sqrt(std::sqrt(T(M_PI))));
+  return norm * (T(1) - u2) * std::exp(-u2 / T(2));
+}
+
+template class MexicanHatWavelet<float>;
+template class MexicanHatWavelet<double>;
+
+// This Morlet wavelet has no parameters, so a non-empty argument list is rejected
+// with std::invalid_argument.
+template <typename T>
+MorletWavelet<T>::MorletWavelet(const std::vector<T> &args) {
+  const bool has_arguments = !args.empty();
+  if (has_arguments)
+    throw std::invalid_argument("MorletWavelet doesn't accept any arguments.");
+}
+
+// Evaluates exp(-t^2 / 2) * cos(5 * t).
+// All arithmetic is done in T, so the float instantiation does not fall back to double math.
+template <typename T>
+__device__ T MorletWavelet<T>::operator()(const T &t) const {
+  return std::exp(-t * t / T(2)) * std::cos(T(5) * t);
+}
+
+template class MorletWavelet<float>;
+template class MorletWavelet<double>;
+
+// Builds a Shannon wavelet from two arguments: fb and fc, in that order.
+// Throws std::invalid_argument when the argument count is not 2 or when fb is not positive:
+// operator() takes sqrt(fb) and divides by t * fb * pi, so zero, negative or NaN values
+// would only produce NaN output.
+template <typename T>
+ShannonWavelet<T>::ShannonWavelet(const std::vector<T> &args) {
+  if (args.size() != 2) {
+    throw std::invalid_argument(
+      "ShannonWavelet accepts exactly 2 arguments -> fb, fc in that order.");
+  }
+  // positive-form test, so NaN is rejected as well
+  if (!(args[0] > 0.0)) {
+    throw std::invalid_argument("ShannonWavelet's argument fb should be positive.");
+  }
+  this->fb = args[0];
+  this->fc = args[1];
+}
+
+// Evaluates sqrt(fb) * cos(2 * pi * fc * t) * sin(pi * fb * t) / (pi * fb * t).
+// At t == 0 the last factor is skipped, which avoids evaluating 0 / 0.
+template <typename T>
+__device__ T ShannonWavelet<T>::operator()(const T &t) const {
+  const auto carrier = std::cos((T)(2.0*M_PI)*fc*t)*std::sqrt(fb);
+  if (t == 0.0) {
+    return carrier;
+  }
+  const auto x = t*fb*(T)(M_PI);
+  return carrier*std::sin(x)/x;
+}
+
+template class ShannonWavelet<float>;
+template class ShannonWavelet<double>;
+
+// Builds a frequency B-spline wavelet from three arguments: m, fb and fc, in that order.
+// Throws std::invalid_argument when the argument count is not 3, when m is not an integer
+// value >= 1, or when fb is not positive. operator() divides by m and raises a possibly
+// negative base to the power m (NaN for a fractional m), and it takes sqrt(fb).
+template <typename T>
+FbspWavelet<T>::FbspWavelet(const std::vector<T> &args) {
+  if (args.size() != 3) {
+    throw std::invalid_argument(
+      "FbspWavelet accepts exactly 3 arguments -> m, fb, fc in that order.");
+  }
+  // positive-form tests, so NaN is rejected as well
+  if (!(args[0] >= 1.0) || std::floor(args[0]) != args[0]) {
+    throw std::invalid_argument(
+      "FbspWavelet's argument m should be an integer not smaller than 1.");
+  }
+  if (!(args[1] > 0.0)) {
+    throw std::invalid_argument("FbspWavelet's argument fb should be positive.");
+  }
+  this->m = args[0];
+  this->fb = args[1];
+  this->fc = args[2];
+}
+
+// Evaluates sqrt(fb) * cos(2 * pi * fc * t) * (sin(x) / x)^m with x = pi * t * fb / m.
+// At t == 0 the last factor is skipped, which avoids evaluating 0 / 0.
+template <typename T>
+__device__ T FbspWavelet<T>::operator()(const T &t) const {
+  const auto carrier = std::cos((T)(2.0*M_PI)*fc*t)*std::sqrt(fb);
+  if (t == 0.0) {
+    return carrier;
+  }
+  const auto x = (T)(M_PI)*t*fb/m;
+  return carrier*std::pow(std::sin(x)/x, m);
+}
+
+template class FbspWavelet<float>;
+template class FbspWavelet<double>;
+
+}  // namespace signal
+}  // namespace kernels
+}  // namespace dali
diff --git a/dali/kernels/signal/wavelet/mother_wavelet.cuh b/dali/kernels/signal/wavelet/mother_wavelet.cuh
new file mode 100644
index 0000000000..9cbd81592b
--- /dev/null
+++ b/dali/kernels/signal/wavelet/mother_wavelet.cuh
@@ -0,0 +1,124 @@
+// Copyright (c) 2023, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#ifndef DALI_KERNELS_SIGNAL_WAVELET_MOTHER_WAVELET_CUH_
+#define DALI_KERNELS_SIGNAL_WAVELET_MOTHER_WAVELET_CUH_
+
+#include <vector>
+
+#include "dali/core/common.h"
+#include "dali/core/error_handling.h"
+#include "dali/core/format.h"
+#include "dali/core/util.h"
+#include "dali/kernels/kernel.h"
+
+namespace dali {
+namespace kernels {
+namespace signal {
+
+// wavelets are represented by functors
+// they can store any necessary parameters
+// they must overload () operator
+
+template <typename T>
+class HaarWavelet {  // functor for the Haar mother wavelet; holds no parameters
+  static_assert(std::is_floating_point<T>::value,
+    "Data type should be floating point");
+ public:
+  HaarWavelet() = default;
+  explicit HaarWavelet(const std::vector<T> &args);  // args: wavelet parameters
+  ~HaarWavelet() = default;
+
+  __device__ T operator()(const T &t) const;  // wavelet value at t; callable from device code
+};
+
+template <typename T>
+class GaussianWavelet {  // functor for the Gaussian mother wavelet
+  static_assert(std::is_floating_point<T>::value,
+    "Data type should be floating point");
+ public:
+  GaussianWavelet() = default;  // note: leaves `n` uninitialized
+  explicit GaussianWavelet(const std::vector<T> &args);  // args: wavelet parameters
+  ~GaussianWavelet() = default;
+
+  __device__ T operator()(const T &t) const;  // wavelet value at t; callable from device code
+ private:
+  T n;  // wavelet parameter `n`
+};
+
+template <typename T>
+class MexicanHatWavelet {  // functor for the Mexican hat mother wavelet
+  static_assert(std::is_floating_point<T>::value,
+    "Data type should be floating point");
+ public:
+  MexicanHatWavelet() = default;  // note: leaves `sigma` uninitialized
+  explicit MexicanHatWavelet(const std::vector<T> &args);  // args: wavelet parameters
+  ~MexicanHatWavelet() = default;
+
+  __device__ T operator()(const T &t) const;  // wavelet value at t; callable from device code
+
+ private:
+  T sigma;  // wavelet parameter `sigma`
+};
+
+template <typename T>
+class MorletWavelet {  // functor for the Morlet mother wavelet; holds no parameters
+  static_assert(std::is_floating_point<T>::value,
+    "Data type should be floating point");
+ public:
+  MorletWavelet() = default;
+  explicit MorletWavelet(const std::vector<T> &args);  // args: wavelet parameters
+  ~MorletWavelet() = default;
+
+  __device__ T operator()(const T &t) const;  // wavelet value at t; callable from device code
+};
+
+template <typename T>
+class ShannonWavelet {  // functor for the Shannon mother wavelet
+  static_assert(std::is_floating_point<T>::value,
+    "Data type should be floating point");
+ public:
+  ShannonWavelet() = default;  // note: leaves `fb` and `fc` uninitialized
+  explicit ShannonWavelet(const std::vector<T> &args);  // args: wavelet parameters
+  ~ShannonWavelet() = default;
+
+  __device__ T operator()(const T &t) const;  // wavelet value at t; callable from device code
+
+ private:
+  T fb;  // wavelet parameter `fb`
+  T fc;  // wavelet parameter `fc`
+};
+
+template <typename T>
+class FbspWavelet {  // functor for the Fbsp mother wavelet
+  static_assert(std::is_floating_point<T>::value,
+    "Data type should be floating point");
+ public:
+  FbspWavelet() = default;  // note: leaves `m`, `fb` and `fc` uninitialized
+  explicit FbspWavelet(const std::vector<T> &args);  // args: wavelet parameters
+  ~FbspWavelet() = default;
+
+  __device__ T operator()(const T &t) const;  // wavelet value at t; callable from device code
+
+ private:
+  T m;  // wavelet parameter `m`
+  T fb;  // wavelet parameter `fb`
+  T fc;  // wavelet parameter `fc`
+};
+
+}  // namespace signal
+}  // namespace kernels
+}  // namespace dali
+
+#endif  // DALI_KERNELS_SIGNAL_WAVELET_MOTHER_WAVELET_CUH_
diff --git a/dali/kernels/signal/wavelet/wavelet_gpu.cu b/dali/kernels/signal/wavelet/wavelet_gpu.cu
new file mode 100644
index 0000000000..a5ab81a5df
--- /dev/null
+++ b/dali/kernels/signal/wavelet/wavelet_gpu.cu
@@ -0,0 +1,161 @@
+// Copyright (c) 2023, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#include "dali/kernels/signal/wavelet/wavelet_gpu.cuh"
+#include <cmath>
+#include <complex>
+#include <vector>
+#include "dali/core/common.h"
+#include "dali/core/error_handling.h"
+#include "dali/core/format.h"
+#include "dali/kernels/kernel.h"
+#include "dali/kernels/signal/wavelet/mother_wavelet.cuh"
+#include "dali/core/tensor_shape.h"
+
+namespace dali {
+namespace kernels {
+namespace signal {
+
+// Computes wavelet values for every sample, every `a` and `b` coefficient and every time
+// point stored in sample.in:
+//   out[(a_idx * size_b + b_idx) * size_in + t_idx] = 2^(a/2) * wavelet(2^a * in[t_idx] - b)
+// Launch layout: blockIdx.z selects the sample, blockIdx.y selects the `a` coefficient and
+// the threads of the blocks along x cover the time points, one point per thread.
+// The host sizes grid.y and grid.x for the largest sample in the batch, so blocks and threads
+// that fall outside the current sample's `a` or time range exit without touching memory.
+// Each thread only uses values it computed itself, so they are kept in registers; no shared
+// memory and no block-wide barrier are needed.
+template <typename T, template <typename> class W >
+__global__ void ComputeWavelet(const SampleDesc<T>* sample_data, W<T> wavelet) {
+  const auto &sample = sample_data[blockIdx.z];
+  // this sample may have fewer `a` coefficients than the largest one in the batch
+  if (blockIdx.y >= sample.size_a) return;
+  // id inside block
+  const int64_t b_id = threadIdx.y * blockDim.x + threadIdx.x;
+  // wavelet sample id, computed in 64 bits to avoid overflow for very long inputs
+  const int64_t block_size = static_cast<int64_t>(blockDim.x) * blockDim.y;
+  const int64_t t_id = block_size * blockIdx.x + b_id;
+  if (t_id >= sample.size_in) return;
+
+  const T a = sample.a[blockIdx.y];
+  // For a == 0 both factors below equal 1, so no special case is needed.
+  const T scaled_t = std::pow(2.0, a) * sample.in[t_id];
+  const T norm = std::pow(2.0, a / 2.0);
+  const int64_t first_row = blockIdx.y * sample.size_b;
+  for (int64_t i = 0; i < sample.size_b; ++i) {
+    const int64_t out_id = (first_row + i) * sample.size_in + t_id;
+    sample.out[out_id] = wavelet(scaled_t - sample.b[i]) * norm;
+  }
+}
+
+// Fills sample.in with the time points described by the sample's span:
+//   in[k] = span.begin + k / span.sampling_rate   for k in [0, size_in)
+// blockIdx.y selects the sample; the threads of the blocks along x each write one point.
+template <typename T>
+__global__ void ComputeInputSamples(const SampleDesc<T>* sample_data) {
+  const auto &desc = sample_data[blockIdx.y];
+  const int64_t threads_per_block = blockDim.x * blockDim.y;
+  const int64_t k = threads_per_block * blockIdx.x + threadIdx.y * blockDim.x + threadIdx.x;
+  if (k < desc.size_in) {
+    desc.in[k] = desc.span.begin + (T)k / desc.span.sampling_rate;
+  }
+}
+
+// Validates the shapes of `a` and `b`, computes the output shape and constructs the wavelet
+// functor from `args`. The functor's constructor throws std::invalid_argument for arguments
+// it does not accept.
+template <typename T, template <typename> class W >
+DLL_PUBLIC KernelRequirements WaveletGpu<T, W>::Setup(KernelContext &context,
+                                                      const InListGPU<T> &a,
+                                                      const InListGPU<T> &b,
+                                                      const WaveletSpan<T> &span,
+                                                      const std::vector<T> &args) {
+  ENFORCE_SHAPES(a.shape, b.shape);
+  auto out_shape = this->GetOutputShape(a.shape, b.shape, span);
+  KernelRequirements req;
+  req.output_shapes = {out_shape};
+  // W<T> is spelled out instead of relying on class template argument deduction through
+  // the template template parameter W.
+  wavelet_ = W<T>(args);
+  return req;
+}
+
+// Computes the wavelet values for every sample on the stream in `ctx`.
+// First ComputeInputSamples generates the time points of `span` into scratch memory, then
+// ComputeWavelet evaluates the wavelet for every `a`, `b` and time point and writes `out`.
+// Both kernels are only enqueued; this function does not wait for them to finish.
+template <typename T, template <typename> class W >
+DLL_PUBLIC void WaveletGpu<T, W>::Run(KernelContext &ctx,
+                                      OutListGPU<T> &out,
+                                      const InListGPU<T> &a,
+                                      const InListGPU<T> &b,
+                                      const WaveletSpan<T> &span) {
+  ENFORCE_SHAPES(a.shape, b.shape);
+
+  auto num_samples = a.num_samples();
+  std::vector<SampleDesc<T>> sample_data(num_samples);
+  int64_t max_size_in = 0, max_size_a = 0;
+
+  for (int i = 0; i < num_samples; i++) {
+    auto &sample = sample_data[i];
+    sample.out = out.tensor_data(i);
+    sample.a = a.tensor_data(i);
+    sample.size_a = a.shape.tensor_size(i);
+    max_size_a = std::max(max_size_a, sample.size_a);
+    sample.b = b.tensor_data(i);
+    sample.size_b = b.shape.tensor_size(i);
+    sample.span = span;
+    sample.size_in =
+      std::ceil((sample.span.end - sample.span.begin) * sample.span.sampling_rate) + 1;
+    sample.in = ctx.scratchpad->AllocateGPU<T>(sample.size_in);
+    max_size_in = std::max(max_size_in, sample.size_in);
+  }
+
+  // A grid with a zero-sized dimension is an invalid launch configuration, and in these
+  // cases there is no output element to compute anyway.
+  if (num_samples == 0 || max_size_in <= 0 || max_size_a == 0) {
+    return;
+  }
+
+  auto* sample_data_gpu = std::get<0>(ctx.scratchpad->ToContiguousGPU(ctx.gpu.stream, sample_data));
+
+  // grid1: x covers the time points, y the samples
+  // grid2: x covers the time points, y the `a` coefficients, z the samples
+  dim3 block(32, 32);
+  const int64_t block_size = block.x * block.y;
+  dim3 grid1((max_size_in + block_size - 1) / block_size, num_samples);
+  dim3 grid2((max_size_in + block_size - 1) / block_size, max_size_a, num_samples);
+
+  ComputeInputSamples<<<grid1, block, 0, ctx.gpu.stream>>>(sample_data_gpu);
+  // A kernel launch does not return a status; fetch configuration errors explicitly.
+  CUDA_CALL(cudaGetLastError());
+  // ComputeWavelet does not use dynamically sized shared memory, so none is requested.
+  ComputeWavelet<<<grid2, block, 0, ctx.gpu.stream>>>(sample_data_gpu, wavelet_);
+  CUDA_CALL(cudaGetLastError());
+}
+
+// Computes the output shape. Every output tensor is 3-dimensional:
+//   a coeffs x b coeffs x signal samples
+// where the number of signal samples is ceil((span.end - span.begin) * sampling_rate) + 1.
+// Fails (DALI_ENFORCE) when the span cannot be sampled: the sampling rate must be positive
+// and the end must not precede the begin. NaN values fail these checks as well.
+template <typename T, template <typename> class W >
+TensorListShape<> WaveletGpu<T, W>::GetOutputShape(const TensorListShape<> &a_shape,
+                                                   const TensorListShape<> &b_shape,
+                                                   const WaveletSpan<T> &span) {
+  DALI_ENFORCE(span.sampling_rate > 0, "Wavelet sampling rate must be positive.");
+  DALI_ENFORCE(span.end >= span.begin, "Wavelet span end must not be smaller than its begin.");
+  const int N = a_shape.num_samples();
+  // same expression and 64-bit type as used for SampleDesc::size_in in Run
+  const int64_t in_size = std::ceil((span.end - span.begin) * span.sampling_rate) + 1;
+  TensorListShape<> out_shape(N, 3);
+  for (int i = 0; i < N; i++) {
+    TensorShape<> tshape({a_shape.tensor_shape(i).num_elements(),
+                          b_shape.tensor_shape(i).num_elements(),
+                          in_size});
+    out_shape.set_tensor_shape(i, tshape);
+  }
+  return out_shape;
+}
+
+template class WaveletGpu<float, HaarWavelet>;
+template class WaveletGpu<double, HaarWavelet>;
+template class WaveletGpu<float, GaussianWavelet>;
+template class WaveletGpu<double, GaussianWavelet>;
+template class WaveletGpu<float, MexicanHatWavelet>;
+template class WaveletGpu<double, MexicanHatWavelet>;
+template class WaveletGpu<float, MorletWavelet>;
+template class WaveletGpu<double, MorletWavelet>;
+template class WaveletGpu<float, ShannonWavelet>;
+template class WaveletGpu<double, ShannonWavelet>;
+template class WaveletGpu<float, FbspWavelet>;
+template class WaveletGpu<double, FbspWavelet>;
+
+}  // namespace signal
+}  // namespace kernels
+}  // namespace dali
diff --git a/dali/kernels/signal/wavelet/wavelet_gpu.cuh b/dali/kernels/signal/wavelet/wavelet_gpu.cuh
new file mode 100644
index 0000000000..49a03d8c7b
--- /dev/null
+++ b/dali/kernels/signal/wavelet/wavelet_gpu.cuh
@@ -0,0 +1,101 @@
+// Copyright (c) 2023, NVIDIA CORPORATION. All rights reserved.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#ifndef DALI_KERNELS_SIGNAL_WAVELET_WAVELET_GPU_CUH_
+#define DALI_KERNELS_SIGNAL_WAVELET_WAVELET_GPU_CUH_
+
+#include <memory>
+#include <string>
+#include <vector>
+#include "dali/core/common.h"
+#include "dali/core/error_handling.h"
+#include "dali/core/format.h"
+#include "dali/core/util.h"
+#include "dali/kernels/kernel.h"
+#include "dali/kernels/signal/wavelet/mother_wavelet.cuh"
+
+// Makes sure both tensor lists have the same number of samples and that every tensor in
+// them is one-dimensional; fails with DALI_ENFORCE otherwise.
+// The macro expands to a single statement WITHOUT a trailing semicolon, so that
+// `ENFORCE_SHAPES(a, b);` also works as the body of an unbraced if/else.
+// Both arguments are evaluated more than once and are parenthesized in the expansion.
+#define ENFORCE_SHAPES(a_shape, b_shape)                                     \
+  do {                                                                       \
+    DALI_ENFORCE((a_shape).num_samples() == (b_shape).num_samples(),         \
+                 "a and b tensors must have the same amount of samples.");   \
+    for (int i = 0; i < (a_shape).num_samples(); ++i) {                      \
+      DALI_ENFORCE((a_shape).tensor_shape(i).size() == 1,                    \
+                   "Tensor of a coeffs should be 1-dimensional.");           \
+      DALI_ENFORCE((b_shape).tensor_shape(i).size() == 1,                    \
+                   "Tensor of b coeffs should be 1-dimensional.");           \
+    }                                                                        \
+  } while (0)
+
+namespace dali {
+namespace kernels {
+namespace signal {
+
+// Stores the data needed to reconstruct the wavelet input arguments (time points):
+// the points start at `begin` and are spaced 1 / sampling_rate apart.
+// The struct is a plain aggregate that is instantiated implicitly wherever it is used.
+// It must not be explicitly instantiated in this header, because an explicit instantiation
+// definition may appear only once in a program, while the header is included by many
+// translation units.
+template <typename T = float>
+struct WaveletSpan {
+  // lower limit of wavelet samples
+  T begin = -1.0;
+
+  // upper limit of wavelet samples
+  T end = 1.0;
+
+  // wavelet sampling rate (samples/s)
+  T sampling_rate = 1000.0;
+};
+
+template <typename T>
+struct SampleDesc {  // per-sample data handed to the wavelet CUDA kernels
+  const T *a = nullptr;  // `a` coefficients
+  int64_t size_a = 0;  // number of `a` coefficients
+  const T *b = nullptr;  // `b` coefficients
+  int64_t size_b = 0;  // number of `b` coefficients
+  T *in = nullptr;  // wavelet input time points, written by ComputeInputSamples
+  int64_t size_in = 0;  // number of time points in `in`
+  T *out = nullptr;  // output buffer, written by ComputeWavelet
+  WaveletSpan<T> span;  // range and sampling rate used to generate `in`
+};
+
+template <typename T, template <typename> class W>
+class DLL_PUBLIC WaveletGpu {  // GPU kernel class evaluating wavelet functor W<T> for given a, b
+ public:
+  static_assert(std::is_floating_point<T>::value, "Only floating point types are supported");
+
+  DLL_PUBLIC WaveletGpu() = default;
+  DLL_PUBLIC ~WaveletGpu() = default;
+
+  DLL_PUBLIC KernelRequirements Setup(KernelContext &context, const InListGPU<T> &a,
+                                      const InListGPU<T> &b, const WaveletSpan<T> &span,
+                                      const std::vector<T> &args);  // args: passed to W<T>
+
+  DLL_PUBLIC void Run(KernelContext &ctx, OutListGPU<T> &out, const InListGPU<T> &a,
+                      const InListGPU<T> &b, const WaveletSpan<T> &span);
+
+  static TensorListShape<> GetOutputShape(const TensorListShape<> &a_shape,
+                                          const TensorListShape<> &b_shape,
+                                          const WaveletSpan<T> &span);  // per sample: a x b x time
+
+ private:
+  W<T> wavelet_;  // wavelet functor; assigned in Setup and passed to the CUDA kernel in Run
+};
+
+}  // namespace signal
+}  // namespace kernels
+}  // namespace dali
+
+#endif  // DALI_KERNELS_SIGNAL_WAVELET_WAVELET_GPU_CUH_
diff --git a/dali/operators/signal/CMakeLists.txt b/dali/operators/signal/CMakeLists.txt
index 217f785aa2..44d93c05ba 100644
--- a/dali/operators/signal/CMakeLists.txt
+++ b/dali/operators/signal/CMakeLists.txt
@@ -16,6 +16,7 @@ add_subdirectory(decibel)
 if (BUILD_FFTS)
   add_subdirectory(fft)
 endif()
+add_subdirectory(wavelet)
 
 collect_headers(DALI_INST_HDRS PARENT_SCOPE)
 collect_sources(DALI_OPERATOR_SRCS PARENT_SCOPE)
diff --git a/dali/operators/signal/fft/power_spectrum.h b/dali/operators/signal/fft/power_spectrum.h
index 170818187a..65117ef1c8 100644
--- a/dali/operators/signal/fft/power_spectrum.h
+++ b/dali/operators/signal/fft/power_spectrum.h
@@ -28,8 +28,7 @@ namespace dali {
 template <typename Backend>
 class PowerSpectrum : public Operator<Backend> {
  public:
-  explicit PowerSpectrum(const OpSpec &spec)
-      : Operator<Backend>(spec) {
+  explicit PowerSpectrum(const OpSpec &spec) : Operator<Backend>(spec) {
     fft_args_.nfft = spec.HasArgument("nfft") ? spec.GetArgument<int>("nfft") : -1;
     fft_args_.transform_axis = spec.GetArgument<int>("axis");
     int power = spec.GetArgument<int>("power");
@@ -41,13 +40,17 @@ class PowerSpectrum : public Operator<Backend> {
         fft_args_.spectrum_type = kernels::signal::fft::FFT_SPECTRUM_POWER;
         break;
       default:
-        DALI_FAIL(make_string("Power argument should be either `2` for power spectrum or `1` "
-          "for complex magnitude. Received: ", power));
+        DALI_FAIL(
+            make_string("Power argument should be either `2` for power spectrum or `1` "
+                        "for complex magnitude. Received: ",
+                        power));
     }
   }
 
  protected:
-  bool CanInferOutputs() const override { return true; }
+  bool CanInferOutputs() const override {
+    return true;
+  }
   bool SetupImpl(std::vector<OutputDesc> &output_desc, const Workspace &ws) override;
   void RunImpl(Workspace &ws) override;
 
diff --git a/dali/operators/signal/wavelet/CMakeLists.txt b/dali/operators/signal/wavelet/CMakeLists.txt
new file mode 100644
index 0000000000..0dba230abf
--- /dev/null
+++ b/dali/operators/signal/wavelet/CMakeLists.txt
@@ -0,0 +1,17 @@
+# Copyright (c) 2019, NVIDIA CORPORATION. All rights reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+collect_headers(DALI_INST_HDRS PARENT_SCOPE)
+collect_sources(DALI_OPERATOR_SRCS PARENT_SCOPE)
+collect_test_sources(DALI_OPERATOR_TEST_SRCS PARENT_SCOPE)
diff --git a/dali/operators/signal/wavelet/cwt_op.h b/dali/operators/signal/wavelet/cwt_op.h
new file mode 100644
index 0000000000..59c211cc7f
--- /dev/null
+++ b/dali/operators/signal/wavelet/cwt_op.h
@@ -0,0 +1,73 @@
+// Copyright (c) 2019-2022, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#ifndef DALI_OPERATORS_SIGNAL_WAVELET_CWT_OP_H_
+#define DALI_OPERATORS_SIGNAL_WAVELET_CWT_OP_H_
+
+#include <memory>
+#include <vector>
+#include "dali/core/common.h"
+#include "dali/core/static_switch.h"
+#include "dali/kernels/kernel_manager.h"
+#include "dali/kernels/kernel_params.h"
+#include "dali/kernels/signal/wavelet/cwt_args.h"
+#include "dali/kernels/signal/wavelet/cwt_gpu.h"
+#include "dali/operators/signal/wavelet/wavelet_name.h"
+#include "dali/pipeline/data/types.h"
+#include "dali/pipeline/data/views.h"
+#include "dali/pipeline/operator/common.h"
+#include "dali/pipeline/operator/op_spec.h"
+#include "dali/pipeline/operator/operator.h"
+#include "dali/pipeline/util/operator_impl_utils.h"
+
+namespace dali {
+
+/**
+ * @brief Continuous wavelet transform operator. Reads the `a`, `wavelet` and `wavelet_args`
+ *        arguments from the spec and delegates setup/run to a type-specific implementation.
+ */
+template <typename Backend>
+class Cwt : public Operator<Backend> {
+ public:
+  explicit Cwt(const OpSpec &spec) : Operator<Backend>(spec) {
+    // DALI_ENFORCE takes the condition first; a lone string literal is always true.
+    DALI_ENFORCE(spec.HasArgument("a"), "`a` argument must be provided.");
+    args_.a = spec.GetRepeatedArgument<float>("a");
+    DALI_ENFORCE(spec.HasArgument("wavelet"), "`wavelet` argument must be provided.");
+    args_.wavelet = spec.GetArgument<DALIWaveletName>("wavelet");
+    args_.wavelet_args = spec.GetRepeatedArgument<float>("wavelet_args");
+  }
+
+ protected:
+  bool CanInferOutputs() const override {
+    return true;
+  }
+
+  bool SetupImpl(std::vector<OutputDesc> &output_desc, const Workspace &ws) override;
+
+  void RunImpl(Workspace &ws) override;
+
+  USE_OPERATOR_MEMBERS();
+  using Operator<Backend>::RunImpl;
+
+  kernels::KernelManager kmgr_;
+  kernels::signal::CwtArgs<float> args_;
+
+  std::unique_ptr<OpImplBase<Backend>> impl_;
+  DALIDataType type_ = DALI_NO_TYPE;
+};
+
+}  // namespace dali
+
+#endif  // DALI_OPERATORS_SIGNAL_WAVELET_CWT_OP_H_
diff --git a/dali/operators/signal/wavelet/cwt_op_gpu.cu b/dali/operators/signal/wavelet/cwt_op_gpu.cu
new file mode 100644
index 0000000000..7d3fad3f95
--- /dev/null
+++ b/dali/operators/signal/wavelet/cwt_op_gpu.cu
@@ -0,0 +1,177 @@
+// Copyright (c) 2019-2022, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#include <memory>
+#include <utility>
+#include <vector>
+#include "dali/core/dev_buffer.h"
+#include "dali/core/static_switch.h"
+#include "dali/core/tensor_shape.h"
+#include "dali/kernels/kernel_manager.h"
+#include "dali/kernels/kernel_params.h"
+#include "dali/kernels/signal/wavelet/cwt_args.h"
+#include "dali/kernels/signal/wavelet/cwt_gpu.h"
+#include "dali/kernels/signal/wavelet/wavelet_gpu.cuh"
+#include "dali/operators/signal/wavelet/cwt_op.h"
+#include "dali/operators/signal/wavelet/wavelet_run.h"
+#include "dali/pipeline/data/types.h"
+#include "dali/pipeline/data/views.h"
+#include "dali/pipeline/operator/op_schema.h"
+
+namespace dali {
+
+DALI_SCHEMA(Cwt)
+    .DocStr(R"(Performs continuous wavelet transform on a 1D signal (for example, audio).
+
+Result values of transform are computed for all specified scales.
+Input data is expected to be one channel (shape being ``(nsamples,)`` or ``(nsamples, 1)``)
+of type float32.)")
+    .NumInput(1)
+    .NumOutput(1)
+    .AddArg("a", R"(List of scale coefficients of type float32.)", DALIDataType::DALI_FLOAT_VEC)
+    .AddArg("wavelet", R"(Name of mother wavelet. Currently supported wavelets' names are:
+- HAAR - Haar wavelet
+- GAUS - Gaussian wavelet
+- MEXH - Mexican hat wavelet
+- MORL - Morlet wavelet
+- SHAN - Shannon wavelet
+- FBSP - Frequency B-spline wavelet)",
+            DALIDataType::DALI_WAVELET_NAME)
+    .AddArg("wavelet_args", R"(Additional arguments for mother wavelet. They are passed
+as list of float32 values.
+- HAAR - none
+- GAUS - n (order of derivative)
+- MEXH - sigma
+- MORL - none
+- SHAN - fb (bandwidth parameter > 0), fc (center frequency > 0)
+- FBSP - m (order parameter >= 1), fb (bandwidth parameter > 0), fc (center frequency > 0)
+)",
+            DALIDataType::DALI_FLOAT_VEC);
+
+// GPU implementation used by Cwt<GPUBackend>. In this file it only drives the wavelet kernel
+// selected by args_.wavelet; the CwtKernel and WvltKernel aliases are not used here.
+template <typename T>
+struct CwtImplGPU : public OpImplBase<GPUBackend> {
+ public:
+  using CwtArgs = kernels::signal::CwtArgs<T>;
+  using CwtKernel = kernels::signal::CwtGpu<T>;
+
+  template <template <typename> class W>
+  using WvltKernel = kernels::signal::WaveletGpu<T, W>;
+
+  // Stores the arguments and resizes the kernel manager for the selected wavelet.
+  explicit CwtImplGPU(CwtArgs args) : args_(std::move(args)) {
+    ResizeWaveletKernelForName<T>(args_.wavelet, kmgr_wvlt_);
+  }
+
+  // Sets up the wavelet kernel and reports its output shape as the operator output.
+  bool SetupImpl(std::vector<OutputDesc> &output_desc, const Workspace &ws) override;
+
+  void RunImpl(Workspace &ws) override;
+
+  // Span passed to the wavelet kernel: begin = -1, end = 1, sampling_rate = 1000 (hard-coded).
+  dali::kernels::signal::WaveletSpan<T> GetDefaultSpan() {
+    dali::kernels::signal::WaveletSpan<T> def_span;
+    def_span.begin = -1.0f;
+    def_span.end = 1.0f;
+    def_span.sampling_rate = 1000;
+    return def_span;
+  }
+
+ private:
+  CwtArgs args_;
+  // Kernel manager for the WaveletGpu kernel resized in the constructor.
+  kernels::KernelManager kmgr_wvlt_;
+};
+
+// Sets up the wavelet kernel using shape-only views of `a` and `b` (null data pointers) and
+// exposes the kernel's first output shape, with element type T, as the single operator output.
+template <typename T>
+bool CwtImplGPU<T>::SetupImpl(std::vector<OutputDesc> &output_desc, const Workspace &ws) {
+  kernels::KernelContext ctx;
+  ctx.gpu.stream = ws.stream();
+  auto type = type2id<T>::value;
+
+  dali::kernels::signal::WaveletSpan<T> def_span = GetDefaultSpan();
+
+  // Sample 0 has as many elements as there are scale coefficients in args_.a.
+  TensorListShape<> a_shape(1, {1});
+  a_shape.set_tensor_shape(0, {args_.a.size()});
+  TensorListView<StorageGPU, const T> a_view = make_tensor_list_gpu((T *)nullptr, a_shape);
+
+  // Sample 0 has a single element.
+  TensorListShape<> b_shape(1, {1});
+  b_shape.set_tensor_shape(0, {1});
+  TensorListView<StorageGPU, const T> b_view = make_tensor_list_gpu((T *)nullptr, b_shape);
+
+  auto &req = SetupWaveletKernelForName(args_.wavelet, kmgr_wvlt_, ctx, a_view, b_view, def_span,
+                                        args_.wavelet_args);
+
+  output_desc.resize(1);
+  output_desc[0].type = type;
+  output_desc[0].shape = req.output_shapes[0];
+  return true;
+}
+
+// Uploads the scales (`a`) and a single zero (`b`) to the device and runs the wavelet kernel.
+template <typename T>
+void CwtImplGPU<T>::RunImpl(Workspace &ws) {
+  kernels::KernelContext ctx;
+  ctx.gpu.stream = ws.stream();
+  auto &output = ws.Output<GPUBackend>(0);
+  // Upload on the kernel's stream so the copies are ordered before the kernel that reads them.
+  DeviceBuffer<T> a_buffer;
+  a_buffer.from_host(args_.a, ctx.gpu.stream);
+  TensorListShape<> a_shape(1, {1});
+  a_shape.set_tensor_shape(0, {args_.a.size()});
+  TensorListView<StorageGPU, const T> a_view = make_tensor_list_gpu(a_buffer.data(), a_shape);
+
+  std::vector<T> zero(1, T(0));  // `b` is a single zero
+  DeviceBuffer<T> b_buffer;
+  b_buffer.from_host(zero, ctx.gpu.stream);
+  TensorListShape<> b_shape(1, {1});
+  b_shape.set_tensor_shape(0, {1});
+  TensorListView<StorageGPU, const T> b_view = make_tensor_list_gpu(b_buffer.data(), b_shape);
+
+  dali::kernels::signal::WaveletSpan<T> def_span = GetDefaultSpan();
+  auto out_view = view<T>(output);
+  RunWaveletKernelForName(args_.wavelet, kmgr_wvlt_, ctx, out_view, a_view, b_view, def_span);
+}
+
+// Picks the typed implementation for the input type and returns the result of its setup.
+template <>
+bool Cwt<GPUBackend>::SetupImpl(std::vector<OutputDesc> &output_desc, const Workspace &ws) {
+  output_desc.resize(1);
+  const auto &input = ws.Input<GPUBackend>(0);
+  auto type = input.type();
+  TYPE_SWITCH(type, type2id, T, (float), (
+      using Impl = CwtImplGPU<T>;
+      if (!impl_ || type != type_) {
+        impl_ = std::make_unique<Impl>(args_);
+        type_ = type;
+      }
+  ), DALI_FAIL(make_string("Unsupported data type: ", type)));  // NOLINT
+
+  return impl_->SetupImpl(output_desc, ws);
+}
+
+template <>
+void Cwt<GPUBackend>::RunImpl(Workspace &ws) {
+  assert(impl_ != nullptr);  // impl_ is created by SetupImpl
+  impl_->RunImpl(ws);
+}
+
+DALI_REGISTER_OPERATOR(Cwt, Cwt<GPUBackend>, GPU);
+
+}  // namespace dali
diff --git a/dali/operators/signal/wavelet/wavelet_name.h b/dali/operators/signal/wavelet/wavelet_name.h
new file mode 100644
index 0000000000..e101040b14
--- /dev/null
+++ b/dali/operators/signal/wavelet/wavelet_name.h
@@ -0,0 +1,34 @@
+// Copyright (c) 2023, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#ifndef DALI_OPERATORS_SIGNAL_WAVELET_WAVELET_NAME_H_
+#define DALI_OPERATORS_SIGNAL_WAVELET_WAVELET_NAME_H_
+
+namespace dali {
+
+/**
+ * @brief Supported wavelet names
+ */
+enum DALIWaveletName {
+  DALI_HAAR = 0,  ///< Haar wavelet
+  DALI_GAUS = 1,  ///< Gaussian wavelet
+  DALI_MEXH = 2,  ///< Mexican hat wavelet
+  DALI_MORL = 3,  ///< Morlet wavelet
+  DALI_SHAN = 4,  ///< Shannon wavelet
+  DALI_FBSP = 5   ///< Frequency B-spline wavelet
+};
+
+}  // namespace dali
+
+#endif  // DALI_OPERATORS_SIGNAL_WAVELET_WAVELET_NAME_H_
diff --git a/dali/operators/signal/wavelet/wavelet_run.h b/dali/operators/signal/wavelet/wavelet_run.h
new file mode 100644
index 0000000000..676f092d1f
--- /dev/null
+++ b/dali/operators/signal/wavelet/wavelet_run.h
@@ -0,0 +1,168 @@
+// Copyright (c) 2023, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#ifndef DALI_OPERATORS_SIGNAL_WAVELET_WAVELET_RUN_H_
+#define DALI_OPERATORS_SIGNAL_WAVELET_WAVELET_RUN_H_
+
+#include <vector>
+#include "dali/core/format.h"
+#include "dali/core/geom/mat.h"
+#include "dali/core/static_switch.h"
+#include "dali/kernels/kernel_manager.h"
+#include "dali/kernels/signal/wavelet/mother_wavelet.cuh"
+#include "dali/kernels/signal/wavelet/wavelet_gpu.cuh"
+#include "dali/pipeline/operator/operator.h"
+
+namespace dali {
+
+
+// Resizes `kmgr` for the WaveletGpu<T, W> kernel, i.e. for one specific wavelet type.
+template <typename T, template <typename> class W>
+void ResizeWaveletKernel(kernels::KernelManager &kmgr) {
+  // The manager is resized with a size of 1.
+  kmgr.template Resize<kernels::signal::WaveletGpu<T, W>>(1);
+}
+
+
+/**
+ * @brief Translates a wavelet name to its type and runs ResizeWaveletKernel() for that type.
+ *
+ * @throws std::invalid_argument when `name` is not one of the handled DALIWaveletName values.
+ */
+template <typename T>
+void ResizeWaveletKernelForName(const DALIWaveletName &name, kernels::KernelManager &kmgr) {
+  namespace wvlt = kernels::signal;
+  switch (name) {
+    case DALIWaveletName::DALI_HAAR:
+      ResizeWaveletKernel<T, wvlt::HaarWavelet>(kmgr);
+      break;
+    case DALIWaveletName::DALI_GAUS:
+      ResizeWaveletKernel<T, wvlt::GaussianWavelet>(kmgr);
+      break;
+    case DALIWaveletName::DALI_MEXH:
+      ResizeWaveletKernel<T, wvlt::MexicanHatWavelet>(kmgr);
+      break;
+    case DALIWaveletName::DALI_MORL:
+      ResizeWaveletKernel<T, wvlt::MorletWavelet>(kmgr);
+      break;
+    case DALIWaveletName::DALI_SHAN:
+      ResizeWaveletKernel<T, wvlt::ShannonWavelet>(kmgr);
+      break;
+    case DALIWaveletName::DALI_FBSP:
+      ResizeWaveletKernel<T, wvlt::FbspWavelet>(kmgr);
+      break;
+    default:
+      throw std::invalid_argument("Unknown wavelet name.");
+  }
+}
+
+
+// Sets up the WaveletGpu<T, W> kernel for one specific wavelet type, passing index 0 to `kmgr`,
+// and returns the requirements reported by the kernel manager.
+template <typename T, template <typename> class W>
+dali::kernels::KernelRequirements &SetupWaveletKernel(kernels::KernelManager &kmgr,
+                                                      kernels::KernelContext &ctx,
+                                                      TensorListView<StorageGPU, const T> &a,
+                                                      TensorListView<StorageGPU, const T> &b,
+                                                      const kernels::signal::WaveletSpan<T> &span,
+                                                      const std::vector<T> &args) {
+  return kmgr.Setup<kernels::signal::WaveletGpu<T, W>>(0, ctx, a, b, span, args);
+}
+
+/**
+ * @brief Translates a wavelet name to its type and runs SetupWaveletKernel() for that type.
+ * @param name  wavelet selector
+ * @param kmgr  kernel manager forwarded to SetupWaveletKernel()
+ * @param ctx   kernel context forwarded to SetupWaveletKernel()
+ * @param a     first tensor list view forwarded to the kernel setup
+ * @param b     second tensor list view forwarded to the kernel setup
+ * @param span  wavelet span forwarded to the kernel setup
+ * @param args  wavelet-specific arguments forwarded to the kernel setup
+ * @return reference to the requirements returned by SetupWaveletKernel()
+ * @throws std::invalid_argument when `name` is not one of the handled DALIWaveletName values
+ */
+template <typename T>
+dali::kernels::KernelRequirements &SetupWaveletKernelForName(
+    const DALIWaveletName &name, kernels::KernelManager &kmgr, kernels::KernelContext &ctx,
+    TensorListView<StorageGPU, const T> &a, TensorListView<StorageGPU, const T> &b,
+    const kernels::signal::WaveletSpan<T> &span, const std::vector<T> &args) {
+  namespace wvlt = kernels::signal;
+  switch (name) {
+    case DALIWaveletName::DALI_HAAR:
+      return SetupWaveletKernel<T, wvlt::HaarWavelet>(kmgr, ctx, a, b, span, args);
+    case DALIWaveletName::DALI_GAUS:
+      return SetupWaveletKernel<T, wvlt::GaussianWavelet>(kmgr, ctx, a, b, span, args);
+    case DALIWaveletName::DALI_MEXH:
+      return SetupWaveletKernel<T, wvlt::MexicanHatWavelet>(kmgr, ctx, a, b, span, args);
+    case DALIWaveletName::DALI_MORL:
+      return SetupWaveletKernel<T, wvlt::MorletWavelet>(kmgr, ctx, a, b, span, args);
+    case DALIWaveletName::DALI_SHAN:
+      return SetupWaveletKernel<T, wvlt::ShannonWavelet>(kmgr, ctx, a, b, span, args);
+    case DALIWaveletName::DALI_FBSP:
+      return SetupWaveletKernel<T, wvlt::FbspWavelet>(kmgr, ctx, a, b, span, args);
+    default:
+      throw std::invalid_argument("Unknown wavelet name.");
+  }
+}
+
+// Runs the WaveletGpu<T, W> kernel for one specific wavelet type, passing index 0 to `kmgr`
+// and forwarding the output view, both input views and the span unchanged.
+template <typename T, template <typename> class W>
+void RunWaveletKernel(kernels::KernelManager &kmgr, kernels::KernelContext &ctx,
+                      TensorListView<StorageGPU, T> &out, TensorListView<StorageGPU, const T> &a,
+                      TensorListView<StorageGPU, const T> &b,
+                      const kernels::signal::WaveletSpan<T> &span) {
+  kmgr.Run<kernels::signal::WaveletGpu<T, W>>(0, ctx, out, a, b, span);
+}
+
+/**
+ * @brief Translates a wavelet name to its type and runs RunWaveletKernel() for that type.
+ *
+ * All arguments other than `name` are forwarded unchanged to RunWaveletKernel().
+ * @throws std::invalid_argument when `name` is not one of the handled DALIWaveletName values
+ */
+template <typename T>
+void RunWaveletKernelForName(const DALIWaveletName &name, kernels::KernelManager &kmgr,
+                             kernels::KernelContext &ctx, TensorListView<StorageGPU, T> &out,
+                             TensorListView<StorageGPU, const T> &a,
+                             TensorListView<StorageGPU, const T> &b,
+                             const kernels::signal::WaveletSpan<T> &span) {
+  namespace wvlt = kernels::signal;
+  switch (name) {
+    case DALIWaveletName::DALI_HAAR:
+      RunWaveletKernel<T, wvlt::HaarWavelet>(kmgr, ctx, out, a, b, span);
+      break;
+    case DALIWaveletName::DALI_GAUS:
+      RunWaveletKernel<T, wvlt::GaussianWavelet>(kmgr, ctx, out, a, b, span);
+      break;
+    case DALIWaveletName::DALI_MEXH:
+      RunWaveletKernel<T, wvlt::MexicanHatWavelet>(kmgr, ctx, out, a, b, span);
+      break;
+    case DALIWaveletName::DALI_MORL:
+      RunWaveletKernel<T, wvlt::MorletWavelet>(kmgr, ctx, out, a, b, span);
+      break;
+    case DALIWaveletName::DALI_SHAN:
+      RunWaveletKernel<T, wvlt::ShannonWavelet>(kmgr, ctx, out, a, b, span);
+      break;
+    case DALIWaveletName::DALI_FBSP:
+      RunWaveletKernel<T, wvlt::FbspWavelet>(kmgr, ctx, out, a, b, span);
+      break;
+    default:
+      throw std::invalid_argument("Unknown wavelet name.");
+  }
+}
+
+}  // namespace dali
+
+#endif  // DALI_OPERATORS_SIGNAL_WAVELET_WAVELET_RUN_H_
diff --git a/dali/pipeline/data/types.h b/dali/pipeline/data/types.h
index 4c77204d59..a517493283 100644
--- a/dali/pipeline/data/types.h
+++ b/dali/pipeline/data/types.h
@@ -30,6 +30,7 @@
 #include "dali/core/float16.h"
 #include "dali/core/cuda_error.h"
 #include "dali/core/tensor_layout.h"
+#include "dali/operators/signal/wavelet/wavelet_name.h"
 
 #ifdef DALI_BUILD_PROTO3
 #include "dali/operators/reader/parser/tf_feature.h"
@@ -123,6 +124,7 @@ enum DALIDataType : int {
   DALI_PYTHON_OBJECT     = 24,
   DALI_TENSOR_LAYOUT_VEC = 25,
   DALI_DATA_TYPE_VEC     = 26,
+  DALI_WAVELET_NAME      = 27,
   DALI_DATATYPE_END      = 1000
 };
 
@@ -202,6 +204,9 @@ inline const char *GetBuiltinTypeName(DALIDataType t) {
     case DALI_INTERP_TYPE:
       return "DALIInterpType";
       break;
+    case DALI_WAVELET_NAME:
+      return "DALIWaveletName";
+      break;
     case DALI_TENSOR_LAYOUT:
       return "TensorLayout";
       break;
@@ -557,24 +562,25 @@ DLL_PUBLIC inline bool IsValidType(const TypeInfo &type) {
   DALI_REGISTER_TYPE_IMPL(Type, dtype);
 
 // Instantiate some basic types
-DALI_REGISTER_TYPE(NoType,         DALI_NO_TYPE);
-DALI_REGISTER_TYPE(uint8_t,        DALI_UINT8);
-DALI_REGISTER_TYPE(uint16_t,       DALI_UINT16);
-DALI_REGISTER_TYPE(uint32_t,       DALI_UINT32);
-DALI_REGISTER_TYPE(uint64_t,       DALI_UINT64);
-DALI_REGISTER_TYPE(int8_t,         DALI_INT8);
-DALI_REGISTER_TYPE(int16_t,        DALI_INT16);
-DALI_REGISTER_TYPE(int32_t,        DALI_INT32);
-DALI_REGISTER_TYPE(int64_t,        DALI_INT64);
-DALI_REGISTER_TYPE(float16,        DALI_FLOAT16);
-DALI_REGISTER_TYPE(float,          DALI_FLOAT);
-DALI_REGISTER_TYPE(double,         DALI_FLOAT64);
-DALI_REGISTER_TYPE(bool,           DALI_BOOL);
-DALI_REGISTER_TYPE(string,         DALI_STRING);
-DALI_REGISTER_TYPE(DALIImageType,  DALI_IMAGE_TYPE);
-DALI_REGISTER_TYPE(DALIDataType,   DALI_DATA_TYPE);
-DALI_REGISTER_TYPE(DALIInterpType, DALI_INTERP_TYPE);
-DALI_REGISTER_TYPE(TensorLayout,   DALI_TENSOR_LAYOUT);
+DALI_REGISTER_TYPE(NoType,          DALI_NO_TYPE);
+DALI_REGISTER_TYPE(uint8_t,         DALI_UINT8);
+DALI_REGISTER_TYPE(uint16_t,        DALI_UINT16);
+DALI_REGISTER_TYPE(uint32_t,        DALI_UINT32);
+DALI_REGISTER_TYPE(uint64_t,        DALI_UINT64);
+DALI_REGISTER_TYPE(int8_t,          DALI_INT8);
+DALI_REGISTER_TYPE(int16_t,         DALI_INT16);
+DALI_REGISTER_TYPE(int32_t,         DALI_INT32);
+DALI_REGISTER_TYPE(int64_t,         DALI_INT64);
+DALI_REGISTER_TYPE(float16,         DALI_FLOAT16);
+DALI_REGISTER_TYPE(float,           DALI_FLOAT);
+DALI_REGISTER_TYPE(double,          DALI_FLOAT64);
+DALI_REGISTER_TYPE(bool,            DALI_BOOL);
+DALI_REGISTER_TYPE(string,          DALI_STRING);
+DALI_REGISTER_TYPE(DALIImageType,   DALI_IMAGE_TYPE);
+DALI_REGISTER_TYPE(DALIDataType,    DALI_DATA_TYPE);
+DALI_REGISTER_TYPE(DALIInterpType,  DALI_INTERP_TYPE);
+DALI_REGISTER_TYPE(DALIWaveletName, DALI_WAVELET_NAME);
+DALI_REGISTER_TYPE(TensorLayout,    DALI_TENSOR_LAYOUT);
 
 
 #ifdef DALI_BUILD_PROTO3
diff --git a/dali/python/backend_impl.cc b/dali/python/backend_impl.cc
index d9846acf3b..f5de76b215 100644
--- a/dali/python/backend_impl.cc
+++ b/dali/python/backend_impl.cc
@@ -27,6 +27,7 @@
 #include "dali/operators.h"
 #include "dali/kernels/kernel.h"
 #include "dali/operators/reader/parser/tfrecord_parser.h"
+#include "dali/operators/signal/wavelet/wavelet_name.h"
 #include "dali/pipeline/data/copy_to_external.h"
 #include "dali/pipeline/data/dltensor.h"
 #include "dali/pipeline/data/tensor.h"
@@ -121,8 +122,7 @@ py::dict ArrayInterfaceRepr(Tensor<Backend> &t) {
   d["shape"] = py::tuple(py_shape<Backend>(t));
   // tuple of (raw_data_pointer, if_data_is_read_only)
   tup[0] = py::reinterpret_borrow<py::object>(PyLong_FromVoidPtr(t.raw_mutable_data()));
-  // if we make it readonly, it prevents us from sharing memory with PyTorch tensor
-  tup[1] = false;
+  tup[1] = true;
   d["data"] = tup;
   if (std::is_same<Backend, GPUBackend>::value) {
     // see https://numba.pydata.org/numba-doc/dev/cuda/cuda_array_interface.html
@@ -1719,6 +1719,7 @@ PYBIND11_MODULE(backend_impl, m) {
     .value("IMAGE_TYPE",    DALI_IMAGE_TYPE)
     .value("DATA_TYPE",     DALI_DATA_TYPE)
     .value("INTERP_TYPE",   DALI_INTERP_TYPE)
+    .value("WAVELET_NAME",  DALI_WAVELET_NAME)
     .value("TENSOR_LAYOUT", DALI_TENSOR_LAYOUT)
     .value("PYTHON_OBJECT", DALI_PYTHON_OBJECT)
     .value("_TENSOR_LAYOUT_VEC", DALI_TENSOR_LAYOUT_VEC)
@@ -1763,6 +1764,16 @@ PYBIND11_MODULE(backend_impl, m) {
     .value("INTERP_GAUSSIAN", DALI_INTERP_GAUSSIAN)
     .export_values();
 
+  // DALIWaveletName
+  py::enum_<DALIWaveletName>(types_m, "DALIWaveletName", "Wavelet name\n<SPHINX_IGNORE>")
+    .value("HAAR", DALI_HAAR)
+    .value("GAUS", DALI_GAUS)
+    .value("MEXH", DALI_MEXH)
+    .value("MORL", DALI_MORL)
+    .value("SHAN", DALI_SHAN)
+    .value("FBSP", DALI_FBSP)
+    .export_values();
+
   // Operator node
   py::class_<OpNode>(m, "OpNode")
     .def("instance_name",
@@ -2047,6 +2058,7 @@ PYBIND11_MODULE(backend_impl, m) {
     DALI_OPSPEC_ADDARG(DALIDataType)
     DALI_OPSPEC_ADDARG(DALIImageType)
     DALI_OPSPEC_ADDARG(DALIInterpType)
+    DALI_OPSPEC_ADDARG(DALIWaveletName)
 #ifdef DALI_BUILD_PROTO3
     DALI_OPSPEC_ADDARG(TFFeature)
 #endif
diff --git a/dali/python/nvidia/dali/types.py b/dali/python/nvidia/dali/types.py
index f4362fd224..5d56077ee6 100644
--- a/dali/python/nvidia/dali/types.py
+++ b/dali/python/nvidia/dali/types.py
@@ -16,7 +16,8 @@
 from enum import Enum, unique
 import re
 
-from nvidia.dali.backend_impl.types import DALIDataType, DALIImageType, DALIInterpType
+from nvidia.dali.backend_impl.types import DALIDataType, DALIImageType, \
+        DALIInterpType, DALIWaveletName
 
 # TODO: Handle forwarding imports from backend_impl
 from nvidia.dali.backend_impl.types import *        # noqa: F401, F403
@@ -63,6 +64,8 @@ def _not_implemented(val):
     DALIDataType.DATA_TYPE: ("nvidia.dali.types.DALIDataType", lambda x: DALIDataType(int(x))),
     DALIDataType.INTERP_TYPE:
     ("nvidia.dali.types.DALIInterpType", lambda x: DALIInterpType(int(x))),
+    DALIDataType.WAVELET_NAME:
+    ("nvidia.dali.types.DALIWaveletName", lambda x: DALIWaveletName(int(x))),
     DALIDataType.TENSOR_LAYOUT: (":ref:`layout str<layout_str_doc>`", lambda x: str(x)),
     DALIDataType.PYTHON_OBJECT: ("object", lambda x: x),
     DALIDataType._TENSOR_LAYOUT_VEC:
diff --git a/dali/test/python/operator_2/test_cwt.py b/dali/test/python/operator_2/test_cwt.py
new file mode 100644
index 0000000000..c5eb5dddf1
--- /dev/null
+++ b/dali/test/python/operator_2/test_cwt.py
@@ -0,0 +1,42 @@
+# Copyright (c) 2023, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+import numpy as np
+import sys
+import matplotlib.pyplot as plt
+from nvidia.dali import pipeline_def, fn, types
+
+def get_data():
+    s1 = np.array([2.3, 4.5, 1000.2, 4.8, 6.8, 4.5], dtype=np.float32)
+    s2 = np.array([5.53, 4.6, 10.2, 0.8, 0.3], dtype=np.float32)
+    s3 = [5.3, 94.6, 10.2, 0.8, 0.3]
+    s4 = [5.23, 4.6, 10.2, 0.85, 0.3, 8.9, 2.3]
+    s5 = [5.3, 4.6, 103.2, 0.8, 0.36, 4.4]
+
+    return [s1]
+
+@pipeline_def(num_threads = 1, device_id = 0)
+def get_pipeline():
+    data = fn.external_source(get_data, batch=True, dtype=types.FLOAT)
+    result = fn.cwt(data.gpu(), device="gpu", a=[1.0, 2.0, 4.5], wavelet=types.MEXH, wavelet_args=[1.0])
+    return data, result
+
+pipe = get_pipeline(batch_size=1, device_id=0)
+pipe.build()
+data, result = pipe.run()
+print(result.as_cpu())
+res = [np.array(r) for r in result.as_cpu()]
+
+np.set_printoptions(threshold=sys.maxsize)
+print(res[0][0][0])
\ No newline at end of file