[feat][assistant][I3CEGC] add op timestretch

This commit is contained in:
chenx2ovo 2021-08-07 22:53:41 +08:00
parent 3693625d6f
commit 04705e5b0d
21 changed files with 1024 additions and 3 deletions

View File

@@ -23,6 +23,7 @@
#include "minddata/dataset/audio/ir/kernels/bandpass_biquad_ir.h"
#include "minddata/dataset/audio/ir/kernels/bandreject_biquad_ir.h"
#include "minddata/dataset/audio/ir/kernels/bass_biquad_ir.h"
#include "minddata/dataset/audio/ir/kernels/time_stretch_ir.h"
namespace mindspore {
namespace dataset {
@@ -132,6 +133,23 @@ BassBiquad::BassBiquad(int32_t sample_rate, float gain, float central_freq, floa
std::shared_ptr<TensorOperation> BassBiquad::Parse() {
return std::make_shared<BassBiquadOperation>(data_->sample_rate_, data_->gain_, data_->central_freq_, data_->Q_);
}
// TimeStretch Operation.
struct TimeStretch::Data {
explicit Data(float hop_length, int n_freq, float fixed_rate)
: hop_length_(hop_length), n_freq_(n_freq), fixed_rate_(fixed_rate) {}
float hop_length_;
int n_freq_;
float fixed_rate_;
};
TimeStretch::TimeStretch(float hop_length, int n_freq, float fixed_rate)
: data_(std::make_shared<Data>(hop_length, n_freq, fixed_rate)) {}
std::shared_ptr<TensorOperation> TimeStretch::Parse() {
return std::make_shared<TimeStretchOperation>(data_->hop_length_, data_->n_freq_, data_->fixed_rate_);
}
} // namespace audio
} // namespace dataset
} // namespace mindspore

View File

@@ -24,6 +24,7 @@
#include "minddata/dataset/audio/ir/kernels/bandpass_biquad_ir.h"
#include "minddata/dataset/audio/ir/kernels/bandreject_biquad_ir.h"
#include "minddata/dataset/audio/ir/kernels/bass_biquad_ir.h"
#include "minddata/dataset/audio/ir/kernels/time_stretch_ir.h"
#include "minddata/dataset/include/dataset/transforms.h"
namespace mindspore {
@@ -113,5 +114,15 @@ PYBIND_REGISTER(
}));
}));
PYBIND_REGISTER(
TimeStretchOperation, 1, ([](const py::module *m) {
(void)py::class_<audio::TimeStretchOperation, TensorOperation, std::shared_ptr<audio::TimeStretchOperation>>(
*m, "TimeStretchOperation")
.def(py::init([](float hop_length, int n_freq, float fixed_rate) {
auto timestretch = std::make_shared<audio::TimeStretchOperation>(hop_length, n_freq, fixed_rate);
THROW_IF_ERROR(timestretch->ValidateParams());
return timestretch;
}));
}));
} // namespace dataset
} // namespace mindspore

View File

@@ -9,4 +9,5 @@ add_library(audio-ir-kernels OBJECT
bandpass_biquad_ir.cc
bandreject_biquad_ir.cc
bass_biquad_ir.cc
time_stretch_ir.cc
)

View File

@@ -0,0 +1,56 @@
/**
* Copyright 2021 Huawei Technologies Co., Ltd
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#include "minddata/dataset/audio/ir/kernels/time_stretch_ir.h"
#include "minddata/dataset/audio/kernels/time_stretch_op.h"
#include "minddata/dataset/audio/ir/validators.h"
namespace mindspore {
namespace dataset {
namespace audio {
// TimeStretch
TimeStretchOperation::TimeStretchOperation(float hop_length, int n_freq, float fixed_rate)
: hop_length_(hop_length), n_freq_(n_freq), fixed_rate_(fixed_rate) {}
TimeStretchOperation::~TimeStretchOperation() = default;
std::string TimeStretchOperation::Name() const { return kTimeStretchOperation; }
Status TimeStretchOperation::ValidateParams() {
// param check
RETURN_IF_NOT_OK(CheckFloatScalarPositive("TimeStretch", "hop_length", hop_length_));
RETURN_IF_NOT_OK(CheckIntScalarPositive("TimeStretch", "n_freq", n_freq_));
RETURN_IF_NOT_OK(CheckFloatScalarNotNan("TimeStretch", "fixed_rate", fixed_rate_));
RETURN_IF_NOT_OK(CheckFloatScalarPositive("TimeStretch", "fixed_rate", fixed_rate_));
return Status::OK();
}
std::shared_ptr<TensorOp> TimeStretchOperation::Build() {
std::shared_ptr<TimeStretchOp> tensor_op = std::make_shared<TimeStretchOp>(hop_length_, n_freq_, fixed_rate_);
return tensor_op;
}
Status TimeStretchOperation::to_json(nlohmann::json *out_json) {
nlohmann::json args;
args["hop_length"] = hop_length_;
args["n_freq"] = n_freq_;
args["fixed_rate"] = fixed_rate_;
*out_json = args;
return Status::OK();
}
} // namespace audio
} // namespace dataset
} // namespace mindspore
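For reference, a minimal sketch of exercising the to_json hook above. The helper name is hypothetical and not part of this commit; only APIs introduced here are assumed:

#include <nlohmann/json.hpp>
#include "minddata/dataset/audio/ir/kernels/time_stretch_ir.h"

// Hypothetical helper, not part of this commit: serialize the op's parameters.
void DumpTimeStretchJson() {
  // Arbitrary values: hop_length=512, n_freq=1025, fixed_rate=1.3.
  mindspore::dataset::audio::TimeStretchOperation op(512.0f, 1025, 1.3f);
  nlohmann::json args;
  if (op.to_json(&args).IsOk()) {
    // args now holds {"fixed_rate": 1.3, "hop_length": 512.0, "n_freq": 1025}.
  }
}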

View File

@@ -0,0 +1,55 @@
/**
* Copyright 2021 Huawei Technologies Co., Ltd
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#ifndef MINDSPORE_CCSRC_MINDDATA_DATASET_AUDIO_IR_KERNELS_TIME_STRETCH_IR_H_
#define MINDSPORE_CCSRC_MINDDATA_DATASET_AUDIO_IR_KERNELS_TIME_STRETCH_IR_H_
#include <memory>
#include <string>
#include "include/api/status.h"
#include "minddata/dataset/kernels/ir/tensor_operation.h"
namespace mindspore {
namespace dataset {
namespace audio {
constexpr char kTimeStretchOperation[] = "TimeStretch";
class TimeStretchOperation : public TensorOperation {
public:
TimeStretchOperation(float hop_length, int n_freq, float fixed_rate);
~TimeStretchOperation();
std::shared_ptr<TensorOp> Build() override;
Status ValidateParams() override;
std::string Name() const override;
Status to_json(nlohmann::json *out_json) override;
private:
float hop_length_;
int n_freq_;
float fixed_rate_;
};
} // namespace audio
} // namespace dataset
} // namespace mindspore
#endif // MINDSPORE_CCSRC_MINDDATA_DATASET_AUDIO_IR_KERNELS_TIME_STRETCH_IR_H_

View File

@@ -23,11 +23,25 @@ Status CheckFloatScalarPositive(const std::string &op_name, const std::string &s
return Status::OK();
}
Status CheckFloatScalarNotNan(const std::string &op_name, const std::string &scalar_name, float scalar) {
if (std::isnan(scalar)) {
std::string err_msg = op_name + ":" + scalar_name + " should be specified, got: NaN.";
MS_LOG(ERROR) << err_msg;
return Status(StatusCode::kMDSyntaxError, __LINE__, __FILE__, err_msg);
}
return Status::OK();
}
Status CheckFloatScalarNonNegative(const std::string &op_name, const std::string &scalar_name, float scalar) {
RETURN_IF_NOT_OK(CheckScalar(op_name, scalar_name, scalar, {0}, false));
return Status::OK();
}
Status CheckIntScalarPositive(const std::string &op_name, const std::string &scalar_name, int32_t scalar) {
RETURN_IF_NOT_OK(CheckScalar(op_name, scalar_name, scalar, {0}, true));
return Status::OK();
}
Status CheckStringScalarInList(const std::string &op_name, const std::string &scalar_name, const std::string &scalar,
const std::vector<std::string> &str_vec) {
auto ret = std::find(str_vec.begin(), str_vec.end(), scalar);
@@ -78,5 +92,7 @@ Status CheckScalar(const std::string &op_name, const std::string &scalar_name, c
template Status CheckScalar(const std::string &op_name, const std::string &scalar_name, const float scalar,
const std::vector<float> &range, bool left_open_interval, bool right_open_interval);
template Status CheckScalar(const std::string &op_name, const std::string &scalar_name, const int32_t scalar,
const std::vector<int32_t> &range, bool left_open_interval, bool right_open_interval);
} // namespace dataset
} // namespace mindspore

View File

@@ -28,6 +28,15 @@
namespace mindspore {
namespace dataset {
// Helper function to check that a float scalar is not NaN
Status CheckFloatScalarNotNan(const std::string &op_name, const std::string &scalar_name, float scalar);
// Helper function to check a positive float scalar
Status CheckFloatScalarPositive(const std::string &op_name, const std::string &scalar_name, float scalar);
// Helper function to check a positive int scalar
Status CheckIntScalarPositive(const std::string &op_name, const std::string &scalar_name, int32_t scalar);
// Helper function to check scalar is not equal to zero
template <typename T>
Status CheckScalarNotZero(const std::string &op_name, const std::string &scalar_name, const T scalar) {

View File

@@ -10,4 +10,5 @@ add_library(audio-kernels OBJECT
bandpass_biquad_op.cc
bandreject_biquad_op.cc
bass_biquad_op.cc
time_stretch_op.cc
)

View File

@@ -61,5 +61,325 @@ template Status AmplitudeToDB<float>(const std::shared_ptr<Tensor> &input, std::
float multiplier, float amin, float db_multiplier, float top_db);
template Status AmplitudeToDB<double>(const std::shared_ptr<Tensor> &input, std::shared_ptr<Tensor> *output,
double multiplier, double amin, double db_multiplier, double top_db);
/// \brief Generate linearly spaced vector.
/// \param[out] output - Tensor of n linearly spaced points; the spacing between points is (end - start) / (n - 1).
/// \param[in] start - Value of the start point.
/// \param[in] end - Value of the end point.
/// \param[in] n - Number of points in the output tensor.
/// \return Status return code
template <typename T>
Status Linespace(std::shared_ptr<Tensor> *output, T start, T end, int n) {
if (start > end) {
std::string err = "Linespace: input param end must be no less than start.";
RETURN_STATUS_UNEXPECTED(err);
}
TensorShape out_shape({n});
std::vector<T> linear_vect(n);
T interval = (end - start) / (n - 1);
for (size_t i = 0; i < linear_vect.size(); ++i) {
linear_vect[i] = start + i * interval;
}
std::shared_ptr<Tensor> out_t;
RETURN_IF_NOT_OK(Tensor::CreateFromVector(linear_vect, out_shape, &out_t));
linear_vect.clear();
linear_vect.shrink_to_fit();
*output = out_t;
return Status::OK();
}
/// \brief Calculate complex tensor angle
/// \param[in] input - Input tensor, must be complex, <channel, freq, time, complex=2>.
/// \param[out] output - Complex tensor angle.
/// \return Status return code
template <typename T>
Status ComplexAngle(const std::shared_ptr<Tensor> &input, std::shared_ptr<Tensor> *output) {
// check complex
if (!input->IsComplex()) {
std::string err_msg = "ComplexAngle: input tensor is not in shape of <..., 2>.";
MS_LOG(ERROR) << err_msg;
RETURN_STATUS_SYNTAX_ERROR(err_msg);
}
TensorShape input_shape = input->shape();
TensorShape out_shape({input_shape[0], input_shape[1], input_shape[2]});
std::vector<T> phase(input_shape[0] * input_shape[1] * input_shape[2]);
int ind = 0;
for (auto itr = input->begin<T>(); itr != input->end<T>(); itr++, ind++) {
auto x = (*itr);
itr++;
auto y = (*itr);
phase[ind] = atan2(y, x);
}
std::shared_ptr<Tensor> out_t;
RETURN_IF_NOT_OK(Tensor::CreateFromVector(phase, out_shape, &out_t));
phase.clear();
phase.shrink_to_fit();
*output = out_t;
return Status::OK();
}
/// \brief Calculate complex tensor abs
/// \param[in] input - Input tensor, must be complex, <channel, freq, time, complex=2>.
/// \param[out] output - Complex tensor abs.
/// \return Status return code
template <typename T>
Status ComplexAbs(const std::shared_ptr<Tensor> &input, std::shared_ptr<Tensor> *output) {
// check complex
if (!input->IsComplex()) {
std::string err_msg = "ComplexAngle: input tensor is not in shape of <..., 2>.";
MS_LOG(ERROR) << err_msg;
RETURN_STATUS_SYNTAX_ERROR(err_msg);
}
TensorShape input_shape = input->shape();
TensorShape out_shape({input_shape[0], input_shape[1], input_shape[2]});
std::vector<T> abs(input_shape[0] * input_shape[1] * input_shape[2]);
int ind = 0;
for (auto itr = input->begin<T>(); itr != input->end<T>(); itr++, ind++) {
T x = (*itr);
itr++;
T y = (*itr);
abs[ind] = sqrt(pow(y, 2) + pow(x, 2));
}
std::shared_ptr<Tensor> out_t;
RETURN_IF_NOT_OK(Tensor::CreateFromVector(abs, out_shape, &out_t));
*output = out_t;
return Status::OK();
}
/// \brief Reconstruct complex tensor from norm and angle
/// \param[in] abs - The absolute value of the complex tensor.
/// \param[in] angle - The angle of the complex tensor.
/// \param[out] output - Complex tensor, <channel, freq, time, complex=2>.
/// \return Status return code
template <typename T>
Status Polar(const std::shared_ptr<Tensor> &abs, const std::shared_ptr<Tensor> &angle,
std::shared_ptr<Tensor> *output) {
// check shape
if (abs->shape() != angle->shape()) {
std::string err_msg = "Polar: input shape of abs and angle must be same.";
MS_LOG(ERROR) << err_msg;
RETURN_STATUS_SYNTAX_ERROR(err_msg);
}
TensorShape input_shape = abs->shape();
TensorShape out_shape({input_shape[0], input_shape[1], input_shape[2], 2});
std::vector<T> complex_vec(input_shape[0] * input_shape[1] * input_shape[2] * 2);
int ind = 0;
auto itr_abs = abs->begin<T>();
auto itr_angle = angle->begin<T>();
for (; itr_abs != abs->end<T>(); itr_abs++, itr_angle++) {
complex_vec[ind++] = cos(*itr_angle) * (*itr_abs);
complex_vec[ind++] = sin(*itr_angle) * (*itr_abs);
}
std::shared_ptr<Tensor> out_t;
RETURN_IF_NOT_OK(Tensor::CreateFromVector(complex_vec, out_shape, &out_t));
*output = out_t;
return Status::OK();
}
/// \brief Pad complex tensor
/// \param[in] input - The complex tensor.
/// \param[in] length - The length of padding.
/// \param[in] dim - The dim index for padding.
/// \param[out] output - Complex tensor, <channel, freq, time, complex=2>.
/// \return Status return code
template <typename T>
Status PadComplexTensor(const std::shared_ptr<Tensor> &input, std::shared_ptr<Tensor> *output, int length, int dim) {
TensorShape input_shape = input->shape();
std::vector<int64_t> pad_shape_vec = {input_shape[0], input_shape[1], input_shape[2], input_shape[3]};
pad_shape_vec[dim] += length;
TensorShape input_shape_with_pad(pad_shape_vec);
std::vector<T> in_vect(input_shape_with_pad[0] * input_shape_with_pad[1] * input_shape_with_pad[2] *
input_shape_with_pad[3]);
auto itr_input = input->begin<T>();
int input_cnt = 0;
for (int ind = 0; ind < in_vect.size(); ind++) {
in_vect[ind] = (*itr_input);
input_cnt = (input_cnt + 1) % (input_shape[2] * input_shape[3]);
itr_input++;
// the last dim of a complex tensor equals 2, so fill 2 * length zeros per row
if (input_cnt == 0 && ind != 0) {
for (int c = 0; c < length * 2; c++) {
in_vect[++ind] = 0.0f;
}
}
}
std::shared_ptr<Tensor> out_t;
RETURN_IF_NOT_OK(Tensor::CreateFromVector(in_vect, input_shape_with_pad, &out_t));
*output = out_t;
return Status::OK();
}
/// \brief Calculate phase
/// \param[in] angle_0 - Angle of the spectrogram slice taken at the lower time steps.
/// \param[in] angle_1 - Angle of the spectrogram slice taken at the upper time steps.
/// \param[in] phase_advance - The phase advance.
/// \param[in] phase_time0 - The phase at time 0.
/// \param[out] output - Phase tensor.
/// \return Status return code
template <typename T>
Status Phase(const std::shared_ptr<Tensor> &angle_0, const std::shared_ptr<Tensor> &angle_1,
const std::shared_ptr<Tensor> &phase_advance, const std::shared_ptr<Tensor> &phase_time0,
std::shared_ptr<Tensor> *output) {
TensorShape phase_shape = angle_0->shape();
std::vector<T> phase(phase_shape[0] * phase_shape[1] * phase_shape[2]);
auto itr_angle_0 = angle_0->begin<T>();
auto itr_angle_1 = angle_1->begin<T>();
auto itr_pa = phase_advance->begin<T>();
for (int ind = 0, input_cnt = 0; itr_angle_0 != angle_0->end<T>(); itr_angle_0++, itr_angle_1++, ind++) {
if (ind != 0 && ind % phase_shape[2] == 0) {
itr_pa++;
if (itr_pa == phase_advance->end<T>()) {
itr_pa = phase_advance->begin<T>();
}
input_cnt++;
}
phase[ind] = (*itr_angle_1) - (*itr_angle_0) - (*itr_pa);
phase[ind] = phase[ind] - 2 * PI * round(phase[ind] / (2 * PI)) + (*itr_pa);
}
// concatenate the phase at time 0
int ind = 0;
auto itr_p0 = phase_time0->begin<T>();
phase.insert(phase.begin(), (*itr_p0));
while (itr_p0 != phase_time0->end<T>()) {
itr_p0++;
ind += phase_shape[2];
phase[ind] = (*itr_p0);
}
phase.erase(phase.begin() + static_cast<int>(angle_0->Size()), phase.end());
// calculate the cumulative phase
for (ind = 0; ind < phase.size(); ind++) {
if (ind % phase_shape[2] != 0) {
phase[ind] = phase[ind] + phase[ind - 1];
}
}
std::shared_ptr<Tensor> phase_tensor;
RETURN_IF_NOT_OK(Tensor::CreateFromVector(phase, phase_shape, &phase_tensor));
*output = phase_tensor;
return Status::OK();
}
/// \brief Calculate magnitude
/// \param[in] abs_0 - Magnitude of the spectrogram slice taken at the lower time steps.
/// \param[in] abs_1 - Magnitude of the spectrogram slice taken at the upper time steps.
/// \param[out] output - Magnitude tensor.
/// \param[in] alphas - Interpolation weights in [0, 1).
/// \return Status return code
template <typename T>
Status Mag(const std::shared_ptr<Tensor> &abs_0, const std::shared_ptr<Tensor> &abs_1, std::shared_ptr<Tensor> *output,
const std::vector<T> &alphas) {
TensorShape mag_shape = abs_0->shape();
std::vector<T> mag(mag_shape[0] * mag_shape[1] * mag_shape[2]);
auto itr_abs_0 = abs_0->begin<T>();
auto itr_abs_1 = abs_1->begin<T>();
for (int ind = 0; itr_abs_0 != abs_0->end<T>(); itr_abs_0++, itr_abs_1++, ind++) {
mag[ind] = alphas[ind % mag_shape[2]] * (*itr_abs_1) + (1 - alphas[ind % mag_shape[2]]) * (*itr_abs_0);
}
std::shared_ptr<Tensor> mag_tensor;
RETURN_IF_NOT_OK(Tensor::CreateFromVector(mag, mag_shape, &mag_tensor));
*output = mag_tensor;
return Status::OK();
}
template <typename T>
Status TimeStretch(std::shared_ptr<Tensor> input, std::shared_ptr<Tensor> *output, float rate,
std::shared_ptr<Tensor> phase_advance) {
// pack <..., freq, time, complex>
TensorShape input_shape = input->shape();
TensorShape toShape({input->Size() / (input_shape[-1] * input_shape[-2] * input_shape[-3]), input_shape[-3],
input_shape[-2], input_shape[-1]});
RETURN_IF_NOT_OK(input->Reshape(toShape));
if (rate == 1.0) {
*output = input;
return Status::OK();
}
// calculate time step and alphas
int ind = 0;
std::vector<dsize_t> time_steps_0, time_steps_1;
std::vector<T> alphas;
for (T val = 0;; ind++) {
val = ind * rate;
if (val >= input_shape[-2]) break;
int val_int = static_cast<int>(val);
time_steps_0.push_back(val_int);
time_steps_1.push_back(val_int + 1);
alphas.push_back(fmod(val, 1));
}
// calculate phase on time 0
std::shared_ptr<Tensor> spec_time0, phase_time0;
RETURN_IF_NOT_OK(
input->Slice(&spec_time0, std::vector<SliceOption>({SliceOption(true), SliceOption(true),
SliceOption(std::vector<dsize_t>{0}), SliceOption(true)})));
RETURN_IF_NOT_OK(ComplexAngle<T>(spec_time0, &phase_time0));
// time pad: add zero to time dim
RETURN_IF_NOT_OK(PadComplexTensor<T>(input, &input, 2, 2));
// slice
std::shared_ptr<Tensor> spec_0;
RETURN_IF_NOT_OK(input->Slice(&spec_0, std::vector<SliceOption>({SliceOption(true), SliceOption(true),
SliceOption(time_steps_0), SliceOption(true)})));
std::shared_ptr<Tensor> spec_1;
RETURN_IF_NOT_OK(input->Slice(&spec_1, std::vector<SliceOption>({SliceOption(true), SliceOption(true),
SliceOption(time_steps_1), SliceOption(true)})));
// new slices angle and abs <channel, freq, time>
std::shared_ptr<Tensor> angle_0, angle_1, abs_0, abs_1;
RETURN_IF_NOT_OK(ComplexAngle<T>(spec_0, &angle_0));
RETURN_IF_NOT_OK(ComplexAbs<T>(spec_0, &abs_0));
RETURN_IF_NOT_OK(ComplexAngle<T>(spec_1, &angle_1));
RETURN_IF_NOT_OK(ComplexAbs<T>(spec_1, &abs_1));
// calculate phase; there is some precision difference between MindSpore and PyTorch here
std::shared_ptr<Tensor> phase_tensor;
RETURN_IF_NOT_OK(Phase<T>(angle_0, angle_1, phase_advance, phase_time0, &phase_tensor));
// calculate magnitude
std::shared_ptr<Tensor> mag_tensor;
RETURN_IF_NOT_OK(Mag<T>(abs_0, abs_1, &mag_tensor, alphas));
// reconstruct complex from norm and angle
std::shared_ptr<Tensor> complex_spec_stretch;
RETURN_IF_NOT_OK(Polar<T>(mag_tensor, phase_tensor, &complex_spec_stretch));
// unpack
auto output_shape_vec = input_shape.AsVector();
output_shape_vec.pop_back();
output_shape_vec.pop_back();
output_shape_vec.push_back(complex_spec_stretch->shape()[-2]);
output_shape_vec.push_back(input_shape[-1]);
RETURN_IF_NOT_OK(complex_spec_stretch->Reshape(TensorShape(output_shape_vec)));
*output = complex_spec_stretch;
return Status::OK();
}
Status TimeStretch(std::shared_ptr<Tensor> input, std::shared_ptr<Tensor> *output, float rate, float hop_length,
float n_freq) {
std::shared_ptr<Tensor> phase_advance;
switch (input->type().value()) {
case DataType::DE_FLOAT32:
RETURN_IF_NOT_OK(Linespace<float>(&phase_advance, 0, PI * hop_length, n_freq));
RETURN_IF_NOT_OK(TimeStretch<float>(input, output, rate, phase_advance));
break;
case DataType::DE_FLOAT64:
RETURN_IF_NOT_OK(Linespace<double>(&phase_advance, 0, PI * hop_length, n_freq));
RETURN_IF_NOT_OK(TimeStretch<double>(input, output, rate, phase_advance));
break;
default:
RETURN_STATUS_UNEXPECTED(
"TimeStretch: unsupported type, currently supported types include "
"[float, double].");
}
return Status::OK();
}
} // namespace dataset
} // namespace mindspore
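Restated compactly, the helpers above implement a standard phase-vocoder update; in the notation below (derived from the code itself), with stretch rate $r$, expected per-bin phase advance $\omega_k$ (phase_advance, linearly spaced over $[0, \pi \cdot \text{hop\_length}]$), and spectrogram slices $S_0$, $S_1$ taken at time steps $\lfloor tr \rfloor$ and $\lfloor tr \rfloor + 1$, Mag and Phase compute

$\alpha_t = (tr) \bmod 1, \qquad |M_t| = (1 - \alpha_t)\,|S_0| + \alpha_t\,|S_1|$

$\phi_t = \phi_{t-1} + \omega_k + \operatorname{wrap}(\angle S_1 - \angle S_0 - \omega_k), \qquad \operatorname{wrap}(x) = x - 2\pi \operatorname{round}(x / 2\pi),$

with $\phi_0$ taken from the input's first frame, after which Polar reconstructs the stretched spectrogram as $|M_t|\,e^{i\phi_t}$.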

View File

@@ -176,6 +176,16 @@ Status LFilter(const std::shared_ptr<Tensor> &input, std::shared_ptr<Tensor> *ou
delete m_py;
return Status::OK();
}
/// \brief Stretch STFT in time at a given rate, without changing the pitch.
/// \param[in] input - Tensor of shape <..., freq, time, complex=2>.
/// \param[in] rate - Stretch factor.
/// \param[in] hop_length - Length of hop between STFT windows.
/// \param[in] n_freq - Number of filter banks from STFT.
/// \param[out] output - Tensor after stretch in time domain.
/// \return Status return code
Status TimeStretch(std::shared_ptr<Tensor> input, std::shared_ptr<Tensor> *output, float rate, float hop_length,
float n_freq);
} // namespace dataset
} // namespace mindspore
#endif // MINDSPORE_CCSRC_MINDDATA_DATASET_AUDIO_KERNELS_AUDIO_UTILS_H_
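A minimal calling sketch for the declaration above, assuming only the internal Tensor API already used elsewhere in this commit; the function name, shapes, and rate are arbitrary:

Status RunTimeStretchSketch() {
  std::shared_ptr<Tensor> input, output;
  // Dummy <channel=1, freq=201, time=30, complex=2> spectrogram filled with 0.5.
  RETURN_IF_NOT_OK(Tensor::CreateFromVector(std::vector<float>(1 * 201 * 30 * 2, 0.5f),
                                            TensorShape({1, 201, 30, 2}), &input));
  // rate=1.3 with hop_length=200 (= n_freq - 1) and n_freq=201;
  // the time dimension becomes ceil(30 / 1.3) = 24 frames.
  RETURN_IF_NOT_OK(TimeStretch(input, &output, 1.3f, 200.0f, 201.0f));
  return Status::OK();
}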

View File

@@ -0,0 +1,80 @@
/**
* Copyright 2021 Huawei Technologies Co., Ltd
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#include "minddata/dataset/audio/kernels/time_stretch_op.h"
#include <limits>
#include "minddata/dataset/audio/kernels/audio_utils.h"
#include "minddata/dataset/kernels/data/data_utils.h"
#include "minddata/dataset/util/status.h"
namespace mindspore {
namespace dataset {
const float TimeStretchOp::kHopLength = std::numeric_limits<float>::quiet_NaN();
const int TimeStretchOp::kNFreq = 201;
const float TimeStretchOp::kFixedRate = std::numeric_limits<float>::quiet_NaN();
Status TimeStretchOp::Compute(const std::shared_ptr<Tensor> &input, std::shared_ptr<Tensor> *output) {
// check and init
IO_CHECK(input, output);
// check shape
if (input->shape().Rank() < 3) {
std::string err_msg = "TimeStretch: input tensor shape is not <..., freq, num_frame, complex=2>.";
MS_LOG(ERROR) << err_msg;
RETURN_STATUS_SYNTAX_ERROR(err_msg);
}
// check complex
if (!input->IsComplex()) {
std::string err_msg = "TimeStretch: input tensor is not in shape of <..., 2>.";
MS_LOG(ERROR) << err_msg;
RETURN_STATUS_SYNTAX_ERROR(err_msg);
}
std::shared_ptr<Tensor> input_tensor;
float hop_length = std::isnan(hop_length_) ? (n_freq_ - 1) : hop_length_;
// typecast
CHECK_FAIL_RETURN_UNEXPECTED(input->type() != DataType::DE_STRING,
"TimeStretch: input tensor type should be [int, float, double], but got string.");
if (input->type() != DataType::DE_FLOAT64) {
RETURN_IF_NOT_OK(TypeCast(input, &input_tensor, DataType(DataType::DE_FLOAT32)));
} else {
input_tensor = input;
}
return TimeStretch(input_tensor, output, fixed_rate_, hop_length, n_freq_);
}
Status TimeStretchOp::OutputShape(const std::vector<TensorShape> &inputs, std::vector<TensorShape> &outputs) {
RETURN_IF_NOT_OK(TensorOp::OutputShape(inputs, outputs));
outputs.clear();
for (auto s : inputs) {
std::vector<dsize_t> s_vec = s.AsVector();
s_vec.pop_back();
s_vec.pop_back();
s_vec.push_back(std::ceil(s[-2] / fixed_rate_));
// push back complex
s_vec.push_back(2);
outputs.emplace_back(TensorShape(s_vec));
}
CHECK_FAIL_RETURN_UNEXPECTED(!outputs.empty(), "TimeStretch: invalid input shape.");
return Status::OK();
}
} // namespace dataset
} // namespace mindspore
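As a concrete check of the OutputShape arithmetic above: an input of shape <2, 1025, 300, 2> with fixed_rate = 1.3 keeps the leading dimensions, replaces the frame count with ceil(300 / 1.3) = ceil(230.77) = 231, and re-appends the complex dimension, giving <2, 1025, 231, 2>, which is the same shape the Python pipeline test at the end of this commit asserts.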

View File

@@ -0,0 +1,58 @@
/**
* Copyright 2021 Huawei Technologies Co., Ltd
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#ifndef MINDSPORE_CCSRC_MINDDATA_DATASET_AUDIO_KERNELS_TIME_STRETCH_OP_H_
#define MINDSPORE_CCSRC_MINDDATA_DATASET_AUDIO_KERNELS_TIME_STRETCH_OP_H_
#include <memory>
#include <string>
#include <utility>
#include <vector>
#include "minddata/dataset/core/tensor.h"
#include "minddata/dataset/kernels/tensor_op.h"
namespace mindspore {
namespace dataset {
class TimeStretchOp : public TensorOp {
public:
/// Default value
static const float kHopLength;
static const int kNFreq;
static const float kFixedRate;
explicit TimeStretchOp(float hop_length = kHopLength, int n_freq = kNFreq, float fixed_rate = kFixedRate)
: hop_length_(hop_length), n_freq_(n_freq), fixed_rate_(fixed_rate) {}
~TimeStretchOp() override = default;
Status Compute(const std::shared_ptr<Tensor> &input, std::shared_ptr<Tensor> *output) override;
std::string Name() const override { return kTimeStretchOp; }
/// \param[in] inputs - Vector of input tensor shapes.
/// \param[out] outputs - Vector of output tensor shapes, filled in by this function.
/// \return Status code
Status OutputShape(const std::vector<TensorShape> &inputs, std::vector<TensorShape> &outputs) override;
private:
float hop_length_;
int n_freq_;
float fixed_rate_;
};
} // namespace dataset
} // namespace mindspore
#endif // MINDSPORE_CCSRC_MINDDATA_DATASET_AUDIO_KERNELS_TIME_STRETCH_OP_H_

View File

@@ -306,6 +306,13 @@ class Tensor {
/// \return bool - true if tensor is not empty
bool HasData() const { return data_ != nullptr; }
/// Check if tensor is complex
/// \return bool - true if tensor is complex
bool IsComplex() const {
// check that the last dimension is 2 (real and imaginary parts)
return shape_[-1] == 2;
}
/// Reshape the tensor. The given shape should have the same number of elements in the Tensor
/// \param shape
virtual Status Reshape(const TensorShape &shape);

View File

@@ -186,6 +186,30 @@ class BassBiquad final : public TensorTransform {
struct Data;
std::shared_ptr<Data> data_;
};
/// \brief TimeStretch TensorTransform
/// \note Stretch STFT in time at a given rate, without changing the pitch.
class TimeStretch final : public TensorTransform {
public:
/// \brief Constructor.
/// \param[in] hop_length Length of hop between STFT windows. Default: None.
/// \param[in] n_freq Number of filter banks from STFT. Default: 201.
/// \param[in] fixed_rate Rate to speed up or slow down the input in time. Default: None.
explicit TimeStretch(float hop_length = std::numeric_limits<float>::quiet_NaN(), int n_freq = 201,
float fixed_rate = std::numeric_limits<float>::quiet_NaN());
/// \brief Destructor.
~TimeStretch() = default;
protected:
/// \brief Function to convert TensorTransform object into a TensorOperation object.
/// \return Shared pointer to TensorOperation object.
std::shared_ptr<TensorOperation> Parse() override;
private:
struct Data;
std::shared_ptr<Data> data_;
};
} // namespace audio
} // namespace dataset
} // namespace mindspore

View File

@@ -145,6 +145,7 @@ constexpr char kBandBiquadOp[] = "BandBiquadOp";
constexpr char kBandpassBiquadOp[] = "BandpassBiquadOp";
constexpr char kBandrejectBiquadOp[] = "BandrejectBiquadOp";
constexpr char kBassBiquadOp[] = "BassBiquadOp";
constexpr char kTimeStretchOp[] = "TimeStretchOp";
// data
constexpr char kConcatenateOp[] = "ConcatenateOp";

View File

@@ -22,7 +22,7 @@ import numpy as np
from ..transforms.c_transforms import TensorOperation
from .utils import ScaleType
from .validators import check_allpass_biquad, check_amplitude_to_db, check_band_biquad, check_bandpass_biquad, \
check_bandreject_biquad, check_bass_biquad, check_time_stretch
class AudioTensorOperation(TensorOperation):
@@ -249,3 +249,36 @@ class BassBiquad(AudioTensorOperation):
def parse(self):
return cde.BassBiquadOperation(self.sample_rate, self.gain, self.central_freq, self.Q)
class TimeStretch(AudioTensorOperation):
"""
Stretch STFT in time at a given rate, without changing the pitch.
Args:
hop_length (int, optional): Length of hop between STFT windows (default=None, will use n_fft // 2, where n_fft equals (n_freq - 1) * 2).
n_freq (int, optional): Number of filter banks from STFT (default=201).
fixed_rate (float, optional): Rate to speed up or slow down the input in time (default=None).
Examples:
>>> import mindspore.dataset.audio.transforms as audio
>>> freq = 44100
>>> num_frame = 30
>>> def gen():
... np.random.seed(0)
... data = np.random.random([freq, num_frame, 2])
... yield (np.array(data, dtype=np.float32), )
>>> data1 = ds.GeneratorDataset(source=gen, column_names=["multi_dimensional_data"])
>>> transforms = [audio.TimeStretch(fixed_rate=1.3)]
>>> data1 = data1.map(operations=transforms, input_columns=["multi_dimensional_data"])
"""
@check_time_stretch
def __init__(self, hop_length=None, n_freq=201, fixed_rate=None):
self.n_freq = n_freq
n_fft = (n_freq - 1) * 2
self.hop_length = hop_length if hop_length is not None else n_fft // 2
self.fixed_rate = fixed_rate if fixed_rate is not None else np.nan
def parse(self):
return cde.TimeStretchOperation(self.hop_length, self.n_freq, self.fixed_rate)
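Note that this Python default agrees with the kernel's NaN fallback: with the default n_freq = 201, n_fft = (201 - 1) * 2 = 400 and hop_length = 400 // 2 = 200, which equals the (n_freq_ - 1) value substituted in TimeStretchOp::Compute when hop_length_ arrives as NaN.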

View File

@@ -16,8 +16,8 @@
Validators for TensorOps.
"""
from functools import wraps
from mindspore.dataset.core.validator_helpers import check_not_zero, check_int32, check_float32, check_value, \
check_value_normalize_std, check_value_ratio, FLOAT_MAX_INTEGER, INT64_MAX, parse_user_args, type_check
from .utils import ScaleType
@@ -164,3 +164,25 @@ def check_bass_biquad(method):
return method(self, *args, **kwargs)
return new_method
def check_time_stretch(method):
"""Wrapper method to check the parameters of time_stretch."""
@wraps(method)
def new_method(self, *args, **kwargs):
[hop_length, n_freq, fixed_rate], _ = parse_user_args(method, *args, **kwargs)
# type check
type_check(hop_length, (int, type(None)), "hop_length")
type_check(n_freq, (int,), "n_freq")
type_check(fixed_rate, (int, float, type(None)), "fixed_rate")
# value check
if hop_length is not None:
check_value(hop_length, (1, INT64_MAX), "hop_length")
check_value(n_freq, (1, INT64_MAX), "n_freq")
if fixed_rate is not None:
check_value_ratio(fixed_rate, (0, FLOAT_MAX_INTEGER), "fixed_rate")
return method(self, *args, **kwargs)
return new_method

View File

@@ -13,6 +13,7 @@ SET(DE_UT_SRCS
buddy_test.cc
build_vocab_test.cc
c_api_audio_a_to_q_test.cc
c_api_audio_r_to_z_test.cc
c_api_cache_test.cc
c_api_dataset_album_test.cc

View File

@@ -0,0 +1,96 @@
/**
* Copyright 2021 Huawei Technologies Co., Ltd
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#include "common/common.h"
#include "minddata/dataset/core/tensor.h"
#include "minddata/dataset/include/dataset/datasets.h"
#include "minddata/dataset/include/dataset/audio.h"
using namespace mindspore::dataset;
using mindspore::LogStream;
using mindspore::ExceptionType::NoExceptionType;
using mindspore::MsLogLevel::INFO;
class MindDataTestPipeline : public UT::Common {
public:
};
TEST_F(MindDataTestPipeline, TestTimeStretchPipeline) {
MS_LOG(INFO) << "Doing test TimeStretchOp with custom param value. Pipeline.";
// op param
int freq = 1025;
int hop_length = 512;
float rate = 1.2;
// Original waveform
std::shared_ptr<SchemaObj> schema = Schema();
ASSERT_OK(schema->add_column("inputData", mindspore::DataType::kNumberTypeFloat32, {2, freq, 400, 2}));
std::shared_ptr<Dataset> ds = RandomData(50, schema);
EXPECT_NE(ds, nullptr);
ds = ds->SetNumWorkers(4);
EXPECT_NE(ds, nullptr);
auto TimeStretchOp = audio::TimeStretch(hop_length, freq, rate);
ds = ds->Map({TimeStretchOp});
EXPECT_NE(ds, nullptr);
// apply timestretch
std::shared_ptr<Iterator> iter = ds->CreateIterator();
EXPECT_NE(iter, nullptr);
std::unordered_map<std::string, mindspore::MSTensor> row;
ASSERT_OK(iter->GetNextRow(&row));
std::vector<int64_t> expected = {2, freq, int(std::ceil(400 / rate)), 2};
int i = 0;
while (row.size() != 0) {
auto col = row["inputData"];
ASSERT_EQ(col.Shape(), expected);
ASSERT_EQ(col.DataType(), mindspore::DataType::kNumberTypeFloat32);
ASSERT_OK(iter->GetNextRow(&row));
i++;
}
EXPECT_EQ(i, 50);
iter->Stop();
}
TEST_F(MindDataTestPipeline, TestTimeStretchPipelineWrongArgs) {
MS_LOG(INFO) << "Doing test TimeStretchOp with wrong param value. Pipeline.";
// op param
int freq = 1025;
int hop_length = 512;
float rate = -2;
// Original waveform
std::shared_ptr<SchemaObj> schema = Schema();
ASSERT_OK(schema->add_column("inputData", mindspore::DataType::kNumberTypeFloat32, {2, freq, 400, 2}));
std::shared_ptr<Dataset> ds = RandomData(50, schema);
EXPECT_NE(ds, nullptr);
ds = ds->SetNumWorkers(4);
EXPECT_NE(ds, nullptr);
auto TimeStretchOp = audio::TimeStretch(hop_length, freq, rate);
ds = ds->Map({TimeStretchOp});
EXPECT_NE(ds, nullptr);
// apply timestretch
std::shared_ptr<Iterator> iter = ds->CreateIterator();
// Expect failure
EXPECT_EQ(iter, nullptr);
}

View File

@@ -19,6 +19,7 @@
#include "minddata/dataset/include/dataset/audio.h"
#include "minddata/dataset/include/dataset/execute.h"
#include "minddata/dataset/include/dataset/transforms.h"
#include "minddata/dataset/include/dataset/audio.h"
#include "minddata/dataset/include/dataset/vision.h"
#include "minddata/dataset/include/dataset/audio.h"
#include "minddata/dataset/include/dataset/text.h"
@@ -196,6 +197,65 @@ TEST_F(MindDataTestExecute, TestCrop) {
EXPECT_EQ(image.Shape()[1], 15);
}
TEST_F(MindDataTestExecute, TestTimeStretchEager) {
MS_LOG(INFO) << "Doing test TimeStretchOp with custom param value. Eager.";
std::shared_ptr<Tensor> input_tensor_;
// op param
int freq = 4;
int hop_length = 20;
float rate = 1.3;
int frame_num = 10;
// create tensor
TensorShape s = TensorShape({2, freq, frame_num, 2});
// init input vec
std::vector<float> input_vec(2 * freq * frame_num * 2);
for (int ind = 0; ind < input_vec.size(); ind++) {
input_vec[ind] = std::rand() % (1000) / (1000.0f);
}
ASSERT_OK(Tensor::CreateFromVector(input_vec, s, &input_tensor_));
auto input_ms = mindspore::MSTensor(std::make_shared<mindspore::dataset::DETensor>(input_tensor_));
std::shared_ptr<TensorTransform> time_stretch_op = std::make_shared<audio::TimeStretch>(hop_length, freq, rate);
// apply timestretch
mindspore::dataset::Execute Transform({time_stretch_op});
Status status = Transform(input_ms, &input_ms);
EXPECT_TRUE(status.IsOk());
}
TEST_F(MindDataTestExecute, TestTimeStretchParamCheck1) {
MS_LOG(INFO) << "Doing MindDataTestTimeStretch-TestTimeStretchParamCheck with invalid parameters.";
// Create an input
std::shared_ptr<Tensor> input_tensor_;
std::shared_ptr<Tensor> output_tensor;
TensorShape s = TensorShape({1, 4, 3, 2});
ASSERT_OK(Tensor::CreateFromVector(
std::vector<float>({1.0f, 2.0f, 3.0f, 4.0f, 5.0f, 6.0f, 6.0f, 5.0f, 4.0f, 3.0f, 2.0f, 1.0f,
1.0f, 2.0f, 3.0f, 4.0f, 5.0f, 6.0f, 6.0f, 5.0f, 4.0f, 3.0f, 2.0f, 1.0f}),
s, &input_tensor_));
auto input_ms = mindspore::MSTensor(std::make_shared<mindspore::dataset::DETensor>(input_tensor_));
std::shared_ptr<TensorTransform> timestretch = std::make_shared<audio::TimeStretch>(4, 512, -2);
mindspore::dataset::Execute Transform({timestretch});
Status status = Transform(input_ms, &input_ms);
EXPECT_FALSE(status.IsOk());
}
TEST_F(MindDataTestExecute, TestTimeStretchParamCheck2) {
MS_LOG(INFO) << "Doing MindDataTestTimeStretch-TestTimeStretchParamCheck with invalid parameters.";
// Create an input
std::shared_ptr<Tensor> input_tensor_;
std::shared_ptr<Tensor> output_tensor;
TensorShape s = TensorShape({1, 4, 3, 2});
ASSERT_OK(Tensor::CreateFromVector(
std::vector<float>({1.0f, 2.0f, 3.0f, 4.0f, 5.0f, 6.0f, 6.0f, 5.0f, 4.0f, 3.0f, 2.0f, 1.0f,
1.0f, 2.0f, 3.0f, 4.0f, 5.0f, 6.0f, 6.0f, 5.0f, 4.0f, 3.0f, 2.0f, 1.0f}),
s, &input_tensor_));
auto input_ms = mindspore::MSTensor(std::make_shared<mindspore::dataset::DETensor>(input_tensor_));
std::shared_ptr<TensorTransform> timestretch = std::make_shared<audio::TimeStretch>(4, -512, 2);
mindspore::dataset::Execute Transform({timestretch});
Status status = Transform(input_ms, &input_ms);
EXPECT_FALSE(status.IsOk());
}
TEST_F(MindDataTestExecute, TestTransformInput1) {
MS_LOG(INFO) << "Doing MindDataTestExecute-TestTransformInput1.";
// Test Execute with transform op input using API constructors, with std::shared_ptr<TensorTransform pointers,

View File

@@ -0,0 +1,142 @@
# Copyright 2021 Huawei Technologies Co., Ltd
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================
"""
Testing TimeStretch op in DE
"""
import numpy as np
import pytest
import mindspore.dataset as ds
import mindspore.dataset.audio.transforms as c_audio
from mindspore import log as logger
CHANNEL_NUM = 2
FREQ = 1025
FRAME_NUM = 300
COMPLEX = 2
def gen(shape):
np.random.seed(0)
data = np.random.random(shape)
yield (np.array(data, dtype=np.float32),)
def _count_unequal_element(data_expected, data_me, rtol, atol):
assert data_expected.shape == data_me.shape
total_count = len(data_expected.flatten())
error = np.abs(data_expected - data_me)
greater = np.greater(error, atol + np.abs(data_expected) * rtol)
loss_count = np.count_nonzero(greater)
assert (loss_count / total_count) < rtol, \
"\ndata_expected_std:{0}\ndata_me_error:{1}\nloss:{2}". \
format(data_expected[greater], data_me[greater], error[greater])
def allclose_nparray(data_expected, data_me, rtol, atol, equal_nan=True):
if np.any(np.isnan(data_expected)):
assert np.allclose(data_me, data_expected, rtol, atol, equal_nan=equal_nan)
elif not np.allclose(data_me, data_expected, rtol, atol, equal_nan=equal_nan):
_count_unequal_element(data_expected, data_me, rtol, atol)
else:
assert True
def test_time_stretch_pipeline():
"""
Test TimeStretch op. Pipeline.
"""
logger.info("test TimeStretch op")
generator = gen([CHANNEL_NUM, FREQ, FRAME_NUM, COMPLEX])
data1 = ds.GeneratorDataset(source=generator, column_names=[
"multi_dimensional_data"])
transforms = [
c_audio.TimeStretch(512, FREQ, 1.3)
]
data1 = data1.map(operations=transforms, input_columns=[
"multi_dimensional_data"])
for item in data1.create_dict_iterator(num_epochs=1, output_numpy=True):
out_put = item["multi_dimensional_data"]
assert out_put.shape == (CHANNEL_NUM, FREQ, np.ceil(FRAME_NUM/1.3), COMPLEX)
def test_time_stretch_pipeline_invalid_param():
"""
Test TimeStretch op. Set invalid param. Pipeline.
"""
logger.info("test TimeStretch op with invalid values")
generator = gen([CHANNEL_NUM, FREQ, FRAME_NUM, COMPLEX])
data1 = ds.GeneratorDataset(source=generator, column_names=[
"multi_dimensional_data"])
with pytest.raises(ValueError, match=r"Input fixed_rate is not within the required interval of \(0, 16777216\]."):
transforms = [
c_audio.TimeStretch(512, FREQ, -1.3)
]
data1 = data1.map(operations=transforms, input_columns=[
"multi_dimensional_data"])
for item in data1.create_dict_iterator(num_epochs=1, output_numpy=True):
out_put = item["multi_dimensional_data"]
assert out_put.shape == (CHANNEL_NUM, FREQ, np.ceil(FRAME_NUM/1.3), COMPLEX)
def test_time_stretch_eager():
"""
Test TimeStretch op. Set param. Eager.
"""
logger.info("test TimeStretch op with customized parameter values")
spectrogram = next(gen([CHANNEL_NUM, FREQ, FRAME_NUM, COMPLEX]))[0]
out_put = c_audio.TimeStretch(512, FREQ, 1.3)(spectrogram)
assert out_put.shape == (CHANNEL_NUM, FREQ, np.ceil(FRAME_NUM/1.3), COMPLEX)
def test_precision_time_stretch_eager():
"""
Test TimeStretch op. Compare precision. Eager.
"""
logger.info("test TimeStretch op with default values")
spectrogram = np.array([[[[1.0402449369430542, 0.3807601034641266],
[-1.120057225227356, -0.12819576263427734],
[1.4303032159805298, -0.08839055150747299]],
[[1.4198592901229858, 0.6900091767311096],
[-1.8593409061431885, 0.16363371908664703],
[-2.3349387645721436, -1.4366451501846313]]],
[[[-0.7083967328071594, 0.9325454831123352],
[-1.9133838415145874, 0.011225821450352669],
[1.477278232574463, -1.0551637411117554]],
[[-0.6668586134910583, -0.23143270611763],
[-2.4390718936920166, 0.17638640105724335],
[-0.4795735776424408, 0.1345423310995102]]]]).astype(np.float64)
out_expect = np.array([[[[1.0402449369430542, 0.3807601034641266],
[-1.302264928817749, -0.1490504890680313]],
[[1.4198592901229858, 0.6900091767311096],
[-2.382312774658203, 0.2096325159072876]]],
[[[-0.7083966732025146, 0.9325454831123352],
[-1.8545820713043213, 0.010880803689360619]],
[[-0.6668586134910583, -0.23143276572227478],
[-1.2737033367156982, 0.09211209416389465]]]]).astype(np.float64)
out_ms = c_audio.TimeStretch(64, 2, 1.6)(spectrogram)
allclose_nparray(out_ms, out_expect, 0.001, 0.001)
if __name__ == '__main__':
test_time_stretch_pipeline()
test_time_stretch_pipeline_invalid_param()
test_time_stretch_eager()
test_precision_time_stretch_eager()