[WIP]: Move k2.Fsa to C++ #814

Merged (34 commits, Sep 30, 2021)
Commits
f48563b
Make k2 ragged tensor more PyTorch-y like.
csukuangfj Aug 25, 2021
06a6d20
Refactoring: Start to add the wrapper class AnyTensor.
csukuangfj Aug 26, 2021
2a70298
Refactoring.
csukuangfj Aug 26, 2021
6bc05bf
initial attempt to support autograd.
csukuangfj Aug 26, 2021
c7bb9d5
First working version with autograd for Sum().
csukuangfj Aug 27, 2021
d569b42
Fix comments.
csukuangfj Aug 27, 2021
dcea808
Support __getitem__ and pickling.
csukuangfj Aug 27, 2021
cb4f00f
Add more docs for k2.ragged.Tensor
csukuangfj Aug 27, 2021
1b5c015
Put documentation in header files.
csukuangfj Aug 28, 2021
a8d4a8e
Minor fixes.
csukuangfj Aug 28, 2021
1f78c93
Fix a typo.
csukuangfj Aug 28, 2021
892fb04
Fix an error.
csukuangfj Aug 28, 2021
fb96d97
Add more doc.
csukuangfj Aug 28, 2021
2f01361
Wrap RaggedShape.
csukuangfj Aug 29, 2021
626cc7a
[Not for Merge]: Move k2.Fsa related code to C++.
csukuangfj Aug 29, 2021
0e60a69
Merge remote-tracking branch 'dan/master' into fsa
csukuangfj Sep 8, 2021
f11947e
Remove extra files.
csukuangfj Sep 8, 2021
9ac1e78
Update doc URL. (#821)
csukuangfj Sep 8, 2021
44ff35b
Merge remote-tracking branch 'dan/master' into fsa
csukuangfj Sep 12, 2021
1dc7e1e
Support manipulating attributes of k2.ragged.Fsa.
csukuangfj Sep 12, 2021
bbe0ded
Support indexing 2-axes RaggedTensor, Support slicing for RaggedTenso…
pkufool Sep 14, 2021
2c28070
Prune with max_arcs in IntersectDense (#820)
pkufool Sep 14, 2021
210175c
Release v1.8
pkufool Sep 14, 2021
33a212c
Create a ragged tensor from a regular tensor. (#827)
csukuangfj Sep 15, 2021
971af7d
Trigger GitHub actions manually. (#829)
csukuangfj Sep 16, 2021
646704e
Run GitHub actions on merging. (#830)
csukuangfj Sep 16, 2021
8030001
Support printing ragged tensors in a more compact way. (#831)
csukuangfj Sep 17, 2021
7029b1f
Merge remote-tracking branch 'dan/master' into fsa
csukuangfj Sep 18, 2021
d73a5b5
Add levenshtein alignment (#828)
pkufool Sep 19, 2021
f2fd997
Release v1.9
pkufool Sep 19, 2021
b2cb9c0
Add Fsa.get_forward_scores.
csukuangfj Sep 19, 2021
13408aa
Merge remote-tracking branch 'dan/master' into fsa
csukuangfj Sep 19, 2021
cbff6a1
Implement backprop for Fsa.get_forward_scores()
csukuangfj Sep 19, 2021
cca7a54
Construct RaggedArc from unary function tensor (#30)
pkufool Sep 30, 2021
4 changes: 3 additions & 1 deletion k2/python/csrc/torch/CMakeLists.txt
@@ -11,10 +11,12 @@ set(torch_srcs
ragged_ops.cu
torch_util.cu

- v2/k2.cu
v2/any.cu
v2/doc/doc.cu
+ v2/fsa.cu
+ v2/k2.cu
v2/ragged_any.cu
+ v2/ragged_arc.cu
v2/ragged_shape.cu
)

69 changes: 38 additions & 31 deletions k2/python/csrc/torch/v2/any.cu
@@ -83,19 +83,19 @@ void PybindRaggedAny(py::module &m) {
any.def(
"clone",
[](const RaggedAny &self) -> RaggedAny {
- DeviceGuard guard(self.any_.Context());
+ DeviceGuard guard(self.any.Context());
return self.Clone();
},
kRaggedAnyCloneDoc);

any.def(
"__eq__",
[](const RaggedAny &self, const RaggedAny &other) -> bool {
- DeviceGuard guard(self.any_.Context());
- Dtype t = self.any_.GetDtype();
+ DeviceGuard guard(self.any.Context());
+ Dtype t = self.any.GetDtype();
bool ans = false;
FOR_REAL_AND_INT32_TYPES(t, T, {
- ans = Equal<T>(self.any_.Specialize<T>(), other.any_.Specialize<T>());
+ ans = Equal<T>(self.any.Specialize<T>(), other.any.Specialize<T>());
});
return ans;
},
@@ -104,12 +104,11 @@ void PybindRaggedAny(py::module &m) {
any.def(
"__ne__",
[](const RaggedAny &self, const RaggedAny &other) -> bool {
- DeviceGuard guard(self.any_.Context());
- Dtype t = self.any_.GetDtype();
+ DeviceGuard guard(self.any.Context());
+ Dtype t = self.any.GetDtype();
bool ans = false;
FOR_REAL_AND_INT32_TYPES(t, T, {
- ans =
- !Equal<T>(self.any_.Specialize<T>(), other.any_.Specialize<T>());
+ ans = !Equal<T>(self.any.Specialize<T>(), other.any.Specialize<T>());
});
return ans;
},
@@ -124,37 +123,37 @@ void PybindRaggedAny(py::module &m) {
any.def(
"numel",
[](RaggedAny &self) -> int32_t {
- DeviceGuard guard(self.any_.Context());
- return self.any_.NumElements();
+ DeviceGuard guard(self.any.Context());
+ return self.any.NumElements();
},
kRaggedAnyNumelDoc);

any.def(
"tot_size",
[](const RaggedAny &self, int32_t axis) -> int32_t {
- DeviceGuard guard(self.any_.Context());
- return self.any_.TotSize(axis);
+ DeviceGuard guard(self.any.Context());
+ return self.any.TotSize(axis);
},
py::arg("axis"), kRaggedAnyTotSizeDoc);

any.def(py::pickle(
[](const RaggedAny &self) -> py::tuple {
- DeviceGuard guard(self.any_.Context());
- K2_CHECK(self.any_.NumAxes() == 2 || self.any_.NumAxes() == 3)
+ DeviceGuard guard(self.any.Context());
+ K2_CHECK(self.any.NumAxes() == 2 || self.any.NumAxes() == 3)
<< "Only support Ragged with NumAxes() == 2 or 3 for now, given "
- << self.any_.NumAxes();
- Array1<int32_t> row_splits1 = self.any_.RowSplits(1);
- Dtype t = self.any_.GetDtype();
+ << self.any.NumAxes();
+ Array1<int32_t> row_splits1 = self.any.RowSplits(1);
+ Dtype t = self.any.GetDtype();

FOR_REAL_AND_INT32_TYPES(t, T, {
- auto values = self.any_.Specialize<T>().values;
+ auto values = self.any.Specialize<T>().values;
// We use "row_ids" placeholder here to make it compatible for the
// old format file.
- if (self.any_.NumAxes() == 2) {
+ if (self.any.NumAxes() == 2) {
return py::make_tuple(ToTorch(row_splits1), "row_ids1",
ToTorch(values));
} else {
- Array1<int32_t> row_splits2 = self.any_.RowSplits(2);
+ Array1<int32_t> row_splits2 = self.any.RowSplits(2);
return py::make_tuple(ToTorch(row_splits1), "row_ids1",
ToTorch(row_splits2), "row_ids2",
ToTorch(values));
@@ -213,7 +212,7 @@ void PybindRaggedAny(py::module &m) {
any.def_property_readonly(
"dtype",
[](const RaggedAny &self) -> py::object {
- Dtype t = self.any_.GetDtype();
+ Dtype t = self.any.GetDtype();
auto torch = py::module::import("torch");
switch (t) {
case kFloatDtype:
@@ -234,10 +233,10 @@ void PybindRaggedAny(py::module &m) {
any.def_property_readonly(
"device",
[](const RaggedAny &self) -> py::object {
- DeviceType d = self.any_.Context()->GetDeviceType();
+ DeviceType d = self.any.Context()->GetDeviceType();
torch::DeviceType device_type = ToTorchDeviceType(d);

- torch::Device device(device_type, self.any_.Context()->GetDeviceId());
+ torch::Device device(device_type, self.any.Context()->GetDeviceId());

PyObject *ptr = THPDevice_New(device);

@@ -251,22 +250,23 @@ void PybindRaggedAny(py::module &m) {
any.def_property_readonly(
"data",
[](RaggedAny &self) -> torch::Tensor {
- Dtype t = self.any_.GetDtype();
+ Dtype t = self.any.GetDtype();
FOR_REAL_AND_INT32_TYPES(
- t, T, { return ToTorch(self.any_.values.Specialize<T>()); });
+ t, T, { return ToTorch(self.any.values.Specialize<T>()); });

// Unreachable code
return {};
},
kRaggedAnyDataDoc);

any.def_property_readonly(
"shape", [](RaggedAny &self) -> RaggedShape { return self.any_.shape; });
"shape", [](RaggedAny &self) -> RaggedShape { return self.any.shape; },
"Return the ``Shape`` of this tensor.");

any.def_property_readonly(
"grad",
[](RaggedAny &self) -> torch::optional<torch::Tensor> {
- if (!self.data_.defined()) return {};
+ if (!self.data.defined()) return {};

return self.Data().grad();
},
Expand All @@ -275,7 +275,7 @@ void PybindRaggedAny(py::module &m) {
any.def_property(
"requires_grad",
[](RaggedAny &self) -> bool {
- if (!self.data_.defined()) return false;
+ if (!self.data.defined()) return false;

return self.Data().requires_grad();
},
@@ -287,19 +287,19 @@ void PybindRaggedAny(py::module &m) {
any.def_property_readonly(
"is_cuda",
[](RaggedAny &self) -> bool {
- return self.any_.Context()->GetDeviceType() == kCuda;
+ return self.any.Context()->GetDeviceType() == kCuda;
},
kRaggedAnyIsCudaDoc);

// NumAxes() does not access GPU memory
any.def_property_readonly(
"num_axes",
- [](const RaggedAny &self) -> int32_t { return self.any_.NumAxes(); },
+ [](const RaggedAny &self) -> int32_t { return self.any.NumAxes(); },
kRaggedAnyNumAxesDoc);

// Dim0() does not access GPU memory
any.def_property_readonly(
"dim0", [](const RaggedAny &self) -> int32_t { return self.any_.Dim0(); },
"dim0", [](const RaggedAny &self) -> int32_t { return self.any.Dim0(); },
kRaggedAnyDim0Doc);

//==================================================
@@ -313,6 +313,13 @@ void PybindRaggedAny(py::module &m) {
return RaggedAny(data, dtype);
},
py::arg("data"), py::arg("dtype") = py::none(), kRaggedAnyInitDataDoc);

+ m.def(
+     "create_tensor",
+     [](const std::string &s, py::object dtype = py::none()) -> RaggedAny {
+       return RaggedAny(s, dtype);
+     },
+     py::arg("s"), py::arg("dtype") = py::none(), kRaggedAnyInitStrDoc);
}

} // namespace k2
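For orientation while reading these bindings: `self.any` and `self.data` are members of the RaggedAny wrapper (this PR renames them from `any_` and `data_`). The wrapper's declaration is not part of this diff; based only on the members used above, it looks roughly like the following hedged reconstruction (the header path and exact member types are assumptions):

// Hedged reconstruction, not the actual declaration (which presumably lives
// in k2/python/csrc/torch/v2/ragged_any.h): RaggedAny pairs a dtype-erased
// k2 ragged tensor with a torch::Tensor view of its values so that PyTorch
// autograd can track operations on it.
struct RaggedAny {
  Ragged<Any> any;     // the underlying ragged tensor: values plus shape
  torch::Tensor data;  // torch view of any.values, created lazily for autograd

  torch::Tensor &Data();    // returns `data`, creating it on first access
  RaggedAny Clone() const;  // deep copy on the same device

  // constructors and operations (Sum, indexing, pickling, ...) omitted
};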
81 changes: 81 additions & 0 deletions k2/python/csrc/torch/v2/autograd/arc_sort.h
@@ -0,0 +1,81 @@
/**
* @brief A wrapper around k2::ArcSort to support autograd
*
* @copyright
* Copyright 2021 Xiaomi Corp. (authors: Fangjun Kuang)
*
* @copyright
* See LICENSE for clarification regarding multiple authors
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/

#ifndef K2_PYTHON_CSRC_TORCH_V2_AUTOGRAD_ARC_SORT_H
#define K2_PYTHON_CSRC_TORCH_V2_AUTOGRAD_ARC_SORT_H

#include "k2/csrc/fsa_algo.h"
#include "k2/csrc/ragged_ops.h"
#include "k2/csrc/tensor.h"
#include "k2/csrc/tensor_ops.h"
#include "k2/python/csrc/torch/torch_util.h"
#include "k2/python/csrc/torch/v2/ragged_arc.h"

using namespace torch::autograd;

namespace k2 {

// see https://pytorch.org/tutorials/advanced/cpp_autograd
class ArcSortFunction : public torch::autograd::Function<ArcSortFunction> {
Review comment from csukuangfj (Collaborator, Author): This is how we do backprop for ArcSort.

Reply from a collaborator: Ah OK, cool.

public:
/* ArcSort an Fsa. It is a wrapper around k2::ArcSort, supporting autograd.


@param ragged The input Fsa.
@param dummy Its purpose is to make autograd track the operations on
the input `ragged`. It is the same as `ragged.scores`.
@param out The output Fsa.

@return Return a 1-D unused tensor, which is out->scores.
*/
static torch::Tensor forward(AutogradContext *ctx,
/*const*/ RaggedArc &ragged,
torch::Tensor /*dummy*/, RaggedArc *out) {
Array1<int32_t> arc_map;
ArcSort(ragged.fsa, &out->fsa, &arc_map);

ctx->save_for_backward({ToTorch(arc_map)});

return out->Scores();
}

static tensor_list backward(AutogradContext *ctx, tensor_list grad_outputs) {
auto saved = ctx->get_saved_variables();
torch::Tensor arc_map_tensor = saved[0];
Array1<int32_t> arc_map = FromTorch<int32_t>(arc_map_tensor);
torch::Tensor grad_output_tensor = grad_outputs[0];
Tensor grad_output = FromTorch(grad_output_tensor, TensorTag{});

Tensor ans = Index(grad_output, arc_map, /*allow_minus_one*/ false,
/*default_value*/ 0);

return {
torch::Tensor(), // ragged
ToTorch(ans), // dummy
torch::Tensor() // out
};
}
};

} // namespace k2

#endif // K2_PYTHON_CSRC_TORCH_V2_AUTOGRAD_ARC_SORT_H
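To see how such a Function is meant to be invoked, here is a hedged caller-side sketch; the real RaggedArc::ArcSort lives in ragged_arc.cu and is not part of this diff, so its exact signature is an assumption. The point is that passing Scores() as the "dummy" tensor makes autograd treat arc-sorting as an operation on the input scores, so gradients of out.Scores() flow back to the input through ArcSortFunction::backward via the saved arc_map.

// Hypothetical sketch only, modeled on the torch C++ autograd tutorial's
// Function::apply pattern; not the actual k2 implementation.
RaggedArc RaggedArc::ArcSort() /*const*/ {
  RaggedArc out;
  // forward() fills `out` and returns out.Scores(); the caller only needs
  // the side effect, so the returned tensor is discarded.
  (void)ArcSortFunction::apply(*this, Scores(), &out);
  return out;
}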
15 changes: 7 additions & 8 deletions k2/python/csrc/torch/v2/autograd/sum.h
@@ -41,7 +41,7 @@ class SumFunction : public torch::autograd::Function<SumFunction> {

@param ragged The input RaggedAny
@param dummy Its purpose is to make autograd to track the operations on
- the input `ragged`. It is the same as `ragged.data_`.
+ the input `ragged`. It is the same as `ragged.data`.
@param initial_value This value is added to the sum of each sublist,
so when a sublist is empty, its sum is this value.

@@ -50,21 +50,20 @@ class SumFunction : public torch::autograd::Function<SumFunction> {
*/
static torch::Tensor forward(AutogradContext *ctx, const RaggedAny &ragged,
torch::Tensor /*dummy*/, float initial_value) {
ctx->saved_data["n"] = ragged.any_.values.Dim();
ctx->saved_data["n"] = ragged.any.values.Dim();

- int32_t num_axes = ragged.any_.NumAxes();
+ int32_t num_axes = ragged.any.NumAxes();

torch::Tensor row_ids =
- ToTorch(const_cast<RaggedAny &>(ragged).any_.RowIds(num_axes - 1));
+ ToTorch(const_cast<RaggedAny &>(ragged).any.RowIds(num_axes - 1));

ctx->save_for_backward({row_ids});

- Dtype t = ragged.any_.GetDtype();
+ Dtype t = ragged.any.GetDtype();

FOR_REAL_AND_INT32_TYPES(t, T, {
- Array1<T> values(ragged.any_.Context(),
- ragged.any_.TotSize(num_axes - 2));
- SumPerSublist<T>(ragged.any_.Specialize<T>(), initial_value, &values);
+ Array1<T> values(ragged.any.Context(), ragged.any.TotSize(num_axes - 2));
+ SumPerSublist<T>(ragged.any.Specialize<T>(), initial_value, &values);
return ToTorch(values);
});

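The matching backward pass is outside the lines shown in this hunk. Conceptually, each input element inherits the gradient of the sublist it was summed into, looked up via the row_ids saved in forward(). A minimal sketch of that idea (an assumption about naming and layout, not the code actually in sum.h):

// Hedged sketch only; the real backward in sum.h may differ in detail.
static tensor_list backward(AutogradContext *ctx, tensor_list grad_outputs) {
  auto saved = ctx->get_saved_variables();
  torch::Tensor row_ids = saved[0];  // maps element index -> sublist index

  // grad_in[i] = grad_output[row_ids[i]]: every element of a sublist gets
  // that sublist's gradient; there is one such value per input element.
  torch::Tensor grad_in =
      grad_outputs[0].index_select(0, row_ids.to(torch::kLong));

  return {
      torch::Tensor(),  // ragged: not a tensor, no gradient
      grad_in,          // dummy, i.e. ragged.data
      torch::Tensor()   // initial_value: no gradient
  };
}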
68 changes: 68 additions & 0 deletions k2/python/csrc/torch/v2/fsa.cu
@@ -0,0 +1,68 @@
/**
* @brief python wrapper for Ragged<Arc>
*
* @copyright
* Copyright 2021 Xiaomi Corp. (authors: Fangjun Kuang)
*
* @copyright
* See LICENSE for clarification regarding multiple authors
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/

#include "k2/csrc/ragged.h"
#include "k2/python/csrc/torch/v2/fsa.h"
#include "k2/python/csrc/torch/v2/ragged_arc.h"

namespace k2 {

void PybindRaggedArc(py::module &m) {
py::class_<RaggedArc> fsa(m, "Fsa");
fsa.def(py::init<>());

fsa.def(py::init<const std::string &, py::list>(), py::arg("s"),
py::arg("extra_label_names") = py::none());
fsa.def("__str__", &RaggedArc::ToString);
fsa.def("__repr__", &RaggedArc::ToString);

fsa.def("requires_grad_", &RaggedArc::SetRequiresGrad,
py::arg("requires_grad") = true);

fsa.def("arc_sort", &RaggedArc::ArcSort);

fsa.def_property(
"scores", [](RaggedArc &self) -> torch::Tensor { return self.Scores(); },
[](RaggedArc &self, torch::Tensor scores) {
self.Scores().copy_(scores);
});

fsa.def_property_readonly(
"grad", [](RaggedArc &self) -> torch::optional<torch::Tensor> {
if (!self.scores.defined()) return {};

return self.Scores().grad();
});

fsa.def_property(
"requires_grad",
[](RaggedArc &self) -> bool {
if (!self.scores.defined()) return false;

return self.Scores().requires_grad();
},
[](RaggedArc &self, bool requires_grad) -> void {
self.SetRequiresGrad(requires_grad);
});
}

} // namespace k2
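Both requires_grad_ and the requires_grad property setter above forward to RaggedArc::SetRequiresGrad, whose body is not part of this diff. Presumably it just toggles the autograd flag on the underlying scores tensor; a hedged sketch of that idea (return type and chaining are assumptions, modeled on torch.Tensor.requires_grad_):

// Hedged sketch; the actual implementation lives in ragged_arc.cu and is not
// shown here. Marking the scores tensor as requiring grad is what lets the
// autograd Functions above (e.g. ArcSortFunction) record operations on it.
RaggedArc &RaggedArc::SetRequiresGrad(bool requires_grad /*= true*/) {
  Scores().requires_grad_(requires_grad);
  return *this;
}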