@@ -24,6 +24,7 @@
 from tvm.relax.dpl import is_op, rewrite_call, wildcard, has_target

 from ..transform import function_pass
+from tvm.topi.utils import prod, swap


 @function_pass(opt_level=0)
@@ -35,10 +36,21 @@ class DispatchOps:
     def __init__(self):
         self.input = wildcard()
         # cumsum on cpu will be legalized
+        self.cumsum_cpu = is_op("relax.cumsum")(self.input) & has_target("llvm")
         self.cumsum_gpu = is_op("relax.cumsum")(self.input) & has_target("cuda")
-        self.sort_gpu = is_op("relax.sort")(self.input) & has_target("cuda")
         self.sort_cpu = is_op("relax.sort")(self.input) & has_target("llvm")
-        self.pattern = self.cumsum_gpu | self.sort_gpu | self.sort_cpu
+        self.sort_gpu = is_op("relax.sort")(self.input) & has_target("cuda")
+        # if no target is specified, default to the GPU lowering
+        self.sort = is_op("relax.sort")(self.input)
+        self.cumsum = is_op("relax.cumsum")(self.input)
+        self.pattern = (
+            self.cumsum_gpu
+            | self.cumsum_cpu
+            | self.sort_gpu
+            | self.sort_cpu
+            | self.sort
+            | self.cumsum
+        )

     def transform_function(self, func: Expr, mod: IRModule, ctx: PassContext) -> IRModule:
         """
@@ -64,55 +76,87 @@ def transform_function(self, func: Expr, mod: IRModule, ctx: PassContext) -> IRModule:
                 continue

         def rewriter(expr, matches):
-            print("got here 70, expr: ", expr)
             arg = matches[self.input]
-            print("got arg: ", arg)

-            if self.cumsum_gpu in matches:
-                print("86 matches[self.no_op_reshape]: ", matches[self.cumsum_gpu])
-                return relax.call_dps_packed(
+            if self.cumsum_gpu in matches or (
+                self.cumsum in matches and self.cumsum_cpu not in matches
+            ):
+                # `expr` is the matched cumsum call, whichever pattern fired
+                axis = expr.attrs.axis
+                output_dtype = expr.attrs.dtype
+                if output_dtype is None:
+                    output_dtype = arg.struct_info.dtype
+                out_sinfo = relax.TensorStructInfo(
+                    arg.struct_info.shape, output_dtype, arg.struct_info.vdevice
+                )
+                if axis is None:
+                    # no axis means scan over the flattened input
+                    axis = 0
+                    new_shape = (prod(arg.struct_info.shape),)
+                    arg = relax.op.reshape(arg, new_shape)
+                    out_sinfo = relax.TensorStructInfo(
+                        new_shape, output_dtype, out_sinfo.vdevice
+                    )
+                return relax.op.call_dps_packed(
                     "tvm.contrib.thrust.sum_scan",
-                    [arg],
-                    out_sinfo=arg.struct_info,
-                )
-            elif self.sort_gpu in matches:
-                print("86 matches[self.no_op_reshape]: ", matches[self.sort_gpu])
-                return relax.call_dps_packed(
-                    "tvm.contrib.thrust.sort",
-                    [arg],
-                    out_sinfo=arg.struct_info,
+                    [arg, int(axis)],
+                    out_sinfo=out_sinfo,
                 )
+
             elif self.sort_cpu in matches:
+                axis = expr.attrs.axis
+                is_ascend = int(expr.attrs.is_ascend)
+                out_sinfo = arg.struct_info
+                if axis is None:
+                    # no axis means sort the flattened input
+                    axis = 0
+                    new_shape = (prod(arg.struct_info.shape),)
+                    arg = relax.op.reshape(arg, new_shape)
+                    out_sinfo = relax.TensorStructInfo(
+                        new_shape, arg.struct_info.dtype, out_sinfo.vdevice
+                    )
+
                 return relax.call_dps_packed(
                     "tvm.contrib.sort.sort",
-                    [arg],
-                    out_sinfo=arg.struct_info,
+                    [arg, int(axis), is_ascend],
+                    out_sinfo=out_sinfo,
                 )

+            elif self.sort_gpu in matches or self.sort in matches:
+                axis = expr.attrs.axis
+                if axis is None:
+                    axis = -1
+                axis = int(axis)
+
+                is_ascend = expr.attrs.is_ascend
+                if is_ascend is None:
+                    is_ascend = True
+                out_sinfo = arg.struct_info
+                ndim = arg.struct_info.ndim
+
+                axis = ndim + axis if axis < 0 else axis
+                if axis != ndim - 1:
+                    # thrust sorts along the last axis, so move `axis` there
+                    axes = swap(list(range(ndim)), axis)
+                    arg = relax.op.permute_dims(arg, axes)
+                    new_shape = [out_sinfo.shape[i] for i in axes]
+                    out_sinfo = relax.TensorStructInfo(
+                        new_shape, out_sinfo.dtype, out_sinfo.vdevice
+                    )
+
+                out = relax.op.call_dps_packed(
+                    "tvm.contrib.thrust.sort",
+                    [arg, int(is_ascend)],
+                    out_sinfo=out_sinfo,
+                )
+                if axis != ndim - 1:
+                    # transpose back to restore the original axis order
+                    axes = swap(list(range(ndim)), axis)
+                    out = relax.op.permute_dims(out, axes)
+                return out
+
             return expr

         updated_func = rewrite_call(self.pattern, rewriter, func)

         return updated_func
-
-
-# Option 0): add a global dict for it: {op, target, condition, dps_packed},
-# condition is some specific setting like the value of k in topk
-# Q: how to work it with pattern match?
-#
-# Option 1): normal python mod pass, straightforward, but not easy to hack like topk
-#
-# Option 2): c++ pass, not easy to be updated. Don't go
-#
-# How to handle with target? don't require RealizeVDevice, just specify the vdevice in inputs
-# but vdevice is necessary, we could have default for it
-#
-# Sample map
-# cumsum - cpu => ignore for legalization
-# cumsum - gpu => relax.call_dps_packed(
-#     "tvm.contrib.thrust.sum_scan",
-#     [data],
-#     out_sinfo=data.struct_info,
-# )
-# f32_233 = wildcard().has_shape((2, 3, 3)) & has_dtype("float32")  # and pattern
-# is_op("nn.conv2d")(xp, yp).has_attr({"kernel_size": [4, 3]}).match(conv2d)
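
For context, a rough sketch of how the pass above could be driven. The module construction (via relax.BlockBuilder) and the pass invocation follow standard TVM conventions but are illustrative only, not part of this commit:

    import tvm
    from tvm import relax

    # build a tiny module containing a relax.cumsum call
    x = relax.Var("x", relax.TensorStructInfo((2, 3), "float32"))
    bb = relax.BlockBuilder()
    with bb.function("main", [x]):
        bb.emit_func_output(relax.op.cumsum(x, axis=0))
    mod = bb.get()

    # No target/vdevice attached: the has_target patterns don't fire, so the
    # bare self.cumsum pattern matches and, per the default-to-GPU rule above,
    # the call is rewritten to
    # call_dps_packed("tvm.contrib.thrust.sum_scan", ...).
    mod = DispatchOps()(mod)
    mod.show()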