taichi-dev · Hanke98 · Sep 23, 2020 · Sep 15, 2020 · Sep 15, 2020 · Sep 22, 2020
diff --git a/python/taichi/lang/ops.py b/python/taichi/lang/ops.py
@@ -420,6 +420,12 @@ def bit_sar(a, b):
     return _binary_operation(ti_core.expr_bit_sar, ops.rshift, a, b)
 
 
+@taichi_scope
+@binary
+def bit_shr(a, b):
+    """Logical (zero-filling) right shift of `a` by `b` bits.
+
+    Forwards both operands to `_binary_operation`, passing
+    `ti_core.expr_bit_shr` as the Taichi expression builder and `ops.rshift`
+    as the Python-side operator, and returns whatever that helper returns.
+    """
+    # NOTE(review): `ops.rshift` is presumably `operator.rshift`, i.e. Python's
+    # `>>`, which sign-extends negative ints. If `_binary_operation` applies it
+    # to plain Python operands the result would be an arithmetic shift rather
+    # than a logical one -- TODO confirm against `_binary_operation`.
+    return _binary_operation(ti_core.expr_bit_shr, ops.rshift, a, b)
+
+
 # We don't have logic_and/or instructions yet:
 logical_or = bit_or
 logical_and = bit_and

diff --git a/taichi/codegen/codegen_llvm.cpp b/taichi/codegen/codegen_llvm.cpp
@@ -416,8 +416,13 @@ void CodeGenLLVM::visit(BinaryOpStmt *stmt) {
     llvm_val[stmt] =
         builder->CreateShl(llvm_val[stmt->lhs], llvm_val[stmt->rhs]);
   } else if (op == BinaryOpType::bit_sar) {
-    llvm_val[stmt] =
-        builder->CreateAShr(llvm_val[stmt->lhs], llvm_val[stmt->rhs]);
+    if (is_signed(stmt->lhs->element_type())) {
+      llvm_val[stmt] =
+          builder->CreateAShr(llvm_val[stmt->lhs], llvm_val[stmt->rhs]);
+    } else {
+      llvm_val[stmt] =
+          builder->CreateLShr(llvm_val[stmt->lhs], llvm_val[stmt->rhs]);
+    }
   } else if (op == BinaryOpType::max) {
     if (is_real(ret_type)) {
       llvm_val[stmt] =

diff --git a/taichi/inc/binary_op.inc.h b/taichi/inc/binary_op.inc.h
@@ -11,6 +11,7 @@ PER_BINARY_OP(bit_and)
 PER_BINARY_OP(bit_or)
 PER_BINARY_OP(bit_xor)
 PER_BINARY_OP(bit_shl)
+PER_BINARY_OP(bit_shr)
 PER_BINARY_OP(bit_sar)
 PER_BINARY_OP(cmp_lt)
 PER_BINARY_OP(cmp_le)

diff --git a/taichi/ir/expression_ops.h b/taichi/ir/expression_ops.h
@@ -100,6 +100,7 @@ DEFINE_EXPRESSION_FUNC(atan2);
 DEFINE_EXPRESSION_FUNC(pow);
 DEFINE_EXPRESSION_FUNC(truediv);
 DEFINE_EXPRESSION_FUNC(floordiv);
+DEFINE_EXPRESSION_FUNC(bit_shr);  // logical right shift; `;` matches sibling entries
 
 #undef DEFINE_EXPRESSION_OP_UNARY
 #undef DEFINE_EXPRESSION_OP_BINARY

diff --git a/taichi/lang_util.h b/taichi/lang_util.h
@@ -109,6 +109,22 @@ inline bool constexpr is_unsigned(DataType dt) {
   return !is_signed(dt);
 }
 
+// Maps a signed integer DataType to the unsigned integer DataType of the same
+// bit width (i8 -> u8, i16 -> u16, i32 -> u32, i64 -> u64).
+// Asserts that `dt` is signed. Returns DataType::unknown for any signed type
+// that is not one of the four integer widths listed above.
+inline DataType to_unsigned(DataType dt) {
+  TI_ASSERT(is_signed(dt));
+  switch (dt) {
+    case DataType::i8:
+      return DataType::u8;
+    case DataType::i16:
+      return DataType::u16;
+    case DataType::i32:
+      return DataType::u32;
+    case DataType::i64:
+      // Must stay 64 bits wide: callers use the result as a bit-cast target,
+      // and u32 is not a same-width reinterpretation of i64.
+      return DataType::u64;
+    default:
+      return DataType::unknown;
+  }
+}
+
 inline bool needs_grad(DataType dt) {
   return is_real(dt);
 }

diff --git a/taichi/python/export_lang.cpp b/taichi/python/export_lang.cpp
@@ -430,6 +430,7 @@ void export_lang(py::module &m) {
   m.def("expr_bit_or", expr_bit_or);
   m.def("expr_bit_xor", expr_bit_xor);
   m.def("expr_bit_shl", expr_bit_shl);
+  m.def("expr_bit_shr", expr_bit_shr);
   m.def("expr_bit_sar", expr_bit_sar);
   m.def("expr_bit_not", expr_bit_not);
   m.def("expr_logic_not", expr_logic_not);

diff --git a/taichi/transforms/demote_operations.cpp b/taichi/transforms/demote_operations.cpp
@@ -73,6 +73,29 @@ class DemoteOperations : public BasicStmtVisitor {
         modifier.insert_before(stmt, std::move(floor));
         modifier.erase(stmt);
       }
+    } else if (stmt->op_type == BinaryOpType::bit_shr &&
+               is_integral(lhs->element_type()) &&
+               is_integral(rhs->element_type()) &&
+               is_signed(lhs->element_type())) {
+      // @ti.func
+      // def bit_shr(a, b):
+      //     unsigned_a = ti.cast(a, ti.uXX)
+      //     shifted = ti.bit_sar(unsigned_a, b)
+      //     ret = ti.cast(shifted, ti.iXX)
+      //     return ret
+      auto unsigned_cast = Stmt::make<UnaryOpStmt>(UnaryOpType::cast_bits, lhs);
+      unsigned_cast->as<UnaryOpStmt>()->cast_type =
+          to_unsigned(lhs->element_type());
+      auto shift = Stmt::make<BinaryOpStmt>(BinaryOpType::bit_sar,
+                                            unsigned_cast.get(), rhs);
+      auto signed_cast =
+          Stmt::make<UnaryOpStmt>(UnaryOpType::cast_bits, shift.get());
+      signed_cast->as<UnaryOpStmt>()->cast_type = lhs->element_type();
+      stmt->replace_with(signed_cast.get());
+      modifier.insert_before(stmt, std::move(unsigned_cast));
+      modifier.insert_before(stmt, std::move(shift));
+      modifier.insert_before(stmt, std::move(signed_cast));
+      modifier.erase(stmt);
     }
   }
 

diff --git a/tests/python/test_bit_operations.py b/tests/python/test_bit_operations.py
@@ -29,3 +29,19 @@ def sar(a: ti.i32, b: ti.i32) -> ti.i32:
     # for negative number
     for i in range(n):
         assert sar(neg_test_num, i) == -2**(n - i)
+
+
+@ti.test()
+def test_bit_shr():
+    """Check that `ti.bit_shr` on i32 operands shifts in zeros from the left.
+
+    A positive power of two must simply be divided by 2**shift, while a
+    negative operand must behave like its 32-bit two's-complement bit pattern
+    shifted right without sign extension.
+    """
+    @ti.kernel
+    def shr(a: ti.i32, b: ti.i32) -> ti.i32:
+        return ti.bit_shr(a, b)
+
+    bits = 8
+    positive = 1 << bits
+    negative = -positive
+
+    # Non-negative operand: a logical shift equals a plain right shift.
+    for shift in range(bits):
+        assert shr(positive, shift) == positive >> shift
+
+    # Negative operand: a shift by zero returns the value unchanged; any
+    # larger shift clears the sign bit, so the expected value is computed
+    # from the unsigned 32-bit reinterpretation (value + 2**32).
+    for shift in range(bits):
+        if shift > 0:
+            expected = (negative + 0x100000000) >> shift
+        else:
+            expected = negative
+        assert shr(negative, shift) == expected
 void visit(BinaryOpStmt *stmt) override { 
 void visit(BinaryOpStmt *stmt) override {