[CIR] Add support for ExtVector Bool Type

lanza · lanza · commit ab3795b457c7 · 2025-11-21T20:11:08.000-08:00
Implements support for ext_vector_type with bool elements. Bool vectors are represented as integers in CIR (e.g., bool4 uses !cir.int<u, 8>), matching traditional CodeGen's approach.

Key changes:
- CIRGenTypes: Convert ExtVectorBoolType to integer storage (iN where N = max(num_elements, 8))
- CIRGenExprConst: Pack bool elements into integer bits during constant initialization
- CIRGenExprScalar: Handle subscript access by extracting bits from integer
- CIRGenExpr: Skip vector optimizations for ExtVectorBoolType in load/store paths

Tests added for basic initialization, subscript access, and bitwise operations.

ghstack-source-id: b8879c0
Pull-Request: #1998
diff --git a/clang/lib/CIR/CodeGen/CIRGenExpr.cpp b/clang/lib/CIR/CodeGen/CIRGenExpr.cpp
@@ -634,6 +634,14 @@ CIRGenCallee CIRGenFunction::emitCallee(const clang::Expr *E) {
 
 mlir::Value CIRGenFunction::emitToMemory(mlir::Value Value, QualType Ty) {
   // Bool has a different representation in memory than in registers.
+
+  // ExtVectorBoolType: In ClangIR, ExtVectorBoolType is always represented
+  // as an integer type (!cir.int<u, N>) throughout the IR, including both
+  // in registers and in memory. This differs from traditional CodeGen where
+  // it may exist as a vector type that needs conversion to integer for storage.
+  // Since we use integer representation consistently, no conversion is needed.
+  // See the ExtVector case of CIRGenTypes::convertType for the conversion.
+
   return Value;
 }
 
@@ -653,18 +661,21 @@ void CIRGenFunction::emitStoreOfScalar(mlir::Value value, Address addr,
 
   auto eltTy = addr.getElementType();
   if (const auto *clangVecTy = ty->getAs<clang::VectorType>()) {
-    // Boolean vectors use `iN` as storage type.
+    // Boolean vectors use `iN` as storage type. The type conversion in
+    // CIRGenTypes::convertType (ExtVector case) returns an integer type for
+    // ExtVectorBoolType, so eltTy is already an integer. Skip vector
+    // optimizations for bool vectors since they're not actually vectors in CIR.
     if (clangVecTy->isExtVectorBoolType()) {
-      llvm_unreachable("isExtVectorBoolType NYI");
-    }
-
-    // Handle vectors of size 3 like size 4 for better performance.
-    const auto vTy = cast<cir::VectorType>(eltTy);
-    auto newVecTy =
-        CGM.getABIInfo().getOptimalVectorMemoryType(vTy, getLangOpts());
+      // Storage is already an integer type, nothing special needed
+    } else {
+      // Handle vectors of size 3 like size 4 for better performance.
+      const auto vTy = cast<cir::VectorType>(eltTy);
+      auto newVecTy =
+          CGM.getABIInfo().getOptimalVectorMemoryType(vTy, getLangOpts());
 
-    if (vTy != newVecTy) {
-      llvm_unreachable("NYI");
+      if (vTy != newVecTy) {
+        llvm_unreachable("NYI");
+      }
     }
   }
 
@@ -2956,6 +2967,13 @@ mlir::Value CIRGenFunction::emitFromMemory(mlir::Value Value, QualType Ty) {
     llvm_unreachable("NIY");
   }
 
+  // ExtVectorBoolType: In ClangIR, ExtVectorBoolType is always represented
+  // as an integer type (!cir.int<u, N>) throughout the IR, including both
+  // in registers and in memory. This differs from traditional CodeGen where
+  // it may need truncation from storage type to value type. Since we use
+  // integer representation consistently, no conversion is needed.
+  // See the ExtVector case of CIRGenTypes::convertType for the conversion.
+
   return Value;
 }
 
@@ -2977,24 +2995,27 @@ mlir::Value CIRGenFunction::emitLoadOfScalar(Address addr, bool isVolatile,
   auto eltTy = addr.getElementType();
 
   if (const auto *clangVecTy = ty->getAs<clang::VectorType>()) {
-    // Boolean vectors use `iN` as storage type.
+    // Boolean vectors use `iN` as storage type. The type conversion in
+    // CIRGenTypes::convertType (ExtVector case) returns an integer type for
+    // ExtVectorBoolType, so eltTy is already an integer. Skip vector
+    // optimizations for bool vectors since they're not actually vectors in CIR.
     if (clangVecTy->isExtVectorBoolType()) {
-      llvm_unreachable("NYI");
-    }
-
-    // Handle vectors of size 3 like size 4 for better performance.
-    const auto vTy = cast<cir::VectorType>(eltTy);
-    auto newVecTy =
-        CGM.getABIInfo().getOptimalVectorMemoryType(vTy, getLangOpts());
-
-    if (vTy != newVecTy) {
-      const Address cast = addr.withElementType(builder, newVecTy);
-      mlir::Value v = builder.createLoad(loc, cast, isVolatile);
-      const uint64_t oldNumElements = vTy.getSize();
-      SmallVector<int64_t, 16> mask(oldNumElements);
-      std::iota(mask.begin(), mask.end(), 0);
-      v = builder.createVecShuffle(loc, v, mask);
-      return emitFromMemory(v, ty);
+      // Storage is already an integer type, nothing special needed
+    } else {
+      // Handle vectors of size 3 like size 4 for better performance.
+      const auto vTy = cast<cir::VectorType>(eltTy);
+      auto newVecTy =
+          CGM.getABIInfo().getOptimalVectorMemoryType(vTy, getLangOpts());
+
+      if (vTy != newVecTy) {
+        const Address cast = addr.withElementType(builder, newVecTy);
+        mlir::Value v = builder.createLoad(loc, cast, isVolatile);
+        const uint64_t oldNumElements = vTy.getSize();
+        SmallVector<int64_t, 16> mask(oldNumElements);
+        std::iota(mask.begin(), mask.end(), 0);
+        v = builder.createVecShuffle(loc, v, mask);
+        return emitFromMemory(v, ty);
+      }
     }
   }
 
diff --git a/clang/lib/CIR/CodeGen/CIRGenExprConst.cpp b/clang/lib/CIR/CodeGen/CIRGenExprConst.cpp
@@ -1134,11 +1134,42 @@ class ConstExprEmitter
   }
 
   mlir::Attribute EmitVectorInitialization(InitListExpr *ILE, QualType T) {
-    cir::VectorType VecTy = mlir::cast<cir::VectorType>(CGM.convertType(T));
-    unsigned NumElements = VecTy.getSize();
+    auto *VecTy = T->castAs<VectorType>();
+
+    // ExtVectorBoolType uses integer storage, not vector type
+    if (VecTy->isExtVectorBoolType()) {
+      // For ExtVectorBoolType, the storage is an integer type
+      // Compute the value by packing bools into an integer
+      uint64_t numElements = VecTy->getNumElements();
+      unsigned numInits = ILE->getNumInits();
+      assert(numElements >= numInits && "Too many initializers for a vector");
+
+      // Create integer value by packing bool elements
+      uint64_t value = 0;
+      for (unsigned i = 0; i < numInits; ++i) {
+        auto Init = ILE->getInit(i);
+        Expr::EvalResult result;
+        if (!Init->EvaluateAsRValue(result, CGM.getASTContext()))
+          return {};
+        bool boolVal = result.Val.getInt().getBoolValue();
+        if (boolVal)
+          value |= (uint64_t(1) << i);
+      }
+
+      // Pad to at least 8 bits
+      uint64_t storageBits = std::max<uint64_t>(numElements, 8);
+      auto storageTy =
+          cir::IntType::get(CGM.getBuilder().getContext(), storageBits,
+                            /*isSigned=*/false);
+      return cir::IntAttr::get(storageTy, value);
+    }
+
+    // Regular vector type
+    cir::VectorType CIRVecTy = mlir::cast<cir::VectorType>(CGM.convertType(T));
+    unsigned NumElements = CIRVecTy.getSize();
     unsigned NumInits = ILE->getNumInits();
     assert(NumElements >= NumInits && "Too many initializers for a vector");
-    QualType EltTy = T->castAs<VectorType>()->getElementType();
+    QualType EltTy = VecTy->getElementType();
     SmallVector<mlir::Attribute, 8> Elts;
     // Process the explicit initializers
     for (unsigned i = 0; i < NumInits; ++i) {
@@ -1149,10 +1180,11 @@ class ConstExprEmitter
     }
     // Zero-fill the rest of the vector
     for (unsigned i = NumInits; i < NumElements; ++i) {
-      Elts.push_back(CGM.getBuilder().getZeroInitAttr(VecTy.getElementType()));
+      Elts.push_back(
+          CGM.getBuilder().getZeroInitAttr(CIRVecTy.getElementType()));
     }
     return cir::ConstVectorAttr::get(
-        VecTy, mlir::ArrayAttr::get(CGM.getBuilder().getContext(), Elts));
+        CIRVecTy, mlir::ArrayAttr::get(CGM.getBuilder().getContext(), Elts));
   }
 
   mlir::Attribute VisitImplicitValueInitExpr(ImplicitValueInitExpr *E,
diff --git a/clang/lib/CIR/CodeGen/CIRGenExprScalar.cpp b/clang/lib/CIR/CodeGen/CIRGenExprScalar.cpp
@@ -309,8 +309,39 @@ class ScalarExprEmitter : public StmtVisitor<ScalarExprEmitter, mlir::Value> {
     if (E->getBase()->getType()->isVectorType()) {
       assert(!cir::MissingFeatures::scalableVectors() &&
              "NYI: index into scalable vector");
-      // Subscript of vector type.  This is handled differently, with a custom
-      // operation.
+
+      // ExtVectorBoolType uses integer storage, handle it specially
+      const auto *VecTy = E->getBase()
+                              ->getType()
+                              .getCanonicalType()
+                              ->getAs<clang::VectorType>();
+      if (VecTy && VecTy->isExtVectorBoolType()) {
+        // For ExtVectorBoolType, extract a bit from the integer
+        mlir::Value IntValue = Visit(E->getBase());
+        mlir::Value IndexValue = Visit(E->getIdx());
+
+        // Extract the bit: (IntValue >> IndexValue) & 1
+        auto Loc = CGF.getLoc(E->getSourceRange());
+        auto BoolTy = CGF.builder.getBoolTy();
+        auto IntTy = IntValue.getType();
+
+        // Shift right by index: IntValue >> IndexValue
+        mlir::Value Shifted =
+            cir::ShiftOp::create(CGF.builder, Loc, IntTy, IntValue, IndexValue,
+                                 /*isShiftLeft=*/false);
+
+        // Mask with 1: Shifted & 1
+        mlir::Value One = CGF.builder.getConstInt(Loc, IntTy, 1);
+        mlir::Value Masked = cir::BinOp::create(
+            CGF.builder, Loc, IntTy, cir::BinOpKind::And, Shifted, One);
+
+        // Convert to bool: Masked != 0
+        mlir::Value Zero = CGF.builder.getConstInt(Loc, IntTy, 0);
+        return cir::CmpOp::create(CGF.builder, Loc, BoolTy, cir::CmpOpKind::ne,
+                                  Masked, Zero);
+      }
+
+      // Regular vector subscript
       mlir::Value VecValue = Visit(E->getBase());
       mlir::Value IndexValue = Visit(E->getIdx());
       return cir::VecExtractOp::create(CGF.getBuilder(),
diff --git a/clang/lib/CIR/CodeGen/CIRGenTypes.cpp b/clang/lib/CIR/CodeGen/CIRGenTypes.cpp
@@ -670,8 +670,18 @@ mlir::Type CIRGenTypes::convertType(QualType T) {
   case Type::ExtVector:
   case Type::Vector: {
     const VectorType *V = cast<VectorType>(Ty);
-    auto ElementType = convertTypeForMem(V->getElementType());
-    ResultType = cir::VectorType::get(ElementType, V->getNumElements());
+    // Boolean vectors use an integer as storage type, matching traditional
+    // CodeGen. For N bool elements, storage is iM where M = max(N, 8).
+    if (V->isExtVectorBoolType()) {
+      uint64_t numElements = V->getNumElements();
+      // Pad to at least one byte (8 bits)
+      uint64_t storageBits = std::max<uint64_t>(numElements, 8);
+      ResultType = cir::IntType::get(Builder.getContext(), storageBits,
+                                     /*isSigned=*/false);
+    } else {
+      auto ElementType = convertTypeForMem(V->getElementType());
+      ResultType = cir::VectorType::get(ElementType, V->getNumElements());
+    }
     break;
   }
   case Type::ConstantMatrix: {
diff --git a/clang/test/CIR/CodeGen/extvector-bool.cpp b/clang/test/CIR/CodeGen/extvector-bool.cpp
@@ -0,0 +1,155 @@
+// RUN: %clang_cc1 -triple x86_64-unknown-linux-gnu -fclangir -emit-cir %s -o %t.cir
+// RUN: FileCheck --input-file=%t.cir %s
+
+// Test basic ext_vector_type with bool elements
+typedef bool bool4 __attribute__((ext_vector_type(4)));
+typedef bool bool2 __attribute__((ext_vector_type(2)));
+typedef bool bool16 __attribute__((ext_vector_type(16)));
+
+// CHECK-LABEL: cir.func {{.*}}@_Z10test_basicv
+void test_basic() {
+  // CHECK: %[[ALLOCA:.*]] = cir.alloca !u8i, !cir.ptr<!u8i>, ["v"
+  bool4 v = {true, false, true, false};
+  // CHECK: %[[CONST:.*]] = cir.const #cir.int<5> : !u8i
+  // CHECK: cir.store {{.*}} %[[CONST]], %[[ALLOCA]]
+}
+
+// CHECK-LABEL: cir.func {{.*}}@_Z14test_subscriptv
+void test_subscript() {
+  bool4 v = {true, false, true, false};
+  // CHECK: %[[LOAD:.*]] = cir.load{{.*}}!u8i
+  // CHECK: %[[IDX:.*]] = cir.const #cir.int<2>
+  // CHECK: %[[SHIFT:.*]] = cir.shift(right, %[[LOAD]]{{.*}}, %[[IDX]]
+  // CHECK: cir.binop(and,{{.*}}){{.*}}!u8i
+  // CHECK: cir.cmp(ne,{{.*}}){{.*}}!cir.bool
+  bool b = v[2];
+}
+
+// CHECK-LABEL: cir.func {{.*}}@_Z8test_ops
+void test_ops(bool4 a, bool4 b) {
+  // CHECK: cir.binop(and,{{.*}}){{.*}}!u8i
+  bool4 c = a & b;
+}
+
+// NOTE: The following operations are not yet fully implemented for
+// ExtVectorBoolType and require special handling:
+// - Element assignment (v[2] = true): Requires bit manipulation to set/clear individual bits
+// - Unary logical NOT (!v): May require special handling beyond bitwise NOT
+
+// Test bitwise operations
+// CHECK-LABEL: cir.func {{.*}}@_Z16test_bitwise_opsv
+void test_bitwise_ops() {
+  bool4 a = {true, false, true, false};
+  bool4 b = {false, true, true, false};
+
+  // Bitwise AND
+  // CHECK: cir.binop(and,{{.*}}){{.*}}!u8i
+  bool4 c = a & b;
+
+  // Bitwise OR
+  // CHECK: cir.binop(or,{{.*}}){{.*}}!u8i
+  bool4 d = a | b;
+
+  // Bitwise XOR
+  // CHECK: cir.binop(xor,{{.*}}){{.*}}!u8i
+  bool4 e = a ^ b;
+}
+
+// Test different vector sizes
+// CHECK-LABEL: cir.func {{.*}}@_Z17test_vector_sizesv
+void test_vector_sizes() {
+  // bool2 uses u8i (padded to 8 bits minimum)
+  // CHECK: cir.alloca !u8i, !cir.ptr<!u8i>, ["v2"
+  bool2 v2 = {true, false};
+  // CHECK-DAG: cir.const #cir.int<1> : !u8i
+  // CHECK-DAG: cir.store{{.*}}!u8i, !cir.ptr<!u8i>
+
+  // bool16 uses u16i
+  // CHECK-DAG: cir.alloca !u16i, !cir.ptr<!u16i>, ["v16"
+  bool16 v16 = {true, false, true, false, true, false, true, false,
+                false, true, false, true, false, true, false, true};
+  // CHECK-DAG: cir.const #cir.int<43605> : !u16i
+  // CHECK-DAG: cir.store{{.*}}!u16i, !cir.ptr<!u16i>
+}
+
+// Test function parameters and returns
+// CHECK-LABEL: cir.func {{.*}}@_Z12invert_bool4
+// CHECK-SAME: %arg0: !u8i
+// CHECK-SAME: -> !u8i
+bool4 invert_bool4(bool4 v) {
+  // Bitwise NOT
+  // CHECK: %[[LOAD:.*]] = cir.load{{.*}}!u8i
+  // CHECK: cir.unary(not, %[[LOAD]]){{.*}}!u8i
+  return ~v;
+}
+
+// Test all bits set and all bits clear
+// CHECK-LABEL: cir.func {{.*}}@_Z15test_edge_casesv
+void test_edge_cases() {
+  // All false (0)
+  // CHECK-DAG: cir.alloca !u8i, !cir.ptr<!u8i>, ["all_false"
+  bool4 all_false = {false, false, false, false};
+  // CHECK-DAG: cir.const #cir.int<0> : !u8i
+  // CHECK-DAG: cir.store{{.*}}!u8i, !cir.ptr<!u8i>
+
+  // All true (15 = 0b1111 for 4 bits)
+  // CHECK-DAG: cir.alloca !u8i, !cir.ptr<!u8i>, ["all_true"
+  bool4 all_true = {true, true, true, true};
+  // CHECK-DAG: cir.const #cir.int<15> : !u8i
+  // CHECK-DAG: cir.store{{.*}}!u8i, !cir.ptr<!u8i>
+}
+
+// Test subscript with variable index
+// CHECK-LABEL: cir.func {{.*}}@_Z23test_variable_subscript
+void test_variable_subscript(int idx) {
+  bool4 v = {true, false, true, false};
+  // CHECK: cir.load{{.*}}!u8i
+  // CHECK: cir.load{{.*}}!s32i
+  // CHECK: cir.shift(right,{{.*}}){{.*}}!u8i
+  // CHECK: cir.binop(and,{{.*}}){{.*}}!u8i
+  bool b = v[idx];
+}
+
+// Test initialization with all same value
+// CHECK-LABEL: cir.func {{.*}}@_Z18test_same_init_valv
+void test_same_init_val() {
+  // Initialize all elements to true with an explicit initializer list
+  // CHECK: cir.alloca !u8i, !cir.ptr<!u8i>, ["v"
+  bool4 v = {true, true, true, true};
+  // CHECK: cir.const #cir.int<15> : !u8i
+  // CHECK: cir.store{{.*}}!u8i, !cir.ptr<!u8i>
+}
+
+// Test multiple operations in sequence
+// CHECK-LABEL: cir.func {{.*}}@_Z17test_multiple_opsv
+void test_multiple_ops() {
+  bool4 a = {true, false, true, false};
+  bool4 b = {false, true, true, false};
+
+  // CHECK: cir.binop(and,{{.*}}){{.*}}!u8i
+  bool4 c = a & b;
+  // CHECK: cir.binop(or,{{.*}}){{.*}}!u8i
+  bool4 d = c | b;
+  // CHECK: cir.unary(not,{{.*}}){{.*}}!u8i
+  bool4 e = ~d;
+}
+
+// Test reading specific elements
+// CHECK-LABEL: cir.func {{.*}}@_Z18test_read_elementsv
+void test_read_elements() {
+  bool4 v = {true, false, true, false};
+
+  // Read element 0
+  // CHECK: cir.load{{.*}}!u8i
+  // CHECK: cir.const #cir.int<0>
+  // CHECK: cir.shift(right,{{.*}}){{.*}}!u8i
+  // CHECK: cir.binop(and,{{.*}}){{.*}}!u8i
+  bool e0 = v[0];
+
+  // Read element 3
+  // CHECK: cir.load{{.*}}!u8i
+  // CHECK: cir.const #cir.int<3>
+  // CHECK: cir.shift(right,{{.*}}){{.*}}!u8i
+  // CHECK: cir.binop(and,{{.*}}){{.*}}!u8i
+  bool e3 = v[3];
+}