Skip to content

Commit b1fa9d1

Browse files
authored
[flang][cuda] Correctly embox logical constant (llvm#116445)
1 parent 64c4550 commit b1fa9d1

File tree

2 files changed

+27
-2
lines changed

2 files changed

+27
-2
lines changed

flang/lib/Optimizer/Transforms/CUFOpConversion.cpp

Lines changed: 8 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -473,9 +473,16 @@ static mlir::Value emboxSrc(mlir::PatternRewriter &rewriter,
473473
mlir::Type srcTy = fir::unwrapRefType(op.getSrc().getType());
474474
if (fir::isa_trivial(srcTy) &&
475475
mlir::matchPattern(op.getSrc().getDefiningOp(), mlir::m_Constant())) {
476+
mlir::Value src = op.getSrc();
477+
if (srcTy.isInteger(1)) {
478+
// i1 is not a supported type in the descriptor and it is actually coming
479+
// from a LOGICAL constant. Store it as a fir.logical.
480+
srcTy = fir::LogicalType::get(rewriter.getContext(), 4);
481+
src = createConvertOp(rewriter, loc, srcTy, src);
482+
}
476483
// Put constant in memory if it is not.
477484
mlir::Value alloc = builder.createTemporary(loc, srcTy);
478-
builder.create<fir::StoreOp>(loc, op.getSrc(), alloc);
485+
builder.create<fir::StoreOp>(loc, src, alloc);
479486
addr = alloc;
480487
} else {
481488
addr = getDeviceAddress(rewriter, op.getSrcMutable(), symtab);

flang/test/Fir/CUDA/cuda-data-transfer.fir

Lines changed: 19 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -385,7 +385,6 @@ func.func @_QPdevice_addr_conv() {
385385
// CHECK: fir.embox %[[DEV_ADDR_CONV]](%{{.*}}) : (!fir.ref<!fir.array<4xf32>>, !fir.shape<1>) -> !fir.box<!fir.array<4xf32>>
386386
// CHECK: fir.call @_FortranACUFDataTransferDescDescNoRealloc
387387

388-
389388
func.func @_QQchar_transfer() attributes {fir.bindc_name = "char_transfer"} {
390389
%c1 = arith.constant 1 : index
391390
%c10 = arith.constant 10 : index
@@ -447,5 +446,24 @@ func.func @_QPdevmul(%arg0: !fir.ref<!fir.array<1x?xf32>> {fir.bindc_name = "b"}
447446
// CHECK: %[[DST:.*]] = fir.convert %[[ALLOCA0]] : (!fir.ref<!fir.box<!fir.array<?x?xf32>>>) -> !fir.ref<!fir.box<none>>
448447
// CHECK: fir.call @_FortranACUFDataTransferDescDesc(%[[DST]], %{{.*}}, %{{.*}}, %{{.*}}, %{{.*}}) : (!fir.ref<!fir.box<none>>, !fir.ref<!fir.box<none>>, i32, !fir.ref<i8>, i32) -> none
449448

449+
func.func @_QPlogical_cst() {
450+
%c0_i64 = arith.constant 0 : i64
451+
%false = arith.constant false
452+
%c0 = arith.constant 0 : index
453+
%0 = cuf.alloc !fir.box<!fir.heap<!fir.array<?x?x!fir.logical<1>>>> {bindc_name = "id2", data_attr = #cuf.cuda<device>, uniq_name = "_QFlogical_cstEid2"} -> !fir.ref<!fir.box<!fir.heap<!fir.array<?x?x!fir.logical<1>>>>>
454+
%4 = fir.declare %0 {data_attr = #cuf.cuda<device>, fortran_attrs = #fir.var_attrs<allocatable>, uniq_name = "_QFlogical_cstEid2"} : (!fir.ref<!fir.box<!fir.heap<!fir.array<?x?x!fir.logical<1>>>>>) -> !fir.ref<!fir.box<!fir.heap<!fir.array<?x?x!fir.logical<1>>>>>
455+
cuf.data_transfer %false to %4 {transfer_kind = #cuf.cuda_transfer<host_device>} : i1, !fir.ref<!fir.box<!fir.heap<!fir.array<?x?x!fir.logical<1>>>>>
456+
return
457+
}
458+
459+
// CHECK-LABEL: func.func @_QPlogical_cst()
460+
// CHECK: %[[DESC:.*]] = fir.alloca !fir.box<!fir.logical<4>>
461+
// CHECK: %[[CONST:.*]] = fir.alloca !fir.logical<4>
462+
// CHECK: %[[CONV:.*]] = fir.convert %false : (i1) -> !fir.logical<4>
463+
// CHECK: fir.store %[[CONV]] to %[[CONST]] : !fir.ref<!fir.logical<4>>
464+
// CHECK: %[[EMBOX:.*]] = fir.embox %[[CONST]] : (!fir.ref<!fir.logical<4>>) -> !fir.box<!fir.logical<4>>
465+
// CHECK: fir.store %[[EMBOX]] to %[[DESC]] : !fir.ref<!fir.box<!fir.logical<4>>>
466+
// CHECK: %[[BOX_NONE:.*]] = fir.convert %[[DESC]] : (!fir.ref<!fir.box<!fir.logical<4>>>) -> !fir.ref<!fir.box<none>>
467+
// CHECK: fir.call @_FortranACUFDataTransferDescDesc(%{{.*}}, %[[BOX_NONE]], %{{.*}}, %{{.*}}, %{{.*}}) : (!fir.ref<!fir.box<none>>, !fir.ref<!fir.box<none>>, i32, !fir.ref<i8>, i32) -> none
450468

451469
} // end of module

0 commit comments

Comments
 (0)