import torch
from torch._C._nvfuser import Fusion, FusionDefinition, DataType
# Construct and define the fusion: t1 = 1.5 / t0.
fusion = Fusion()
with FusionDefinition(fusion) as fd:
    # NOTE(review): the IR printed for this repro shows a two-axis T0 --
    # confirm the argument passed to define_tensor matches that.
    t0 = fd.define_tensor(0)
    fd.add_input(t0)
    # Scalar constant used as the numerator of the division below.
    c0 = fd.define_constant(1.5)
    # Constant is the first operand, the tensor input the second.
    t1 = fd.Ops.div(c0, t0)
    fd.add_output(t1)

# Print the IR of the fusion defined above.
fusion.print_ir()
Inputs:
T0_g[ iS0{i0}, iS1{i2} ], float
Outputs:
T1_g[ iS2{i0}, iS3{i2} ], float
%kernel_math {
T1_g[ iS2{i0}, iS3{i2} ]
= T0_g[ iS0{i0}, iS1{i2} ] # this should be double(1.5)
/ T0_g[ iS0{i0}, iS1{i2} ];
}
.
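🐛 Describe the bug
When a scalar constant is the first operand of `fd.Ops.div`, the generated IR uses the tensor input for both operands: the kernel computes `T0 / T0` instead of `double(1.5) / T0`.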
Output:
The bug is at line 736 of pytorch/torch/csrc/jit/codegen/cuda/arith.cpp (commit a054b3e).
Versions
.