cuda.tile.floor
- cuda.tile.floor(x, /)
Compute the element-wise floor of a tile, rounding each element down to the nearest integer value.
Examples
tx = ct.full((4,), 3.7, dtype=ct.float32)
print(f"{ct.floor(tx):.1f}")
import cuda.tile as ct
import torch

@ct.kernel
def kernel():
    tx = ct.full((4,), 3.7, dtype=ct.float32)
    print(f"{ct.floor(tx):.1f}")

torch.cuda.init()
ct.launch(torch.cuda.current_stream(), (1,), kernel, ())
torch.cuda.synchronize()
Output
[3.0, 3.0, 3.0, 3.0]