// Example CUDA Tile module with a single entry kernel. The kernel prints a
// banner, builds a tile of 128 pointers from one base pointer, loads a
// tile<128xf32> through those pointers, and prints the loaded tile.
cuda_tile.module @example_module {
  // %data_pr : a tile<ptr<f32>> (no shape dimensions) carrying the base pointer.
  entry @example_kernel(%data_pr : tile<ptr<f32>>) {
    // Banner message; the token produced by print_tko is left unbound here.
    print_tko "Running example module\n" -> token

    // Give the base pointer an explicit 1-element shape, then widen it to
    // 128 entries so it matches the shape of the index tile below.
    %base_1 = reshape %data_pr : tile<ptr<f32>> -> tile<1xptr<f32>>
    %base_128 = broadcast %base_1 : tile<1xptr<f32>> -> tile<128xptr<f32>>

    // Index tile of 128 i32 values.
    // NOTE(review): presumably the sequence 0..127 — confirm against the iota spec.
    %lane_idx = iota : tile<128xi32>

    // Combine the broadcast base pointers with the index tile to get 128 pointers.
    // NOTE(review): presumably offsets are in units of f32 elements, not bytes — confirm.
    %elem_ptrs = offset %base_128, %lane_idx : tile<128xptr<f32>>, tile<128xi32> -> tile<128xptr<f32>>

    // Load one f32 through each pointer. The op also yields a token, which is
    // not consumed by any later op in this kernel.
    // NOTE(review): `weak` is the ordering qualifier on this load — confirm its
    // exact semantics in the CUDA Tile IR spec.
    %values, %load_tok = load_ptr_tko weak %elem_ptrs : tile<128xptr<f32>> -> tile<128xf32>, token

    // Print the loaded tile using the "%f" format specifier.
    print_tko "Data: %f\n", %values : tile<128xf32> -> token
    return
  }
}
The CUDA Tile custom op `print` has been renamed to `print_tko` since version 13.2.
The example in README.md could be rewritten as