Skip to content
6 changes: 6 additions & 0 deletions csrc/scheduler/pointwise.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -1040,6 +1040,12 @@ void schedulePointwise(Fusion* fusion, const PointwiseParams* pparams) {
auto output = entry.second;
inner_most_tensors.erase(output);
}
// IndexSelectOp supports vectorized load on lookupTv. It should be treated
Comment thread
jjsjann123 marked this conversation as resolved.
Outdated
// the same as a cached input: its output is erased from inner_most_tensors
// before that set is passed to inlineMost.
for (auto idx_sel : ir_utils::getOpsOfType<IndexSelectOp>(fusion)) {
inner_most_tensors.erase(idx_sel->output(0)->as<TensorView>());
Comment thread
naoyam marked this conversation as resolved.
}

inlineMost(inner_most_tensors);

scheduler_utils::promoteProducerMemoryTypes(fusion, cached_inputs);
Expand Down