Skip to content

Commit

Permalink
Update import of sdpa_with_kv_cache to custom_ops (#1470)
Browse files Browse the repository at this point in the history
  • Loading branch information
Jack-Khuu authored Jan 22, 2025
1 parent 45cd239 commit b2d8f2a
Showing 1 changed file with 1 addition and 1 deletion.
2 changes: 1 addition & 1 deletion torchchat/model.py
Original file line number Diff line number Diff line change
Expand Up @@ -1025,7 +1025,7 @@ def apply_rotary_emb(x: Tensor, freqs_cis: Tensor) -> Tensor:
# For quantized_decomposed ops
from executorch.kernels import quantized # no-qa
# For llama::sdpa_with_kv_cache.out, preprocess ops
- from executorch.extension.llm.custom_ops import sdpa_with_kv_cache # no-qa
+ from executorch.extension.llm.custom_ops import custom_ops # no-qa

class PTEModel(nn.Module):
def __init__(self, config, path) -> None:
Expand Down

0 comments on commit b2d8f2a

Please sign in to comment.