We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 9293b78 commit 85b7869 Copy full SHA for 85b7869
examples/models/llama2/runner/generation.py
@@ -17,6 +17,11 @@
17
from executorch.examples.models.llama2.tokenizer.tiktoken import Tokenizer
18
from executorch.extension.pybindings.portable_lib import _load_for_executorch
19
20
+from executorch.extension.pybindings import portable_lib # noqa # usort: skip
21
+
22
+# Note: sdpa_with_kv_cache must be imported after portable_lib; keep this import order.
23
+from executorch.extension.llm.custom_ops import sdpa_with_kv_cache # noqa # usort: skip
24
25
26
class CompletionPrediction(TypedDict, total=False):
27
generation: str
0 commit comments