1 parent 20b8f83 commit 7315894
examples/models/llama2/eval_llama_lib.py
@@ -44,8 +44,12 @@ def __init__(
         super().__init__(None, tokenizer, max_seq_length)
         self._model = model  # Expects model to be path to a .pte file
 
+        from executorch.extension.pybindings import portable_lib  # noqa
         from executorch.extension.pybindings.portable_lib import _load_for_executorch
-
+        # Note: import this after portable_lib
+        from executorch.extension.llm.custom_ops import sdpa_with_kv_cache  # noqa
+        from executorch.kernels import quantized
+
         self._et_model = _load_for_executorch(self._model)
         self._use_kv_cache = self._et_model.run_method("use_kv_cache")[0]
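For context, here is a minimal usage sketch (not part of the commit) showing the import order the diff establishes when loading a .pte program: portable_lib is imported first to bring in the core runtime bindings, and sdpa_with_kv_cache and quantized are imported afterwards so their kernels are registered before the program is loaded. The path "llama2.pte" is a placeholder.

# Minimal sketch; "llama2.pte" is an assumed placeholder path.
from executorch.extension.pybindings import portable_lib  # noqa  # core runtime bindings first
from executorch.extension.pybindings.portable_lib import _load_for_executorch

# Import these after portable_lib; they register the custom SDPA and
# quantized kernels that the exported program may reference.
from executorch.extension.llm.custom_ops import sdpa_with_kv_cache  # noqa
from executorch.kernels import quantized  # noqa

et_model = _load_for_executorch("llama2.pte")
use_kv_cache = et_model.run_method("use_kv_cache")[0]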