Fix llamacpp caching by making LlamaCppTokenizer pickleable
lapp0 committed May 29, 2024
1 parent 538f77a commit 4a99aa3
Showing 1 changed file with 10 additions and 0 deletions.
outlines/integrations/llamacpp.py (10 additions, 0 deletions)
@@ -66,6 +66,16 @@ def __init__(self, model: "Llama"):
     def convert_token_to_string(self, token: str) -> str:
         return token
 
+    def __getstate__(self):
+        """Allow tokenizer to be used as hash key by excluding self.decode"""
+        return (
+            sorted(self.vocabulary.items()),
+            self.eos_token_id,
+            self.eos_token,
+            self.pad_token_id,
+            sorted(self.special_tokens),
+        )
+
 
 class LogitsProcessor:
     """Bias LlamaCpp generation using a finite state machine.
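
Why excluding `self.decode` fixes caching: per the method's docstring, the tokenizer is used as a hash key for caching, and that hashing goes through pickling. The real `self.decode` is a callable tied to the `llama_cpp` model, which blocks default pickling, so `__getstate__` restricts the pickled state to plain, deterministically sorted data. Below is a minimal, self-contained sketch of the mechanism; `ToyTokenizer` and its field values are hypothetical stand-ins, not the outlines API:

```python
import hashlib
import pickle


class ToyTokenizer:
    """Hypothetical stand-in for LlamaCppTokenizer; not the outlines API."""

    def __init__(self):
        self.vocabulary = {"a": 0, "b": 1}
        self.eos_token_id = 1
        self.eos_token = "b"
        self.pad_token_id = -1
        self.special_tokens = {"b"}
        # Stands in for the real self.decode: a callable bound to the
        # llama_cpp model. Default pickling of __dict__ would fail on it.
        self.decode = lambda token_ids: ""

    def __getstate__(self):
        # Same shape as the committed method: only plain data, sorted so
        # the pickled bytes (and any hash derived from them) are stable.
        return (
            sorted(self.vocabulary.items()),
            self.eos_token_id,
            self.eos_token,
            self.pad_token_id,
            sorted(self.special_tokens),
        )


# pickle.dumps succeeds because __getstate__ bypasses the lambda; a digest
# of the resulting stable bytes can then serve as a cache key.
key = hashlib.sha256(pickle.dumps(ToyTokenizer())).hexdigest()
print(key)
```

Without `__getstate__`, `pickle.dumps` would walk `self.__dict__` and fail on the unpicklable callable; with it, the pickled bytes are stable across runs (given the same pickle protocol), so a digest of them works as a cache key.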
