Skip to content

Commit

Permalink
Deal with whitespace tokens in nth-nearest perturbation
Browse files Browse the repository at this point in the history
  • Loading branch information
Acusick1 committed Jul 25, 2024
1 parent 1f36de7 commit 07f52e8
Showing 1 changed file with 9 additions and 2 deletions.
11 changes: 9 additions & 2 deletions attribution/token_perturbation.py
Original file line number Diff line number Diff line change
Expand Up @@ -58,10 +58,17 @@ def get_replacement_units(self, units_to_replace: list[Unit]) -> list[Unit]:
for unit in units_to_replace:
replacement_tokens = []
for token in unit:
token_id = self.tokenizer.encode(token, add_special_tokens=False)[0]
# Stripping whitespace token if present as it often results in a completely different replacement token
stripped_token = token.strip("Ġ")
token_id = self.tokenizer.encode(stripped_token, add_special_tokens=False)[0]
replacement_token_id = self.get_replacement_token(token_id)
replacement_token = self.tokenizer._convert_id_to_token(replacement_token_id)
replacement_tokens.append(f"Ġ{replacement_token}")

# Re-add whitespace prefix if necessary
if token.startswith("Ġ") and not replacement_token.startswith("Ġ"):
replacement_token = f"Ġ{replacement_token}"

replacement_tokens.append(replacement_token)

replacement_units.append(replacement_tokens)

Expand Down

0 comments on commit 07f52e8

Please sign in to comment.