Temporarily remove language selection (#10097)

Adapting Microsoft Presidio to other languages requires a bit more work, so for now it is a good idea to remove the language option in order to avoid errors and confusion. See https://microsoft.github.io/presidio/analyzer/languages/ for details. I will handle different languages after the weekend 😄
2025-08-15 07:36:08 +00:00 · 2023-09-01 20:30:48 +02:00 · 2023-09-01 20:30:48 +02:00 · b5a74fb973
commit b5a74fb973
parent 71c418725f
1 changed files with 1 additions and 4 deletions
--- a/libs/experimental/langchain_experimental/data_anonymizer/presidio.py
+++ b/libs/experimental/langchain_experimental/data_anonymizer/presidio.py
@@ -18,14 +18,12 @@ class PresidioAnonymizer(AnonymizerBase):
    def __init__(
        self,
        analyzed_fields: Optional[List[str]] = None,
        language: str = "en",
        operators: Optional[Dict[str, OperatorConfig]] = None,
    ):
        """
        Args:
            analyzed_fields: List of fields to detect and then anonymize.
                Defaults to all entities supported by Microsoft Presidio.
            language: Language to use for analysis. Defaults to english.
            operators: Operators to use for anonymization.
                Operators allow for custom anonymization of detected PII.
                Learn more:
@@ -54,7 +52,6 @@ class PresidioAnonymizer(AnonymizerBase):
            if analyzed_fields is not None
            else list(get_pseudoanonymizer_mapping().keys())
        )
        self.language = language
        self.operators = (
            operators
            if operators is not None
@@ -72,7 +69,7 @@ class PresidioAnonymizer(AnonymizerBase):
        results = self._analyzer.analyze(
            text,
            entities=self.analyzed_fields,
-            language=self.language,
+            language="en",
        )
        return self._anonymizer.anonymize(