File size: 1,148 Bytes
a8f12f6
764e30e
a8f12f6
 
 
 
 
764e30e
 
 
1915c66
a8f12f6
764e30e
a8f12f6
764e30e
a8f12f6
 
764e30e
a8f12f6
 
764e30e
a8f12f6
 
1915c66
fd20bd2
764e30e
fd20bd2
1915c66
a8f12f6
764e30e
a8f12f6
 
1915c66
764e30e
 
a8f12f6
 
764e30e
a8f12f6
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
import logging
from services.regex_pii_remover import RegexPIIRemover

logger = logging.getLogger(__name__)


class FileService:
    def __init__(self):
        """Initialize file service with PII remover"""
        self.pii_remover = RegexPIIRemover()
        logger.info("FileService initialized")
    
    def remove_pii(self, text: str) -> tuple[str, int]:
        """
        Remove PII from text using regex patterns
        
        Args:
            text: Input text containing potential PII
            
        Returns:
            tuple: (cleaned_text, pii_count)
        """
        try:
            logger.info(f"Starting PII removal (text length: {len(text)})")
            
            cleaned_text, pii_count = self.pii_remover.remove_pii(text)
            
            logger.info(f"PII removal complete: {pii_count} entities removed")
            
            return cleaned_text, pii_count
            
        except Exception as e:
            logger.error(f"Error during PII removal: {str(e)}")
            # Return original text if PII removal fails
            return text, 0


# Global instance
file_service = FileService()