Files
Presidio/conf/recognizers/Business/french/siret_siren.yaml
2025-09-15 19:04:38 +02:00

18 lines
641 B
YAML

# Recognizer for French SIRET/SIREN business identifiers.
#
# Declares one pattern-based recognizer with three regex patterns:
#   - a 14-digit number grouped 3-3-3-5 (named "SIRET complet"),
#   - a 9-digit number grouped 3-3-3 (named "SIREN"),
#   - the 14-digit form introduced by a literal "SIRET" label.
# All matches are reported under the single entity SIRET_SIREN_FRANCAIS.
#
# The regexes are double-quoted YAML scalars, so every "\\" below is one
# literal backslash in the value handed to the regex engine.
recognizer_registry:
  recognizers:
    - name: FrenchSIRETRecognizer
      supported_language: fr
      supported_entity: SIRET_SIREN_FRANCAIS
      patterns:
        # 14 digits as 3-3-3-5; each separator is an optional single
        # whitespace character, so both "12345678912345" and
        # "123 456 789 12345" match.
        - name: SIRET complet
          regex: "\\b[0-9]{3}\\s?[0-9]{3}\\s?[0-9]{3}\\s?[0-9]{5}\\b"
          score: 0.9
        # 9 digits as 3-3-3 with optional single-whitespace separators.
        # NOTE(review): this matches any standalone 9-digit number and also
        # the first 9 digits of a space-separated 14-digit match; no
        # checksum is expressed here. Confirm that 0.85 is the intended
        # base score for such a broad pattern.
        - name: SIREN
          regex: "\\b[0-9]{3}\\s?[0-9]{3}\\s?[0-9]{3}\\b"
          score: 0.85
        # Literal "SIRET" label, optional colon, then the 3-3-3-5 grouping
        # with mandatory whitespace separators. The label itself is part of
        # the matched text.
        - name: SIRET avec espaces
          regex: "\\bSIRET\\s*:?\\s*[0-9]{3}\\s[0-9]{3}\\s[0-9]{3}\\s[0-9]{5}\\b"
          score: 0.95
      # Context words associated with this recognizer.
      # NOTE(review): placed at recognizer level (sibling of `patterns`);
      # the original nesting was lost, so confirm against the loader.
      context:
        - "SIRET"
        - "SIREN"
        - "établissement"
        - "entreprise"
        - "société"