Actualiser conf/default.yaml
This commit is contained in:
@@ -1,9 +1,9 @@
|
||||
# =====================================================================
|
||||
# CONFIGURATION PRESIDIO - v24
|
||||
# CONFIGURATION PRESIDIO - v25
|
||||
# =====================================================================
|
||||
supported_languages: [en, fr]
|
||||
|
||||
# 1. CONFIGURATION DU MOTEUR NLP
|
||||
# 1. CONFIGURATION DU MOTEUR NLP (INCHANGÉ)
|
||||
# =====================================================================
|
||||
nlp_configuration:
|
||||
nlp_engine_name: spacy
|
||||
@@ -30,12 +30,18 @@ nlp_configuration:
|
||||
LOCATION: 0.4
|
||||
ORGANIZATION: 0.55
|
||||
|
||||
# 2. CONFIGURATION DU REGISTRE DES DÉTECTEURS
|
||||
# 2. CONFIGURATION DU REGISTRE DES DÉTECTEURS (AVEC L'AJOUT POUR LES WARNINGS)
|
||||
# =====================================================================
|
||||
recognizer_registry:
|
||||
load_predefined_recognizers: true
|
||||
|
||||
recognizers:
|
||||
# --- On déclare le détecteur NLP de base ---
|
||||
- name: SpacyRecognizer
|
||||
supported_language: fr
|
||||
- name: SpacyRecognizer
|
||||
supported_language: en
|
||||
|
||||
|
||||
- name: FlexibleDateRecognizer
|
||||
supported_language: fr
|
||||
@@ -49,7 +55,6 @@ recognizer_registry:
|
||||
score: 1.0
|
||||
context: ["date", "né le", "signé le", "incident du"]
|
||||
|
||||
|
||||
- name: BelgianAddressRecognizer
|
||||
supported_language: fr
|
||||
supported_entity: BE_ADDRESS
|
||||
@@ -59,7 +64,6 @@ recognizer_registry:
|
||||
score: 1.0
|
||||
context: ["demeurant", "adresse", "siège social", "bureaux situés"]
|
||||
|
||||
|
||||
- name: BelgianPhoneRecognizer
|
||||
supported_language: fr
|
||||
supported_entity: BE_PHONE_NUMBER
|
||||
@@ -69,7 +73,6 @@ recognizer_registry:
|
||||
score: 0.95
|
||||
context: ["Tel", "Tél", "téléphone", "gsm", "mobile"]
|
||||
|
||||
|
||||
- name: SmartOrganizationRecognizer
|
||||
supported_language: fr
|
||||
supported_entity: ORGANIZATION
|
||||
@@ -82,7 +85,6 @@ recognizer_registry:
|
||||
score: 0.9
|
||||
context: ["société", "entreprise", "gérant de la"]
|
||||
|
||||
|
||||
- name: ProfessionalIdRecognizer
|
||||
supported_language: fr
|
||||
supported_entity: BE_PRO_ID
|
||||
@@ -92,7 +94,6 @@ recognizer_registry:
|
||||
score: 1.0
|
||||
context: ["expert-comptable"]
|
||||
|
||||
|
||||
- name: BelgianEnterpriseRecognizer
|
||||
supported_language: fr
|
||||
supported_entity: BE_ENTERPRISE_NUMBER
|
||||
@@ -102,7 +103,6 @@ recognizer_registry:
|
||||
score: 1.0
|
||||
context: ["BCE", "TVA", "intracommunautaire"]
|
||||
|
||||
|
||||
- name: EmailRecognizer
|
||||
supported_language: fr
|
||||
supported_entity: EMAIL_ADDRESS
|
||||
@@ -127,9 +127,10 @@ recognizer_registry:
|
||||
score: 0.95
|
||||
context: ["sécurité sociale", "insee", "nir"]
|
||||
|
||||
# 3. LISTE D'EXCLUSION (ALLOW LIST)
|
||||
# 3. LISTE D'EXCLUSION
|
||||
# =====================================================================
|
||||
allow_list:
|
||||
- Adresse
|
||||
- ADRESSE
|
||||
- Contrat
|
||||
- Document
|
||||
@@ -171,12 +172,14 @@ allow_list:
|
||||
- Taux
|
||||
- Valeur
|
||||
- Prix
|
||||
- Coordonnées
|
||||
- Témoins
|
||||
|
||||
# 4. CONFIGURATION DES TRANSFORMATIONS D'ANONYMISATION
|
||||
|
||||
# 4. CONFIGURATION DES TRANSFORMATIONS D'ANONYMISATION
|
||||
# =====================================================================
|
||||
anonymizer_config:
|
||||
default_anonymizers:
|
||||
# Entités de base
|
||||
PERSON: replace
|
||||
LOCATION: replace
|
||||
ORGANIZATION: replace
|
||||
@@ -194,7 +197,6 @@ anonymizer_config:
|
||||
IP_ADDRESS: replace
|
||||
|
||||
replacements:
|
||||
# Remplacements de base
|
||||
PERSON: "<PERSONNE>"
|
||||
LOCATION: "<LIEU>"
|
||||
ORGANIZATION: "<ORGANISATION>"
|
||||
@@ -206,7 +208,6 @@ anonymizer_config:
|
||||
BE_NATIONAL_REGISTER_NUMBER: "<NRN_BELGE>"
|
||||
FR_SOCIAL_SECURITY_NUMBER: "<NUM_SECU_FR>"
|
||||
BE_PHONE_NUMBER: "<TELEPHONE_BE>"
|
||||
# Ajout des remplacements pour les nouvelles entités SÛRES
|
||||
FLEXIBLE_DATE: "<DATE>"
|
||||
BE_ADDRESS: "<ADRESSE_BELGE>"
|
||||
BE_PRO_ID: "<ID_PROFESSIONNEL>"
|
||||
|
||||
Reference in New Issue
Block a user