presidio modulaire

This commit is contained in:
nBiqoz
2025-09-07 12:29:08 +02:00
parent 85d95d05e5
commit c62e5b92d5
42 changed files with 1802 additions and 324 deletions

View File

@@ -0,0 +1,33 @@
# NLP engine settings for Presidio: which spaCy pipelines to load and how
# the labels emitted by their NER components are translated into Presidio
# entity types.
nlp_configuration:
  nlp_engine_name: spacy
  # One pipeline per language code.
  models:
    - lang_code: en
      model_name: en_core_web_lg
    - lang_code: fr
      model_name: fr_core_news_lg
  # Global NER configuration (without confidence_thresholds)
  ner_model_configuration:
    # Model label -> Presidio entity type. Short and long spellings of the
    # same label are both listed.
    model_to_presidio_entity_mapping:
      PER: PERSON
      PERSON: PERSON
      ORG: ORGANIZATION
      ORGANIZATION: ORGANIZATION
      LOC: LOCATION
      LOCATION: LOCATION
      DATE: DATE_TIME
      TIME: DATE_TIME
      # MISC is deliberately left unmapped: it is listed in labels_to_ignore
      # below, and DATE_TIME is not a meaningful target for miscellaneous
      # entities.
    # Labels listed here are discarded instead of being reported.
    labels_to_ignore:
      # NOTE(review): LOCATION is also the target of the LOC/LOCATION
      # mappings above, so ignoring it here presumably drops every location
      # the model finds - confirm this is intended.
      - LOCATION
      - MISC
      - CARDINAL
      - EVENT
      - LANGUAGE
      - LAW
      - ORDINAL
      - PERCENT
      - PRODUCT
      - QUANTITY
      - WORK_OF_ART
    # Explicit empty list: no entity names are singled out as low-score.
    low_score_entity_names: []