-
Notifications
You must be signed in to change notification settings - Fork 965
Expand file tree
/
Copy path__init__.py
More file actions
220 lines (200 loc) · 8.08 KB
/
__init__.py
File metadata and controls
220 lines (200 loc) · 8.08 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
"""Predefined recognizers package. Holds all the default recognizers."""
# Transformers recognizer (absolute import), then Australia recognizers
from presidio_analyzer.predefined_recognizers.nlp_engine_recognizers.transformers_recognizer import ( # noqa: E501
TransformersRecognizer,
)
from .country_specific.australia.au_abn_recognizer import AuAbnRecognizer
from .country_specific.australia.au_acn_recognizer import AuAcnRecognizer
from .country_specific.australia.au_medicare_recognizer import AuMedicareRecognizer
from .country_specific.australia.au_tfn_recognizer import AuTfnRecognizer
# Finland recognizers
from .country_specific.finland.fi_personal_identity_code_recognizer import (
FiPersonalIdentityCodeRecognizer,
)
# Germany recognizers
from .country_specific.germany.de_bsnr_recognizer import DeBsnrRecognizer
from .country_specific.germany.de_commercial_register_recognizer import (
DeCommercialRegisterRecognizer,
)
from .country_specific.germany.de_driver_license_recognizer import (
DeDriverLicenseRecognizer,
)
from .country_specific.germany.de_kvnr_recognizer import DeKvnrRecognizer
from .country_specific.germany.de_lanr_recognizer import DeLanrRecognizer
from .country_specific.germany.de_license_plate_recognizer import (
DeLicensePlateRecognizer,
)
from .country_specific.germany.de_passport_recognizer import DePassportRecognizer
from .country_specific.germany.de_personal_id_recognizer import DePersonalIdRecognizer
from .country_specific.germany.de_postal_code_recognizer import DePostalCodeRecognizer
from .country_specific.germany.de_social_security_recognizer import (
DeSocialSecurityRecognizer,
)
from .country_specific.germany.de_tax_id_recognizer import DeTaxIdRecognizer
from .country_specific.germany.de_telematik_id_recognizer import DeTelematikIdRecognizer
from .country_specific.germany.de_vat_code_recognizer import DeVatCodeRecognizer
# India recognizers
from .country_specific.india import (
InVehicleRegistrationRecognizer,
)
from .country_specific.india.in_aadhaar_recognizer import InAadhaarRecognizer
from .country_specific.india.in_gstin_recognizer import InGstinRecognizer
from .country_specific.india.in_pan_recognizer import InPanRecognizer
from .country_specific.india.in_passport_recognizer import InPassportRecognizer
from .country_specific.india.in_voter_recognizer import InVoterRecognizer
# Italy recognizers
from .country_specific.italy.it_driver_license_recognizer import (
ItDriverLicenseRecognizer,
)
from .country_specific.italy.it_fiscal_code_recognizer import ItFiscalCodeRecognizer
from .country_specific.italy.it_identity_card_recognizer import ItIdentityCardRecognizer
from .country_specific.italy.it_passport_recognizer import ItPassportRecognizer
from .country_specific.italy.it_vat_code import ItVatCodeRecognizer
# Korea recognizers
from .country_specific.korea.kr_brn_recognizer import KrBrnRecognizer
from .country_specific.korea.kr_driver_license_recognizer import (
KrDriverLicenseRecognizer,
)
from .country_specific.korea.kr_frn_recognizer import KrFrnRecognizer
from .country_specific.korea.kr_passport_recognizer import KrPassportRecognizer
from .country_specific.korea.kr_rrn_recognizer import KrRrnRecognizer
# Poland recognizers
from .country_specific.poland.pl_pesel_recognizer import PlPeselRecognizer
# Singapore recognizers
from .country_specific.singapore.sg_fin_recognizer import SgFinRecognizer
from .country_specific.singapore.sg_uen_recognizer import SgUenRecognizer
# Spain recognizers
from .country_specific.spain.es_nie_recognizer import EsNieRecognizer
from .country_specific.spain.es_nif_recognizer import EsNifRecognizer
# Thai recognizers
from .country_specific.thai.th_tnin_recognizer import ThTninRecognizer
# UK recognizers
from .country_specific.uk.uk_nhs_recognizer import NhsRecognizer
from .country_specific.uk.uk_nino_recognizer import UkNinoRecognizer
from .country_specific.uk.uk_postcode_recognizer import UkPostcodeRecognizer
# US recognizers
from .country_specific.us.aba_routing_recognizer import AbaRoutingRecognizer
from .country_specific.us.medical_license_recognizer import MedicalLicenseRecognizer
from .country_specific.us.us_bank_recognizer import UsBankRecognizer
from .country_specific.us.us_driver_license_recognizer import UsLicenseRecognizer
from .country_specific.us.us_itin_recognizer import UsItinRecognizer
from .country_specific.us.us_mbi_recognizer import UsMbiRecognizer
from .country_specific.us.us_npi_recognizer import UsNpiRecognizer
from .country_specific.us.us_passport_recognizer import UsPassportRecognizer
from .country_specific.us.us_ssn_recognizer import UsSsnRecognizer
# Generic recognizers
from .generic.credit_card_recognizer import CreditCardRecognizer
from .generic.crypto_recognizer import CryptoRecognizer
from .generic.date_recognizer import DateRecognizer
from .generic.email_recognizer import EmailRecognizer
from .generic.iban_recognizer import IbanRecognizer
from .generic.ip_recognizer import IpRecognizer
from .generic.mac_recognizer import MacAddressRecognizer
from .generic.phone_recognizer import PhoneRecognizer
from .generic.url_recognizer import UrlRecognizer
# NER recognizers
from .ner.gliner_recognizer import GLiNERRecognizer
from .ner.huggingface_ner_recognizer import HuggingFaceNerRecognizer
from .ner.medical_ner_recognizer import MedicalNERRecognizer
# NLP Engine recognizers
from .nlp_engine_recognizers.spacy_recognizer import SpacyRecognizer
from .nlp_engine_recognizers.stanza_recognizer import StanzaRecognizer
from .third_party.ahds_recognizer import AzureHealthDeidRecognizer
# Third-party recognizers (the AzureHealthDeidRecognizer import above is one too)
from .third_party.azure_ai_language import AzureAILanguageRecognizer
from .third_party.azure_openai_langextract_recognizer import (
AzureOpenAILangExtractRecognizer,
)
from .third_party.basic_langextract_recognizer import BasicLangExtractRecognizer
from .third_party.langextract_recognizer import LangExtractRecognizer
# Recognizer class names, kept as strings rather than class objects.
# Each entry matches the name of a class imported at the top of this module.
# NOTE(review): presumably consumers resolve these names to classes — confirm
# against the callers before changing the order or the contents.
PREDEFINED_RECOGNIZERS = [
    "PhoneRecognizer",
    "CreditCardRecognizer",
    "CryptoRecognizer",
    "DateRecognizer",
    "EmailRecognizer",
    "IpRecognizer",
    "IbanRecognizer",
    "MedicalLicenseRecognizer",
    "UrlRecognizer",
]
# Lookup table: NLP engine key -> recognizer class imported above for it.
# The values are the classes themselves, not instances.
NLP_RECOGNIZERS = {
    "spacy": SpacyRecognizer,
    "stanza": StanzaRecognizer,
    "transformers": TransformersRecognizer,
}
# Public API of the package: the names exported by
# ``from <package> import *``.
# Every recognizer class imported above is listed, together with the two
# module-level constants NLP_RECOGNIZERS and PREDEFINED_RECOGNIZERS.
# The existing order is kept as-is; append new recognizers when adding them.
__all__ = [
    "AbaRoutingRecognizer",
    "CreditCardRecognizer",
    "DeBsnrRecognizer",
    "DeCommercialRegisterRecognizer",
    "DeDriverLicenseRecognizer",
    "DeKvnrRecognizer",
    "DeLanrRecognizer",
    "DeLicensePlateRecognizer",
    "DePassportRecognizer",
    "DePersonalIdRecognizer",
    "DePostalCodeRecognizer",
    "DeSocialSecurityRecognizer",
    "DeTaxIdRecognizer",
    "DeTelematikIdRecognizer",
    "DeVatCodeRecognizer",
    "CryptoRecognizer",
    "DateRecognizer",
    "EmailRecognizer",
    "IbanRecognizer",
    "IpRecognizer",
    "NhsRecognizer",
    "MedicalLicenseRecognizer",
    "MacAddressRecognizer",
    "PhoneRecognizer",
    "SgFinRecognizer",
    "UrlRecognizer",
    "UsBankRecognizer",
    "UsItinRecognizer",
    "UsLicenseRecognizer",
    "UsMbiRecognizer",
    "UsNpiRecognizer",
    "UsPassportRecognizer",
    "UsSsnRecognizer",
    "EsNifRecognizer",
    "SpacyRecognizer",
    "StanzaRecognizer",
    "NLP_RECOGNIZERS",
    # Previously missing: the sibling public constant defined in this module.
    "PREDEFINED_RECOGNIZERS",
    "AuAbnRecognizer",
    "AuAcnRecognizer",
    "AuTfnRecognizer",
    "AuMedicareRecognizer",
    "TransformersRecognizer",
    "ItDriverLicenseRecognizer",
    "ItFiscalCodeRecognizer",
    "ItVatCodeRecognizer",
    "ItIdentityCardRecognizer",
    "ItPassportRecognizer",
    "InPanRecognizer",
    "GLiNERRecognizer",
    "HuggingFaceNerRecognizer",
    "PlPeselRecognizer",
    "AzureAILanguageRecognizer",
    "InAadhaarRecognizer",
    "InGstinRecognizer",
    "InVehicleRegistrationRecognizer",
    "SgUenRecognizer",
    "InVoterRecognizer",
    "InPassportRecognizer",
    "FiPersonalIdentityCodeRecognizer",
    "EsNieRecognizer",
    "UkNinoRecognizer",
    "UkPostcodeRecognizer",
    "AzureHealthDeidRecognizer",
    "KrBrnRecognizer",
    "KrRrnRecognizer",
    "KrDriverLicenseRecognizer",
    "KrFrnRecognizer",
    "ThTninRecognizer",
    "LangExtractRecognizer",
    "AzureOpenAILangExtractRecognizer",
    "BasicLangExtractRecognizer",
    "KrPassportRecognizer",
    "MedicalNERRecognizer",
]