-
Notifications
You must be signed in to change notification settings - Fork 1
/
Anonymiser.ini
26 lines (19 loc) · 1.96 KB
/
Anonymiser.ini
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
# Config file for Anonymiser
[Anonymiser]
# Each trailing comment states the documented default and/or the accepted options for that key; the value on the left is the setting currently in effect.
AnonymiseNames = true # default: false
AnonymiseNumbers = true # default: false
AnonymiseDates = true # default: false
AnonymiseTitlesOfWork = true # default: false
AnonymiseTitleCasedWordSequences = true # default: false
AnonymiseUrls = true # default: false
AnonymiseEmails = true # default: false
AnonymisePhoneNumbers = true # default: false
NamedEntityRecognitionModel = "en_core_web_trf" # options: en_core_web_sm (default), en_core_web_md, en_core_web_lg, en_core_web_trf. For the Russian language, the Russian model of the same size is selected automatically.
UseOnlyNumericReplacements = true # default: true - Set to "false" to allow letter-based replacements in the style "Person A", "Place B", etc. When letter-based replacements run out, numeric replacements are used anyway, so after "Place Z" there will be "Place 1", "Place 2", etc. By default, replacements like "Person 1", "Place 2", etc. are used from the start, since this allows more replacements in the same style.
Encoding = "auto" # options: "utf-8" (default), "auto"
CsvAnonymiseHeader = false # default: false - Whether to anonymise text in the header row of a CSV file. This setting also applies to Excel and OpenDocument Sheet files.
CsvDelimiter = "auto" # options: "auto", "," (default), ";", or any other character
CsvQuoteChar = "auto" # options: "auto", "double" (default), "single", or any other character. NB! For " use "double", for ' use "single" - do not write """ or "'".
CsvDoubleQuote = "auto" # options: "auto", "true" (default), "false" - When a quote character is specified and quoting is not QUOTE_NONE, indicates whether two consecutive quote characters INSIDE a field are interpreted as a single quote character.
CsvEscapeChar = "auto" # options: "auto", "none" (default), or any other character
# more config sections may be added later