-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathconfig.yaml
60 lines (56 loc) · 1.42 KB
/
config.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
# PHI policy: every category maps each of its subtypes to an action keyword.
# The action keywords used in this file are: keep, shift, replace.
# NOTE(review): the nesting was reconstructed from a flattened listing in which
# AGE, DATE, PROFESSION and OTHER appeared as duplicate sibling keys (most
# parsers silently keep only the last one) - confirm against the schema the
# consuming code expects.
PHI:
  AGE:
    AGE: keep
  DATE:
    DATE: shift
    BIRTHDATE: shift
  CONTACT:
    PHONE: replace
    FAX: replace
    EMAIL: replace
    URL: replace
    IPADDRESS: replace
  ID:
    PATIENTID: replace
    STUDYID: replace
    OTHER: replace
  LOCATION:
    ORGANIZATION: replace
    HOSPITAL: replace
    STREET: replace
    CITY: replace
    ZIP: replace
    COUNTRY: replace
    STATE: replace
    OTHER: replace
  NAME:
    PATIENT: replace
    STAFF: replace
    OTHER: replace
  PROFESSION:
    PROFESSION: replace
    # NOTE(review): STATUS is assumed to belong to PROFESSION because it
    # directly follows it in the listing - TODO confirm.
    STATUS: replace
  OTHER:
    OTHER: replace
# Offset settings: location of the offset table plus the positive/negative
# boundaries for dates and ages.
# NOTE(review): the unit of the boundary values is not stated in this file
# (presumably days for DATE_* and years for AGE_*) - TODO confirm.
OFFSET:
  # The offset table must have the format "patientid,timeoffset";
  # timeoffset must be specified in milliseconds.
  TABLE_PATH: /path/to/offset_table
  DATE_POSITIVE_BOUNDARY: 15
  DATE_NEGATIVE_BOUNDARY: -14
  AGE_POSITIVE_BOUNDARY: 3
  AGE_NEGATIVE_BOUNDARY: -2
# Result settings: path of the JSON input bundle and the paths for the JSON
# and plain-text results.
# The /path/to/... values look like placeholders; replace them before use.
RESULTS:
  JSON_INPUT_PATH: /path/to/json_bundle
  JSON_OUTPUT_PATH: /path/to/json_result
  TXT_OUTPUT_PATH: /path/to/text_result
# Input settings: format and location of the documents to process.
# NOTE(review): TS presumably points to the type system that accompanies the
# CAS input - TODO confirm.
INPUT:
  FORMAT: cas
  PATH: /path/to/cas
  TS: /path/to/ts
  # File names must have the structure
  # "Patient:patientid_ResourceType:resourceid.dataending",
  # for example "Patient:0a1a3cd_Observation:7d7bcb.xmi".
  # The name of the resource type can be customized with this parameter.
  RESOURCE_TYPE: Observation
# Names of the model, the tokenizer and the dataset.
# NOTE(review): DATASET: Dataset_Name looks like a placeholder - confirm the
# real dataset name before use.
NAMES:
  MODEL: bert-base-multilingual-cased-ner-hrl_bert-base-multilingual-cased-ner-hrl
  TOKENIZER: Davlan/bert-base-multilingual-cased-ner-hrl
  DATASET: Dataset_Name