-
Notifications
You must be signed in to change notification settings - Fork 16
/
config.sh
executable file
·27 lines (23 loc) · 989 Bytes
/
config.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
#!/bin/bash
#
# Environment configuration for training and testing stanza modules.
#
# Every variable below is exported. All paths are relative (they start with
# "../data"), so they resolve against the working directory of whichever
# process ends up reading them.

# --- Raw input data ---------------------------------------------------------

# UDBASE: location of the UD data folder. The data should be in CoNLL-U format.
# Details: http://universaldependencies.org/conll18/data.html (CoNLL-18 UD data)
export UDBASE="../data/udbase"

# NERBASE: location of the NER data folder. The data should be in BIO format.
# Details: https://www.aclweb.org/anthology/W03-0419.pdf (CoNLL-03 NER paper)
export NERBASE="../data/nerbase"

# --- Processed training/evaluation files ------------------------------------

# DATA_ROOT is the parent directory; each *_DATA_DIR below is a subdirectory
# of it.
export DATA_ROOT="../data/processed"
export TOKENIZE_DATA_DIR="${DATA_ROOT}/tokenize"
export MWT_DATA_DIR="${DATA_ROOT}/mwt"
export LEMMA_DATA_DIR="${DATA_ROOT}/lemma"
export POS_DATA_DIR="${DATA_ROOT}/pos"
export DEPPARSE_DATA_DIR="${DATA_ROOT}/depparse"
export ETE_DATA_DIR="${DATA_ROOT}/ete"
export NER_DATA_DIR="${DATA_ROOT}/ner"
export CHARLM_DATA_DIR="${DATA_ROOT}/charlm"

# --- External resources -----------------------------------------------------

# WORDVEC_DIR: directory holding external word vector data.
export WORDVEC_DIR="../data/wordvec"