-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathconfig.cf.default
More file actions
45 lines (40 loc) · 1.26 KB
/
config.cf.default
File metadata and controls
45 lines (40 loc) · 1.26 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
[DB]
#Database connection settings.
#Connector: mysql
dbCONNECTOR = mysql
#Database user and password; left empty in this default file
#NOTE(review): once filled in, dbPASS is stored in plain text - presumably the
#filled-in copy of this file should be kept out of version control; confirm
dbUSER =
dbPASS =
dbSERVER = localhost
#Leave dbSOCKET empty for TCP connection
dbSOCKET = /var/run/mysqld/mysqld.sock
[S2]
#Database name. Needs to be created before executing the script
dbNAME = db_Pu_S2
#NOTE(review): presumably the location of the input data files; empty in this
#default file - confirm the expected path format against the reader
data_files =
#Number of cores for parallel processing
#Set to 0 to deactivate parallel processing
ncpu = 0
#Size of chunks for paper processing and database ingestion
chunksize = 100000
[FIS]
#Database name. Needs to be created before executing the script
dbNAME = db_Pr_FIS
#NOTE(review): presumably the folder where downloaded files are stored; empty
#in this default file - confirm against the reader
download_folder =
#Time to sleep between URL downloads. Increasing it facilitates a complete
#download in one execution, at the cost of increasing execution time
#NOTE(review): units are not stated here (presumably seconds) - confirm
ttsleep = 5
[BOE]
#Database name
#NOTE(review): presumably needs to be created beforehand, as stated for the
#S2 and FIS databases - confirm
dbNAME = db_Law_BOE
#Relative directory paths
#NOTE(review): presumably resolved against the working directory of the
#script, and holding XML files and lemma files respectively - confirm
xml_dir = data_Law_BOE/XML/
lemas_dir = data_Law_BOE/LEMAS/
[Lemmatizer]
#URL of the server that lemmatization requests are sent to
server = http://localhost:7777/en/annotations/
#Online demonstration service
#server = http://librairy.linkeddata.es/nlp/annotations/
#NOTE(review): presumably a stopword list file - confirm
stw_file = ./lemmatizer/lemafiles/stopwords/stop-words-english5.txt
#NOTE(review): presumably a file of term equivalences; empty in this default
#file - confirm against the reader
dict_eq_file =
#Comma-separated list of quoted part-of-speech tags
#NOTE(review): a parser such as Python configparser keeps the quotes as part
#of the value; presumably the reader strips or evaluates them - confirm
POS = "NOUN", "VERB", "ADJECTIVE"
#NOTE(review): presumably removes numeric tokens from the output - confirm
removenumbers = True
#If true, sentence information will be kept, which is necessary when training embedding models
keepSentence = True
#Number of threads that will concurrently send lemmatization requests to the server
concurrent_posts = 10