1	fontfile	arialuni.ttf
2	fontname	Arial Unicode MS
3	database encoding	utf-8
4	database communication encoding	utf-8
5	content encoding	utf-8
6	browser version	1.0
7	build release	null
8	build date	2019-02-21
9	build user	dgoldhahn
10	build location	bender:/data/toolchain_2018/toolchain/external/Medusa
11	build file encoding	UTF-8
12	build system	Linux on amd64
13	build architecture model	64
14	build java version	10.0.2
15	release date	unknownDate
16	release user	null
17	corpus file	/data/toolchain_2018/toolchain/data/bul_wikipedia_2018_1M/05_Tables/bul_wikipedia_2018_1M.medusa.sorted
18	used memory	4294967296
19	de.uni_leipzig.asv.medusa.filter.sidx.IDXSentenceFilterImpl.n	1000000
20	de.uni_leipzig.asv.medusa.filter.sidx.IDXInvertedListFilterImpl.n	1000000
21	de.uni_leipzig.asv.medusa.filter.sidx.IDXInvertedSourceListFilterImpl.n	1000000
22	WORD_TYPES	690711
23	de.uni_leipzig.asv.medusa.filter.sidx.IDXSentenceFilterImpl.SIG_COOCCURRENCE_TOKENS	130976406
24	de.uni_leipzig.asv.medusa.filter.sidx.IDXNeighbourhoodFilterImpl.n	18051052
25	BOW_WORD_TOKENS	17436762
26	de.uni_leipzig.asv.medusa.filter.sidx.IDXNeighbourhoodFilterImpl.COOCCURRENCE_TYPES	777253
27	WORD_TOKENS	19051052
28	SOURCES	175793
29	de.uni_leipzig.asv.medusa.filter.sidx.IDXNeighbourhoodFilterImpl.SIG_COOCCURRENCE_TOKENS	11804622
30	de.uni_leipzig.asv.medusa.filter.sidx.IDXSentenceFilterImpl.SIG_COOCCURRENCE_TYPES	4129418
31	de.uni_leipzig.asv.medusa.filter.sidx.IDXSentenceFilterImpl.COOCCURRENCE_TYPES	12184324
32	de.uni_leipzig.asv.medusa.filter.sidx.IDXNeighbourhoodFilterImpl.SIG_COOCCURRENCE_TYPES	586168
33	SENTENCES	1000000
34	auto mwu detection enabled	false
35	duration of word numbers generation	0 hour(s) 0 min 52,170 sec
36	most frequent word	.
37	duration of executing de.uni_leipzig.asv.medusa.filter.sidx.IDXInvertedListFilterImpl	0 hour(s) 0 min 35,308 sec
38	duration of executing de.uni_leipzig.asv.medusa.filter.sidx.IDXSentenceFilterImpl	0 hour(s) 1 min 37,196 sec
39	duration of generation bow frequencies	0 hour(s) 0 min 0,982 sec
40	duration for generation wnc file	0 hour(s) 0 min 0,500 sec
41	duration of exporting de.uni_leipzig.asv.medusa.filter.sidx.IDXNeighbourhoodFilterImpl	0 hour(s) 0 min 3,146 sec
42	duration of exporting de.uni_leipzig.asv.medusa.filter.sidx.IDXInvertedListFilterImpl	0 hour(s) 0 min 4,178 sec
43	duration of executing de.uni_leipzig.asv.medusa.filter.sidx.IDXNeighbourhoodFilterImpl	0 hour(s) 0 min 17,957 sec
44	duration of executing de.uni_leipzig.asv.medusa.filter.sidx.IDXInvertedSourceListFilterImpl	0 hour(s) 0 min 0,188 sec
45	duration of wswn transformation 	0 hour(s) 0 min 2,908 sec
46	most frequent word's frequency	993006
47	duration of exporting de.uni_leipzig.asv.medusa.filter.sidx.IDXSentenceFilterImpl	0 hour(s) 0 min 35,930 sec
48	duration of tokenisation	0 hour(s) 0 min 48,911 sec
