bigdata - Revision 24: /opennlp/trunk/leipzig/data
..
afr-za_web_2015_100K-sentences.txt
afr-za_web_2015_3M-sentences.txt
afr_newscrawl_2012_300K-sentences.txt
afr_wikipedia_2016_300K-sentences.txt
amh_community_2017-sentences.txt
amh_wikipedia_2014_30K-sentences.txt
amh_wikipedia_2016_30K-sentences.txt
ara-ae_web_2015_300K-sentences.txt
ara-sy_newscrawl_2012_300K-sentences.txt
ara_news_2011_1M-sentences.txt
ara_wikipedia_2016_1M-sentences.txt
asm_community_2017-sentences.txt
asm_wikipedia_2014_30K-sentences.txt
asm_wikipedia_2016_30K-sentences.txt
ast_wikipedia_2016_100K-sentences.txt
aze_newscrawl_2013_3M-sentences.txt
aze_wikipedia_2016_300K-sentences.txt
azj-az_web_2015_1M-sentences.txt
azj_wikipedia_2007_10K-sentences.txt
bak_newscrawl_2011_100K-sentences.txt
bak_wikipedia_2016_100K-sentences.txt
ban-id_web_2013_30K-sentences.txt
ban_community_2017-sentences.txt
bel-by_web_2015_300K-sentences.txt
bel_news_2011_300K-sentences.txt
bel_newscrawl_2011_1M-sentences.txt
bel_wikipedia_2016_300K-sentences.txt
ben-bd_web_2014_100K-sentences.txt
ben_newscrawl_2011_100K-sentences.txt
ben_wikipedia_2011_100K-sentences.txt
bih_wikipedia_2016_10K-sentences.txt
bos_newscrawl_2011_300K-sentences.txt
bos_wikipedia_2016_300K-sentences.txt
bre_wikipedia_2016_100K-sentences.txt
bul_news_2007_100K-sentences.txt
bul_newscrawl_2011_1M-sentences.txt
bul_wikipedia_2016_1M-sentences.txt
cat-ad_web_2015_300K-sentences.txt
cat_newscrawl_2011_300K-sentences.txt
cat_wikipedia_2016_3M-sentences.txt
ceb_wikipedia_2016_1M-sentences.txt
ces-eu_web_2014_1M-sentences.txt
ces_news_2005-2007_1M-sentences.txt
ces_newscrawl_2011_1M-sentences.txt
ces_wikipedia_2016_1M-sentences.txt
che_wikipedia_2016_100K-sentences.txt
cmn_wikipedia_2012_300K-sentences.txt
cym_wikipedia_2016_100K-sentences.txt
dan-dk_web_2014_1M-sentences.txt
dan_mixed_2014_1M-sentences.txt
dan_news_2007_1M-sentences.txt
dan_newscrawl_2011_1M-sentences.txt
dan_wikipedia_2016_1M-sentences.txt
deu_news_2015_3M-sentences.txt
deu_wikipedia_2016_3M-sentences.txt
div-mv_web_2016_1M-sentences.txt
div_newscrawl_2015_300K-sentences.txt
ekk_wikipedia_2016_300K-sentences.txt
ell_news_2011_300K-sentences.txt
ell_newscrawl_2011_1M-sentences.txt
ell_web_2011_1M-sentences.txt
ell_wikipedia_2016_1M-sentences.txt
eng_news_2015_3M-sentences.txt
eng_wikipedia_2012_3M-sentences.txt
epo_mixed_2012_1M-sentences.txt
epo_web_2012_1M-sentences.txt
epo_wikipedia_2016_300K-sentences.txt
est_news_2014_300K-sentences.txt
est_newscrawl_2011_1M-sentences.txt
eus_newscrawl_2012_300K-sentences.txt
eus_web_2002_300K-sentences.txt
eus_wikipedia_2016_300K-sentences.txt
fao_mixed_2013_300K-sentences.txt
fao_web_2013_300K-sentences.txt
fas_newscrawl_2011_1M-sentences.txt
fas_wikipedia_2012_300K-sentences.txt
fin_news_2005-2007_300K-sentences.txt
fin_newscrawl_2011_1M-sentences.txt
fin_web_2002_1M-sentences.txt
fin_wikipedia_2016_3M-sentences.txt
fra_mixed_2009_1M-sentences.txt
fra_news_2010_1M-sentences.txt
fra_wikipedia_2010_1M-sentences.txt
fry_newscrawl_2014_100K-sentences.txt
fry_wikipedia_2016_100K-sentences.txt
gle_newscrawl_2014_300K-sentences.txt
glg_wikipedia_2016_300K-sentences.txt
gom_community_2017-sentences.txt
gom_newscrawl_2011_30K-sentences.txt
gom_wikipedia_2016_10K-sentences.txt
gsw_wikipedia_2016_100K-sentences.txt
guj_newscrawl_2011_300K-sentences.txt
guj_wikipedia_2016_100K-sentences.txt
hat-ht_web_2015_30K-sentences.txt
hat_community_2017-sentences.txt
heb_newscrawl_2011_1M-sentences.txt
heb_wikipedia_2016_1M-sentences.txt
hin-in_web_2015_3M-sentences.txt
hin_news_2011_1M-sentences.txt
hin_newscrawl_2012_1M-sentences.txt
hin_wikipedia_2016_300K-sentences.txt
hrv_newscrawl_2011_1M-sentences.txt
hrv_wikipedia_2016_1M-sentences.txt
hun_mixed_2012_1M-sentences.txt
hun_newscrawl_2011_1M-sentences.txt
hun_wikipedia_2016_3M-sentences.txt
hye-am_web_2015_1M-sentences.txt
hye_newscrawl_2011_100K-sentences.txt
hye_wikipedia_2016_300K-sentences.txt
ind-id_web_2015_3M-sentences.txt
ind_mixed_2012_1M-sentences.txt
ind_news_2012_300K-sentences.txt
ind_newscrawl_2012_1M-sentences.txt
ind_wikipedia_2016_1M-sentences.txt
isl-is_web_2015_3M-sentences.txt
isl_mixed_2011_tagged_1M-sentences.txt
isl_newscrawl_2011_1M-sentences.txt
isl_wikipedia_2016_100K-sentences.txt
ita_news_2010_1M-sentences.txt
ita_web_2011_1M-sentences.txt
ita_wikipedia_2016_3M-sentences.txt
jav_wikipedia_2016_100K-sentences.txt
jpn_news_2005-2008_1M-sentences.txt
kan_wikipedia_2016_300K-sentences.txt
kas_community_2017-sentences.txt
kat_newscrawl_2011_300K-sentences.txt
kat_wikipedia_2016_300K-sentences.txt
kaz_newscrawl_2011_100K-sentences.txt
kaz_wikipedia_2016_300K-sentences.txt
khm_community_2017-sentences.txt
kir_newscrawl_2011_300K-sentences.txt
kir_wikipedia_2016_300K-sentences.txt
knn-in_web_2015_10K-sentences.txt
knn_community_2017-sentences.txt
kor_news_2007_1M-sentences.txt
kor_wikipedia_2016_1M-sentences.txt
lao_community_2017-sentences.txt
lao_community_2021-sentences.txt
lat_wikipedia_2016_100K-sentences.txt
lav_newscrawl_2011_1M-sentences.txt
lim_wikipedia_2016_100K-sentences.txt
lit-lt_web_2014_3M-sentences.txt
lit_newscrawl_2011_1M-sentences.txt
lit_wikipedia_2016_300K-sentences.txt
ltz_wikipedia_2016_100K-sentences.txt
lvs_wikipedia_2016_300K-sentences.txt
mal_newscrawl_2011_100K-sentences.txt
mar_news_2010_300K-sentences.txt
mar_newscrawl_2011_100K-sentences.txt
mar_wikipedia_2016_100K-sentences.txt
mhr_wikipedia_2014_10K-sentences.txt
mhr_wikipedia_2016_30K-sentences.txt
min_wikipedia_2016_100K-sentences.txt
mkd_newscrawl_2011_300K-sentences.txt
mkd_newscrwal_2011_300K-sentences.txt
mkd_wikipedia_2016_300K-sentences.txt
mlt_newscrawl_2012_100K-sentences.txt
mlt_web_2012_300K-sentences.txt
mon_wikipedia_2016_100K-sentences.txt
mri_web_2011_100K-sentences.txt
msa_newscrawl_2011_100K-sentences.txt
msa_newscrwal_2011_100K-sentences.txt
msa_wikipedia_2016_300K-sentences.txt
mya_community_2017-sentences.txt
nan_wikipedia_2016_100K-sentences.txt
nds_wikipedia_2016_100K-sentences.txt
nep_news_2010_300K-sentences.txt
nep_wikipedia_2016_100K-sentences.txt
new_wikipedia_2010_30K-sentences.txt
new_wikipedia_2016_30K-sentences.txt
nld_mixed_2012_1M-sentences.txt
nld_wikipedia_2016_3M-sentences.txt
nno-no_web_2013_300K-sentences.txt
nno_wikipedia_2016_300K-sentences.txt
nob_news_2013_1M-sentences.txt
nob_web_2002_1M-sentences.txt
nob_wikipedia_2014_1M-sentences.txt
oci_wikipedia_2016_100K-sentences.txt
ori_community_2017-sentences.txt
ori_wikipedia_2014_30K-sentences.txt
ori_wikipedia_2016_30K-sentences.txt
pan_wikipedia_2016_100K-sentences.txt
pes-ir_web_2011_100K-sentences.txt
pes_wikipedia_2016_1M-sentences.txt
plt_wikipedia_2016_100K-sentences.txt
pnb_wikipedia_2016_100K-sentences.txt
pol_news_2008_1M-sentences.txt
pol_newscrawl_2011_1M-sentences.txt
pol_wikipedia_2016_3M-sentences.txt
por-pt_web_2014_1M-sentences.txt
por_newscrawl_2011_1M-sentences.txt
por_wikipedia_2016_3M-sentences.txt
pus_newscrawl_2011_100K-sentences.txt
ron_newscrawl_2011_1M-sentences.txt
ron_web_2011_1M-sentences.txt
ron_wikipedia_2011_300K-sentences.txt
rus_news_2010_1M-sentences.txt
rus_wikipedia_2016_3M-sentences.txt
san_wikipedia_2016_100K-sentences.txt
sin_wikipedia_2016_100K-sentences.txt
slk-sk_web_2014_1M-sentences.txt
slk_newscrawl_2011_1M-sentences.txt
slk_wikipedia_2016_300K-sentences.txt
slv-si_web_2014_1M-sentences.txt
slv_newscrawl_2011_1M-sentences.txt
slv_wikipedia_2016_300K-sentences.txt
som_newscrawl_2011_100K-sentences.txt
spa_news_2011_1M-sentences.txt
spa_newscrawl_2011_1M-sentences.txt
spa_wikipedia_2016_3M-sentences.txt
sqi_wikipedia_2016_300K-sentences.txt
srp_wikipedia_2016_1M-sentences.txt
sun-id_web_2013_300K-sentences.txt
swa_wikipedia_2016_100K-sentences.txt
swe_news_2007_1M-sentences.txt
swe_web_2002_1M-sentences.txt
swe_wikipedia_2016_3M-sentences.txt
tam_newscrawl_2011_1M-sentences.txt
tam_wikipedia_2016_300K-sentences.txt
tat_mixed_2015_1M-sentences.txt
tat_news_2015_1M-sentences.txt
tat_wikipedia_2016_100K-sentences.txt
tel_newscrawl_2011_300K-sentences.txt
tel_wikipedia_2016_300K-sentences.txt
tgk_newscrawl_2011_100K-sentences.txt
tgk_wikipedia_2016_100K-sentences.txt
tgl_newscrwal_2011_300K-sentences.txt
tgl_wikipedia_2016_100K-sentences.txt
tha_newscrawl_2011_100K-sentences.txt
tuk-tm_web_2015_30K-sentences.txt
tuk-tm_web_2016_100K-sentences.txt
tuk_community_2017-sentences.txt
tuk_wikipedia_2016_30K-sentences.txt
tur_mixed_2014_1M-sentences.txt
tur_news_2005_1M-sentences.txt
tur_newscrawl_2011_300K-sentences.txt
tur_wikipedia_2016_1M-sentences.txt
uig_community_2017-sentences.txt
uig_community_2021-sentences.txt
ukr_mixed_2012_1M-sentences.txt
ukr_newscrawl_2011_1M-sentences.txt
ukr_web_2012_1M-sentences.txt
ukr_wikipedia_2016_3M-sentences.txt
urd_newscrawl_2011_300K-sentences.txt
urd_wikipedia_2016_300K-sentences.txt
uzb_newscrawl_2011_100K-sentences.txt
uzb_wikipedia_2016_100K-sentences.txt
vie_newscrwal_2011_1M-sentences.txt
vie_wikipedia_2016_1M-sentences.txt
vol_wikipedia_2016_100K-sentences.txt
war_wikipedia_2016_300K-sentences.txt
xho_community_2017-sentences.txt
xho_mixed_2016_30K-sentences.txt
yid_wikipedia_2010_30K-sentences.txt
yid_wikipedia_2016_30K-sentences.txt
zho-simp-tw_web_2014_300K-sentences.txt
zho-trad_newscrawl_2011_1M-sentences.txt
zsm_mixed-tufs4_2012_300K-sentences.txt
zsm_web-tufs13_2012_300K-sentences.txt
zsm_wikipedia-tufs16_2016_300K-sentences.txt
zul_mixed_2014_100K-sentences.txt