dc.contributor.author | Mareček, David |
dc.contributor.author | Straka, Milan |
dc.date.accessioned | 2017-01-20T10:45:06Z |
dc.date.available | 2017-01-20T10:45:06Z |
dc.date.issued | 2016-12-22 |
dc.identifier.uri | http://hdl.handle.net/11234/1-1953 |
dc.description | This toolkit comprises tools and supporting scripts for unsupervised induction of dependency trees from raw texts or from texts that already have part-of-speech tags assigned. It also includes scripts for simple machine translation based on unsupervised parsing and scripts for minimally supervised parsing into the Universal Dependencies style. |
dc.language.iso | eng |
dc.publisher | Charles University, Faculty of Mathematics and Physics, Institute of Formal and Applied Linguistics (UFAL) |
dc.rights | GNU General Public Licence, version 3 |
dc.rights.uri | http://opensource.org/licenses/GPL-3.0 |
dc.source.uri | http://ufal.mff.cuni.cz/listr |
dc.subject | parsing |
dc.subject | unsupervised machine learning |
dc.subject | machine translation |
dc.subject | grammar induction |
dc.title | LiStr: Linguistic Structure Induction Toolkit |
dc.type | toolService |
metashare.ResourceInfo#ResourceComponentType#ToolServiceInfo.languageDependent | false |
metashare.ResourceInfo#ContentInfo.detailedType | tool |
dc.rights.label | PUB |
has.files | yes |
branding | LINDAT / CLARIAH-CZ |
contact.person | David Mareček marecek@ufal.mff.cuni.cz Charles University in Prague, UFAL |
sponsor | Czech Science Foundation GAP406/14/06548P Sentence structure induction without annotated corpora nationalFunds |
files.size | 225815 |
files.count | 1 |
Soubory tohoto záznamu
- Název
- listr-16.12.tar.gz
- Velikost
- 220.52 KB
- Formát
- application/x-gzip
- Popis
- LiStr toolkit, version 16.12
- MD5
- 793e1c1866bdc9d5a7668d0b71387430
- scripts
- pos_and_structure.pl11 kB
- delete_punctuation.pl2 kB
- split_on_punctuation.pl805 B
- ngram_reducibility.pl4 kB
- tokenize.pl10 kB
- function_tag_stop.pl4 kB
- merged_trees
- translate_nb.pl2 kB
- extract_dictionary.pl3 kB
- czeng2paratags.pl4 kB
- train_nb.pl3 kB
- extract_short_sentences.pl407 B
- sort_sentences_by_length.pl943 B
- eval.pl2 kB
- get_stop_priors.pl5 kB
- posguess
- knn_classifier.pl3 kB
- get_statistics.pl6 kB
- knn_dictionary.pl3 kB
- gibbs_tagger.pl4 kB
- udpc
- models
- attach.h2 kB
- baseline.cpp2 kB
- attach.cpp9 kB
- stop.cpp9 kB
- model.h2 kB
- model.cpp1 kB
- stop.h2 kB
- baseline.h1 kB
- CHANGES48 B
- Makefile849 B
- README2 kB
- AUTHORS67 B
- common.cpp1 kB
- .objs
- parser.o45 kB
- models
- baseline.dep106 B
- model.o11 kB
- attach.dep114 B
- stop.dep108 B
- stop.o64 kB
- baseline.o26 kB
- model.dep96 B
- attach.o83 kB
- common.o8 kB
- common.dep36 B
- corpus
- corpus.o42 kB
- corpus.dep83 B
- gibbs_sampler
- gibbs_sampler_incremental.o14 kB
- gibbs_sampler_block.o49 kB
- gibbs_sampler_block.dep187 B
- gibbs_sampler.dep271 B
- gibbs_sampler_incremental.dep205 B
- gibbs_sampler.o19 kB
- parser.dep262 B
- utils
- utils.dep60 B
- distribution.dep84 B
- distribution.o6 kB
- options.o12 kB
- options.dep66 B
- utils.o11 kB
- graph
- directed_mst.o25 kB
- directed_mst.dep84 B
- parser.cpp3 kB
- corpus
- corpus.h2 kB
- corpus.cpp8 kB
- gibbs_sampler
- gibbs_sampler.cpp4 kB
- gibbs_sampler_block.cpp10 kB
- gibbs_sampler_incremental.cpp6 kB
- gibbs_sampler.h1 kB
- gibbs_sampler_block.h2 kB
- gibbs_sampler_incremental.h1 kB
- common.h1 kB
- utils
- options.cpp1 kB
- distribution.h1 kB
- options.h887 B
- utils.cpp2 kB
- distribution.cpp1 kB
- utils.h1 kB
- graph
- directed_mst.h1 kB
- directed_mst.cpp3 kB
- COPYING34 kB
- models
- stop_estimates
- eu07.stp3 kB
- el07.stp1 kB
- cs07.stp2 kB
- da06.stp1 kB
- ar07.stp1 kB
- bg06.stp2 kB
- sv06.stp1 kB
- en07.stp2 kB
- hu07.stp2 kB
- es06.stp2 kB
- cs06.stp2 kB
- README318 B
- it07.stp1 kB
- ar06.stp955 B
- ja06.stp3 kB
- tr07.stp1 kB
- ca07.stp2 kB
- de06.stp2 kB
- pt06.stp1 kB
- sl06.stp2 kB
- nl06.stp18 kB
- README4 kB
- COPYING34 kB
- universal_priors
- stop_priors.tsv404 B
- attach_priors.tsv62 B