Files in this item
Download all files in item (598.92 MB)- Name
- ud-treebanks-v2.12.tgz
- Size
- 497.82 MB
- Format
- application/x-gzip
- Description
- Treebank data
- MD5
- afb7546d9591a82f372686bcc100db52
- ud-treebanks-v2.12
- UD_English-PUD
- stats.xml8 kB
- en_pud-ud-test.conllu1 MB
- README.md6 kB
- en_pud-ud-test.txt109 kB
- LICENSE.txt19 kB
- UD_Finnish-PUD
- stats.xml17 kB
- README.txt2 kB
- fi_pud-ud-test.txt119 kB
- LICENSE.txt202 B
- fi_pud-ud-test.conllu1 MB
- UD_Telugu-MTG
- te_mtg-ud-test.txt10 kB
- README.md1 kB
- te_mtg-ud-train.conllu494 kB
- te_mtg-ud-dev.conllu64 kB
- stats.xml3 kB
- te_mtg-ud-test.conllu70 kB
- LICENSE.txt202 B
- te_mtg-ud-dev.txt9 kB
- te_mtg-ud-train.txt72 kB
- UD_Neapolitan-RB
- stats.xml1 kB
- README.md1 kB
- nap_rb-ud-test.conllu431 B
- LICENSE.txt202 B
- nap_rb-ud-test.txt56 B
- UD_Swedish-Talbanken
- sv_talbanken-ud-test.txt122 kB
- README.md7 kB
- sv_talbanken-ud-train.txt402 kB
- stats.xml9 kB
- LICENSE.txt20 kB
- sv_talbanken-ud-train.conllu5 MB
- sv_talbanken-ud-dev.conllu834 kB
- sv_talbanken-ud-test.conllu1 MB
- sv_talbanken-ud-dev.txt58 kB
- UD_Romanian-RRT
- README.md5 kB
- ro_rrt-ud-dev.txt98 kB
- ro_rrt-ud-train.conllu13 MB
- stats.xml12 kB
- LICENSE.txt66 B
- ro_rrt-ud-dev.conllu1 MB
- ro_rrt-ud-test.conllu1 MB
- ro_rrt-ud-train.txt1 MB
- ro_rrt-ud-test.txt94 kB
- UD_Czech-CLTT
- cs_cltt-ud-dev.conllu1 MB
- cs_cltt-ud-test.txt81 kB
- README.md3 kB
- cs_cltt-ud-train.txt96 kB
- cs_cltt-ud-dev.txt76 kB
- stats.xml13 kB
- cs_cltt-ud-train.conllu1 MB
- LICENSE.txt265 B
- cs_cltt-ud-test.conllu1 MB
- UD_Czech-PUD
- stats.xml16 kB
- README.md3 kB
- cs_pud-ud-test.txt114 kB
- LICENSE.txt202 B
- cs_pud-ud-test.conllu2 MB
- UD_Sinhala-STB
- stats.xml14 kB
- README.md1 kB
- LICENSE.txt202 B
- si_stb-ud-test.txt11 kB
- si_stb-ud-test.conllu109 kB
- UD_German-GSD
- README.md9 kB
- de_gsd-ud-dev.conllu882 kB
- de_gsd-ud-dev.txt72 kB
- de_gsd-ud-train.txt1 MB
- de_gsd-ud-test.conllu1 MB
- stats.xml11 kB
- de_gsd-ud-train.conllu18 MB
- LICENSE.txt202 B
- de_gsd-ud-test.txt97 kB
- UD_Zaar-Autogramm
- stats.xml10 kB
- README.md2 kB
- say_autogramm-ud-test.conllu951 kB
- LICENSE.txt202 B
- say_autogramm-ud-test.txt42 kB
- UD_Akuntsu-TuDeT
- stats.xml7 kB
- aqz_tudet-ud-test.conllu89 kB
- README.md3 kB
- aqz_tudet-ud-test.txt6 kB
- LICENSE.txt202 B
- UD_Komi_Permyak-UH
- stats.xml14 kB
- README.md6 kB
- koi_uh-ud-test.conllu107 kB
- LICENSE.txt202 B
- koi_uh-ud-test.txt8 kB
- UD_Pomak-Philotis
- README.md2 kB
- qpm_philotis-ud-train.conllu5 MB
- qpm_philotis-ud-test.txt45 kB
- qpm_philotis-ud-train.txt357 kB
- qpm_philotis-ud-dev.txt45 kB
- qpm_philotis-ud-dev.conllu690 kB
- qpm_philotis-ud-test.conllu695 kB
- stats.xml12 kB
- LICENSE.txt417 B
- UD_Faroese-FarPaHC
- fo_farpahc-ud-dev.conllu465 kB
- fo_farpahc-ud-dev.txt42 kB
- README.md4 kB
- fo_farpahc-ud-test.conllu459 kB
- fo_farpahc-ud-train.txt105 kB
- fo_farpahc-ud-train.conllu1 MB
- stats.xml5 kB
- fo_farpahc-ud-test.txt42 kB
- LICENSE.txt202 B
- UD_Turkish-Penn
- README.md1 kB
- tr_penn-ud-dev.conllu477 kB
- tr_penn-ud-train.conllu11 MB
- tr_penn-ud-test.txt69 kB
- stats.xml13 kB
- LICENSE.txt202 B
- tr_penn-ud-test.conllu682 kB
- tr_penn-ud-dev.txt48 kB
- tr_penn-ud-train.txt1 MB
- UD_Japanese-PUDLUW
- stats.xml4 kB
- README.md5 kB
- ja_pudluw-ud-test.txt138 kB
- LICENSE.txt202 B
- ja_pudluw-ud-test.conllu4 MB
- UD_Chinese-PUD
- stats.xml5 kB
- README.md5 kB
- zh_pud-ud-test.conllu2 MB
- zh_pud-ud-test.txt101 kB
- LICENSE.txt19 kB
- UD_Teko-TuDeT
- stats.xml14 kB
- eme_tudet-ud-test.conllu206 kB
- eme_tudet-ud-test.txt17 kB
- README.md1 kB
- LICENSE.txt202 B
- UD_Latin-UDante
- la_udante-ud-train.conllu2 MB
- README.md10 kB
- la_udante-ud-dev.conllu1 MB
- la_udante-ud-train.txt170 kB
- stats.xml19 kB
- la_udante-ud-test.txt78 kB
- la_udante-ud-dev.txt67 kB
- LICENSE.txt202 B
- la_udante-ud-test.conllu1 MB
- UD_Buryat-BDT
- stats.xml12 kB
- README.txt1 kB
- bxr_bdt-ud-train.txt1 kB
- bxr_bdt-ud-train.conllu11 kB
- LICENSE.txt202 B
- bxr_bdt-ud-test.txt114 kB
- bxr_bdt-ud-test.conllu699 kB
- UD_Italian-MarkIT
- it_markit-ud-dev.txt54 kB
- README.md1 kB
- it_markit-ud-train.txt102 kB
- it_markit-ud-test.txt52 kB
- stats.xml8 kB
- it_markit-ud-train.conllu1 MB
- LICENSE.txt188 B
- it_markit-ud-test.conllu642 kB
- it_markit-ud-dev.conllu649 kB
- UD_Abaza-ATB
- stats.xml17 kB
- abq_atb-ud-test.conllu125 kB
- README.md1 kB
- abq_atb-ud-test.txt9 kB
- LICENSE.txt202 B
- UD_Slovenian-SST
- stats.xml11 kB
- sl_sst-ud-test.txt53 kB
- README.md5 kB
- sl_sst-ud-train.conllu1 MB
- sl_sst-ud-test.conllu988 kB
- LICENSE.txt441 B
- sl_sst-ud-train.txt103 kB
- UD_English-GUMReddit
- README.md24 kB
- en_gumreddit-ud-train.txt23 kB
- en_gumreddit-ud-train.conllu1 MB
- en_gumreddit-ud-dev.conllu171 kB
- get_text.py28 kB
- en_gumreddit-ud-dev.txt3 kB
- stats.xml6 kB
- en_gumreddit-ud-test.txt3 kB
- LICENSE.txt313 B
- en_gumreddit-ud-test.conllu172 kB
- UD_Guarani-OldTuDeT
- stats.xml8 kB
- README.md2 kB
- gn_oldtudet-ud-test.txt1 kB
- LICENSE.txt202 B
- gn_oldtudet-ud-test.conllu18 kB
- UD_Warlpiri-UFAL
- stats.xml6 kB
- README.md870 B
- LICENSE.txt202 B
- wbp_ufal-ud-test.txt2 kB
- wbp_ufal-ud-test.conllu37 kB
- UD_Norwegian-Bokmaal
- README.md7 kB
- no_bokmaal-ud-dev.txt195 kB
- no_bokmaal-ud-train.txt1 MB
- no_bokmaal-ud-test.txt161 kB
- stats.xml9 kB
- no_bokmaal-ud-train.conllu15 MB
- no_bokmaal-ud-test.conllu1 MB
- no_bokmaal-ud-dev.conllu2 MB
- LICENSE.txt68 B
- UD_French-FQB
- stats.xml8 kB
- fr_fqb-ud-test.conllu1 MB
- README.md3 kB
- fr_fqb-ud-test.txt117 kB
- LICENSE.txt14 kB
- UD_South_Levantine_Arabic-MADAR
- stats.xml4 kB
- README.md2 kB
- ajp_madar-ud-test.conllu42 kB
- ajp_madar-ud-test.txt5 kB
- LICENSE.txt202 B
- UD_Chinese-GSDSimp
- zh_gsdsimp-ud-test.txt53 kB
- README.md2 kB
- zh_gsdsimp-ud-dev.conllu1 MB
- zh_gsdsimp-ud-train.txt433 kB
- zh_gsdsimp-ud-train.conllu8 MB
- stats.xml5 kB
- LICENSE.txt202 B
- zh_gsdsimp-ud-dev.txt55 kB
- zh_gsdsimp-ud-test.conllu1 MB
- UD_Galician-CTG
- gl_ctg-ud-dev.conllu1 MB
- README.md2 kB
- gl_ctg-ud-test.conllu1 MB
- gl_ctg-ud-dev.txt155 kB
- gl_ctg-ud-train.conllu4 MB
- gl_ctg-ud-test.txt156 kB
- stats.xml4 kB
- gl_ctg-ud-train.txt413 kB
- LICENSE.txt173 B
- UD_Slovenian-SSJ
- sl_ssj-ud-dev.conllu1 MB
- README.md5 kB
- sl_ssj-ud-train.txt1 MB
- sl_ssj-ud-test.conllu1 MB
- sl_ssj-ud-train.conllu15 MB
- sl_ssj-ud-dev.txt147 kB
- stats.xml12 kB
- LICENSE.txt222 B
- sl_ssj-ud-test.txt141 kB
- UD_French-PUD
- fr_pud-ud-test.txt130 kB
- stats.xml8 kB
- fr_pud-ud-test.conllu1 MB
- README.md5 kB
- LICENSE.txt19 kB
- UD_English-GUM
- en_gum-ud-test.txt99 kB
- README.md24 kB
- en_gum-ud-dev.txt94 kB
- en_gum-ud-train.conllu12 MB
- en_gum-ud-dev.conllu1 MB
- stats.xml10 kB
- en_gum-ud-test.conllu1 MB
- en_gum-ud-train.txt716 kB
- LICENSE.txt1 kB
- UD_Moksha-JR
- stats.xml26 kB
- README.md6 kB
- LICENSE.txt202 B
- mdf_jr-ud-test.txt42 kB
- mdf_jr-ud-test.conllu466 kB
- UD_Munduruku-TuDeT
- stats.xml8 kB
- README.md2 kB
- myu_tudet-ud-test.conllu73 kB
- LICENSE.txt202 B
- myu_tudet-ud-test.txt5 kB
- UD_Indonesian-GSD
- README.md6 kB
- id_gsd-ud-test.txt69 kB
- id_gsd-ud-dev.conllu969 kB
- id_gsd-ud-train.conllu7 MB
- stats.xml8 kB
- LICENSE.txt202 B
- id_gsd-ud-test.conllu903 kB
- id_gsd-ud-dev.txt73 kB
- id_gsd-ud-train.txt573 kB
- UD_Kyrgyz-KTMU
- stats.xml14 kB
- README.md1 kB
- ky_ktmu-ud-train.conllu62 kB
- LICENSE.txt202 B
- ky_ktmu-ud-train.txt8 kB
- ky_ktmu-ud-test.conllu594 kB
- ky_ktmu-ud-test.txt78 kB
- UD_French-ParTUT
- README.md5 kB
- fr_partut-ud-dev.conllu117 kB
- fr_partut-ud-train.conllu1 MB
- fr_partut-ud-test.txt14 kB
- fr_partut-ud-train.txt128 kB
- stats.xml8 kB
- LICENSE.txt18 kB
- fr_partut-ud-test.conllu165 kB
- fr_partut-ud-dev.txt9 kB
- UD_Turkish-Tourism
- tr_tourism-ud-test.conllu715 kB
- README.md1 kB
- tr_tourism-ud-dev.conllu747 kB
- tr_tourism-ud-train.conllu5 MB
- stats.xml13 kB
- tr_tourism-ud-train.txt477 kB
- LICENSE.txt202 B
- tr_tourism-ud-dev.txt69 kB
- tr_tourism-ud-test.txt67 kB
- UD_Spanish-GSD
- README.md5 kB
- es_gsd-ud-test.conllu716 kB
- es_gsd-ud-train.conllu22 MB
- es_gsd-ud-test.txt61 kB
- es_gsd-ud-train.txt1 MB
- es_gsd-ud-dev.conllu2 MB
- es_gsd-ud-dev.txt191 kB
- stats.xml11 kB
- LICENSE.txt202 B
- UD_Ancient_Greek-Perseus
- README.md4 kB
- grc_perseus-ud-dev.txt250 kB
- grc_perseus-ud-test.conllu1 MB
- grc_perseus-ud-test.txt231 kB
- grc_perseus-ud-train.txt1 MB
- stats.xml10 kB
- grc_perseus-ud-train.conllu14 MB
- LICENSE.txt279 B
- grc_perseus-ud-dev.conllu1 MB
- UD_Mbya_Guarani-Thomas
- stats.xml8 kB
- README.md3 kB
- gun_thomas-ud-test.txt7 kB
- LICENSE.txt202 B
- gun_thomas-ud-test.conllu90 kB
- UD_Tagalog-Ugnayan
- stats.xml3 kB
- README.md1 kB
- tl_ugnayan-ud-test.txt5 kB
- tl_ugnayan-ud-test.conllu53 kB
- LICENSE.txt219 B
- UD_Italian-TWITTIRO
- README.md3 kB
- it_twittiro-ud-test.conllu184 kB
- it_twittiro-ud-test.txt15 kB
- it_twittiro-ud-train.conllu1 MB
- it_twittiro-ud-train.txt120 kB
- stats.xml9 kB
- it_twittiro-ud-dev.txt15 kB
- it_twittiro-ud-dev.conllu188 kB
- LICENSE.txt202 B
- UD_Skolt_Sami-Giellagas
- stats.xml12 kB
- sms_giellagas-ud-test.conllu233 kB
- sms_giellagas-ud-test.txt17 kB
- README.md4 kB
- LICENSE.txt202 B
- UD_English-Atis
- en_atis-ud-test.conllu342 kB
- README.md1 kB
- en_atis-ud-train.conllu2 MB
- en_atis-ud-test.txt36 kB
- en_atis-ud-train.txt271 kB
- en_atis-ud-dev.txt36 kB
- stats.xml6 kB
- LICENSE.txt202 B
- en_atis-ud-dev.conllu341 kB
- UD_Polish-LFG
- pl_lfg-ud-dev.txt74 kB
- pl_lfg-ud-train.txt596 kB
- README.md6 kB
- pl_lfg-ud-test.txt74 kB
- pl_lfg-ud-dev.conllu1 MB
- pl_lfg-ud-test.conllu1 MB
- stats.xml14 kB
- LICENSE.txt34 kB
- pl_lfg-ud-train.conllu11 MB
- UD_Russian-GSD
- ru_gsd-ud-dev.conllu1 MB
- README.md1 kB
- ru_gsd-ud-test.conllu1003 kB
- ru_gsd-ud-dev.txt123 kB
- ru_gsd-ud-train.txt794 kB
- ru_gsd-ud-test.txt120 kB
- stats.xml13 kB
- LICENSE.txt202 B
- ru_gsd-ud-train.conllu6 MB
- UD_Classical_Chinese-Kyoto
- lzh_kyoto-ud-train.conllu34 MB
- README.md4 kB
- lzh_kyoto-ud-test.conllu2 MB
- lzh_kyoto-ud-train.txt1 MB
- lzh_kyoto-ud-dev.txt97 kB
- lzh_kyoto-ud-dev.conllu2 MB
- stats.xml7 kB
- lzh_kyoto-ud-test.txt84 kB
- LICENSE.txt202 B
- UD_Estonian-EWT
- et_ewt-ud-train.txt379 kB
- README.md4 kB
- et_ewt-ud-dev.txt54 kB
- et_ewt-ud-dev.conllu698 kB
- et_ewt-ud-test.conllu926 kB
- et_ewt-ud-test.txt76 kB
- et_ewt-ud-train.conllu4 MB
- stats.xml13 kB
- LICENSE.txt202 B
- UD_Chinese-PatentChar
- stats.xml2 kB
- README.md1009 B
- zh_patentchar-ud-test.txt11 kB
- LICENSE.txt202 B
- zh_patentchar-ud-test.conllu115 kB
- UD_Yakut-YKTDT
- stats.xml10 kB
- README.md2 kB
- sah_yktdt-ud-test.txt15 kB
- LICENSE.txt202 B
- sah_yktdt-ud-test.conllu148 kB
- UD_Indonesian-CSUI
- stats.xml7 kB
- README.md3 kB
- id_csui-ud-test.txt59 kB
- id_csui-ud-train.txt108 kB
- LICENSE.txt202 B
- id_csui-ud-test.conllu589 kB
- id_csui-ud-train.conllu1 MB
- UD_Portuguese-PetroGold
- README.md3 kB
- pt_petrogold-ud-test.txt154 kB
- pt_petrogold-ud-dev.conllu1 MB
- pt_petrogold-ud-train.conllu12 MB
- stats.xml9 kB
- pt_petrogold-ud-dev.txt115 kB
- LICENSE.txt202 B
- pt_petrogold-ud-train.txt1 MB
- pt_petrogold-ud-test.conllu1 MB
- UD_Lithuanian-ALKSNIS
- lt_alksnis-ud-train.txt317 kB
- README.md4 kB
- lt_alksnis-ud-test.conllu1 MB
- lt_alksnis-ud-train.conllu4 MB
- lt_alksnis-ud-test.txt69 kB
- lt_alksnis-ud-dev.conllu1 MB
- stats.xml13 kB
- LICENSE.txt202 B
- lt_alksnis-ud-dev.txt78 kB
- UD_Dutch-Alpino
- nl_alpino-ud-test.conllu901 kB
- nl_alpino-ud-train.conllu14 MB
- nl_alpino-ud-train.txt1016 kB
- nl_alpino-ud-dev.conllu942 kB
- nl_alpino-ud-dev.txt62 kB
- stats.xml7 kB
- LICENSE.txt19 kB
- README.txt5 kB
- nl_alpino-ud-test.txt64 kB
- UD_Apurina-UFPA
- stats.xml9 kB
- README.md3 kB
- LICENSE.txt202 B
- apu_ufpa-ud-test.conllu115 kB
- apu_ufpa-ud-test.txt5 kB
- UD_Livvi-KKPP
- stats.xml10 kB
- olo_kkpp-ud-train.txt808 B
- README.md4 kB
- olo_kkpp-ud-test.txt9 kB
- olo_kkpp-ud-test.conllu103 kB
- LICENSE.txt202 B
- olo_kkpp-ud-train.conllu15 kB
- UD_German-PUD
- stats.xml10 kB
- README.md5 kB
- LICENSE.txt19 kB
- de_pud-ud-test.txt126 kB
- de_pud-ud-test.conllu1 MB
- UD_Western_Armenian-ArmTDP
- README.md3 kB
- hyw_armtdp-ud-test.txt141 kB
- hyw_armtdp-ud-train.txt1006 kB
- hyw_armtdp-ud-dev.txt133 kB
- hyw_armtdp-ud-test.conllu1 MB
- hyw_armtdp-ud-dev.conllu1 MB
- stats.xml24 kB
- LICENSE.txt202 B
- hyw_armtdp-ud-train.conllu12 MB
- UD_Urdu-UDTB
- README.md2 kB
- ur_udtb-ud-train.txt853 kB
- ur_udtb-ud-test.txt117 kB
- ur_udtb-ud-train.conllu11 MB
- ur_udtb-ud-test.conllu1 MB
- stats.xml11 kB
- ur_udtb-ud-dev.txt115 kB
- LICENSE.txt247 B
- ur_udtb-ud-dev.conllu1 MB
- UD_Akkadian-PISANDUB
- stats.xml3 kB
- README.md871 B
- akk_pisandub-ud-test.txt15 kB
- LICENSE.txt202 B
- akk_pisandub-ud-test.conllu99 kB
- UD_Galician-TreeGal
- stats.xml9 kB
- README.md5 kB
- gl_treegal-ud-test.txt50 kB
- gl_treegal-ud-train.conllu1 MB
- LICENSE.txt14 kB
- gl_treegal-ud-train.txt76 kB
- gl_treegal-ud-test.conllu670 kB
- UD_Old_Turkish-Tonqq
- stats.xml2 kB
- otk_tonqq-ud-test.txt1 kB
- README.md1 kB
- otk_tonqq-ud-test.conllu10 kB
- LICENSE.txt6 kB
- UD_Gheg-GPS
- stats.xml8 kB
- README.md2 kB
- aln_gps-ud-test.txt71 kB
- LICENSE.txt202 B
- aln_gps-ud-test.conllu984 kB
- UD_Czech-FicTree
- README.md3 kB
- cs_fictree-ud-test.conllu1 MB
- cs_fictree-ud-test.txt86 kB
- cs_fictree-ud-train.conllu13 MB
- cs_fictree-ud-dev.txt86 kB
- stats.xml15 kB
- cs_fictree-ud-dev.conllu1 MB
- LICENSE.txt219 B
- cs_fictree-ud-train.txt696 kB
- UD_Italian-PoSTWITA
- it_postwita-ud-test.conllu759 kB
- it_postwita-ud-train.txt526 kB
- README.md4 kB
- it_postwita-ud-dev.conllu732 kB
- it_postwita-ud-train.conllu5 MB
- stats.xml9 kB
- LICENSE.txt18 kB
- it_postwita-ud-dev.txt64 kB
- it_postwita-ud-test.txt67 kB
- UD_Low_Saxon-LSDC
- stats.xml10 kB
- README.md4 kB
- nds_lsdc-ud-test.conllu236 kB
- LICENSE.txt202 B
- nds_lsdc-ud-test.txt13 kB
- UD_Hebrew-IAHLTwiki
- README.md2 kB
- he_iahltwiki-ud-train.conllu8 MB
- he_iahltwiki-ud-dev.txt60 kB
- he_iahltwiki-ud-dev.conllu713 kB
- he_iahltwiki-ud-test.conllu810 kB
- he_iahltwiki-ud-train.txt762 kB
- stats.xml12 kB
- he_iahltwiki-ud-test.txt68 kB
- LICENSE.txt202 B
- UD_Polish-PDB
- pl_pdb-ud-train.txt1 MB
- README.md5 kB
- pl_pdb-ud-dev.conllu3 MB
- pl_pdb-ud-test.txt203 kB
- pl_pdb-ud-train.conllu27 MB
- pl_pdb-ud-dev.txt210 kB
- stats.xml17 kB
- LICENSE.txt384 B
- pl_pdb-ud-test.conllu3 MB
- UD_Croatian-SET
- hr_set-ud-dev.conllu1 MB
- README.md5 kB
- hr_set-ud-dev.txt130 kB
- hr_set-ud-train.conllu11 MB
- hr_set-ud-train.txt901 kB
- stats.xml11 kB
- hr_set-ud-test.txt143 kB
- LICENSE.txt233 B
- hr_set-ud-test.conllu1 MB
- UD_North_Sami-Giella
- stats.xml10 kB
- README.md2 kB
- sme_giella-ud-train.conllu1 MB
- sme_giella-ud-train.txt107 kB
- LICENSE.txt202 B
- sme_giella-ud-test.conllu668 kB
- sme_giella-ud-test.txt70 kB
- UD_Old_Irish-DipWBG
- stats.xml8 kB
- README.md2 kB
- sga_dipwbg-ud-test.txt1 kB
- LICENSE.txt202 B
- sga_dipwbg-ud-test.conllu31 kB
- UD_Khunsari-AHA
- stats.xml4 kB
- README.md1 kB
- kfm_aha-ud-test.conllu6 kB
- kfm_aha-ud-test.txt542 B
- LICENSE.txt202 B
- UD_Xibe-XDT
- stats.xml16 kB
- sjo_xdt-ud-test.txt217 kB
- README.md1 kB
- LICENSE.txt202 B
- sjo_xdt-ud-test.conllu1 MB
- UD_Maltese-MUDT
- mt_mudt-ud-dev.txt55 kB
- README.md6 kB
- mt_mudt-ud-train.conllu1020 kB
- mt_mudt-ud-test.txt59 kB
- mt_mudt-ud-dev.conllu454 kB
- stats.xml3 kB
- LICENSE.txt202 B
- mt_mudt-ud-train.txt123 kB
- mt_mudt-ud-test.conllu489 kB
- UD_Persian-Seraji
- fa_seraji-ud-dev.conllu1 MB
- README.md5 kB
- fa_seraji-ud-test.txt134 kB
- fa_seraji-ud-train.conllu11 MB
- fa_seraji-ud-test.conllu1 MB
- stats.xml9 kB
- fa_seraji-ud-train.txt995 kB
- LICENSE.txt110 B
- fa_seraji-ud-dev.txt133 kB
- UD_Indonesian-PUD
- stats.xml8 kB
- README.md8 kB
- id_pud-ud-test.txt117 kB
- LICENSE.txt19 kB
- id_pud-ud-test.conllu1 MB
- UD_Belarusian-HSE
- be_hse-ud-test.txt180 kB
- README.md7 kB
- be_hse-ud-train.txt2 MB
- be_hse-ud-dev.conllu1 MB
- be_hse-ud-train.conllu27 MB
- be_hse-ud-test.conllu1 MB
- stats.xml17 kB
- LICENSE.txt1021 B
- be_hse-ud-dev.txt164 kB
- UD_Turkish-BOUN
- stats.xml14 kB
- README.md4 kB
- tr_boun-ud-train.conllu7 MB
- tr_boun-ud-dev.txt81 kB
- LICENSE.txt202 B
- tr_boun-ud-train.txt660 kB
- tr_boun-ud-test.conllu933 kB
- UD_Norwegian-Nynorsk
- no_nynorsk-ud-dev.conllu1 MB
- README.md5 kB
- no_nynorsk-ud-test.txt135 kB
- no_nynorsk-ud-dev.txt166 kB
- stats.xml8 kB
- no_nynorsk-ud-test.conllu1 MB
- LICENSE.txt68 B
- no_nynorsk-ud-train.txt1 MB
- no_nynorsk-ud-train.conllu14 MB
- UD_Guajajara-TuDeT
- stats.xml13 kB
- README.md3 kB
- gub_tudet-ud-test.txt47 kB
- gub_tudet-ud-test.conllu705 kB
- LICENSE.txt202 B
- UD_Ligurian-GLT
- stats.xml8 kB
- lij_glt-ud-test.conllu411 kB
- lij_glt-ud-train.txt918 B
- README.md1 kB
- lij_glt-ud-train.conllu14 kB
- LICENSE.txt3 kB
- lij_glt-ud-test.txt27 kB
- UD_Romanian-SiMoNERo
- ro_simonero-ud-test.conllu1 MB
- README.md2 kB
- ro_simonero-ud-dev.conllu1 MB
- ro_simonero-ud-test.txt93 kB
- ro_simonero-ud-train.txt719 kB
- ro_simonero-ud-dev.txt91 kB
- stats.xml11 kB
- ro_simonero-ud-train.conllu9 MB
- LICENSE.txt202 B
- UD_Spanish-PUD
- stats.xml9 kB
- es_pud-ud-test.conllu1 MB
- README.md6 kB
- LICENSE.txt19 kB
- es_pud-ud-test.txt123 kB
- UD_Cebuano-GJA
- ceb_gja-ud-test.conllu99 kB
- stats.xml7 kB
- README.md1 kB
- LICENSE.txt202 B
- ceb_gja-ud-test.txt5 kB
- UD_Serbian-SET
- sr_set-ud-test.txt67 kB
- README.md1 kB
- sr_set-ud-train.conllu5 MB
- sr_set-ud-dev.txt68 kB
- stats.xml11 kB
- sr_set-ud-test.conllu847 kB
- sr_set-ud-train.txt432 kB
- LICENSE.txt230 B
- sr_set-ud-dev.conllu888 kB
- UD_Tatar-NMCTT
- stats.xml12 kB
- README.md1 kB
- tt_nmctt-ud-test.txt26 kB
- LICENSE.txt202 B
- tt_nmctt-ud-test.conllu220 kB
- UD_Hittite-HitTB
- stats.xml9 kB
- README.md1 kB
- hit_hittb-ud-test.conllu115 kB
- LICENSE.txt202 B
- hit_hittb-ud-test.txt10 kB
- UD_Chinese-HK
- stats.xml4 kB
- README.md4 kB
- LICENSE.txt202 B
- zh_hk-ud-test.conllu872 kB
- zh_hk-ud-test.txt41 kB
- UD_Marathi-UFAL
- README.md1 kB
- mr_ufal-ud-train.conllu385 kB
- mr_ufal-ud-test.txt4 kB
- mr_ufal-ud-dev.conllu56 kB
- mr_ufal-ud-dev.txt4 kB
- mr_ufal-ud-train.txt33 kB
- stats.xml14 kB
- mr_ufal-ud-test.conllu51 kB
- LICENSE.txt202 B
- UD_Maghrebi_Arabic_French-Arabizi
- qaf_arabizi-ud-dev.conllu222 kB
- README.md3 kB
- qaf_arabizi-ud-train.txt81 kB
- qaf_arabizi-ud-test.conllu220 kB
- qaf_arabizi-ud-dev.txt11 kB
- qaf_arabizi-ud-train.conllu1 MB
- stats.xml6 kB
- LICENSE.txt202 B
- qaf_arabizi-ud-test.txt11 kB
- UD_Afrikaans-AfriBooms
- af_afribooms-ud-test.conllu618 kB
- af_afribooms-ud-train.conllu2 MB
- af_afribooms-ud-test.txt57 kB
- stats.xml8 kB
- LICENSE.txt202 B
- README.txt1 kB
- af_afribooms-ud-dev.txt30 kB
- af_afribooms-ud-dev.conllu321 kB
- af_afribooms-ud-train.txt195 kB
- UD_Czech-CAC
- cs_cac-ud-test.conllu1 MB
- cs_cac-ud-test.txt71 kB
- README.md6 kB
- cs_cac-ud-train.conllu51 MB
- cs_cac-ud-dev.txt72 kB
- cs_cac-ud-train.txt2 MB
- stats.xml19 kB
- LICENSE.txt265 B
- cs_cac-ud-dev.conllu1 MB
- UD_Arabic-PADT
- README.md6 kB
- ar_padt-ud-dev.conllu5 MB
- ar_padt-ud-train.conllu38 MB
- ar_padt-ud-train.txt1 MB
- ar_padt-ud-test.txt234 kB
- ar_padt-ud-test.conllu4 MB
- stats.xml11 kB
- ar_padt-ud-dev.txt241 kB
- LICENSE.txt19 kB
- UD_English-Pronouns
- stats.xml5 kB
- en_pronouns-ud-test.conllu138 kB
- README.md9 kB
- LICENSE.txt202 B
- en_pronouns-ud-test.txt7 kB
- UD_Upper_Sorbian-UFAL
- stats.xml11 kB
- hsb_ufal-ud-test.conllu730 kB
- README.md1 kB
- hsb_ufal-ud-train.conllu31 kB
- hsb_ufal-ud-test.txt64 kB
- LICENSE.txt202 B
- hsb_ufal-ud-train.txt2 kB
- UD_Czech-PDT
- cs_pdt-ud-train.conllu144 MB
- README.md12 kB
- cs_pdt-ud-test.conllu21 MB
- cs_pdt-ud-test.txt1 MB
- cs_pdt-ud-dev.txt989 kB
- cs_pdt-ud-dev.conllu19 MB
- stats.xml18 kB
- LICENSE.txt311 B
- cs_pdt-ud-train.txt7 MB
- UD_Bororo-BDT
- stats.xml8 kB
- README.md2 kB
- LICENSE.txt202 B
- bor_bdt-ud-test.conllu63 kB
- bor_bdt-ud-test.txt4 kB
- UD_Swedish_Sign_Language-SSLC
- stats.xml2 kB
- swl_sslc-ud-test.txt15 kB
- README.md1 kB
- LICENSE.txt19 kB
- swl_sslc-ud-test.conllu79 kB
- UD_Chinese-GSD
- README.md2 kB
- zh_gsd-ud-test.conllu1 MB
- zh_gsd-ud-train.conllu8 MB
- zh_gsd-ud-train.txt433 kB
- zh_gsd-ud-dev.txt55 kB
- zh_gsd-ud-dev.conllu1 MB
- stats.xml5 kB
- LICENSE.txt202 B
- zh_gsd-ud-test.txt53 kB
- UD_Xavante-XDT
- stats.xml6 kB
- xav_xdt-ud-test.txt8 kB
- README.md1 kB
- xav_xdt-ud-test.conllu119 kB
- LICENSE.txt202 B
- UD_Arabic-PUD
- stats.xml9 kB
- README.md5 kB
- ar_pud-ud-test.txt168 kB
- LICENSE.txt19 kB
- ar_pud-ud-test.conllu2 MB
- UD_Russian-PUD
- stats.xml12 kB
- README.md5 kB
- LICENSE.txt19 kB
- ru_pud-ud-test.txt209 kB
- ru_pud-ud-test.conllu1 MB
- UD_Erzya-JR
- stats.xml31 kB
- myv_jr-ud-test.txt107 kB
- README.txt6 kB
- myv_jr-ud-test.conllu1 MB
- LICENSE.txt202 B
- myv_jr-ud-train.txt102 kB
- myv_jr-ud-train.conllu1 MB
- UD_French-GSD
- fr_gsd-ud-train.conllu21 MB
- README.md7 kB
- fr_gsd-ud-dev.conllu2 MB
- fr_gsd-ud-dev.txt184 kB
- stats.xml10 kB
- fr_gsd-ud-test.conllu636 kB
- LICENSE.txt202 B
- fr_gsd-ud-test.txt49 kB
- fr_gsd-ud-train.txt1 MB
- UD_Assyrian-AS
- stats.xml7 kB
- aii_as-ud-test.conllu31 kB
- README.md1 kB
- aii_as-ud-test.txt4 kB
- LICENSE.txt202 B
- UD_Chukchi-HSE
- stats.xml3 kB
- README.md4 kB
- ckt_hse-ud-test.txt72 kB
- LICENSE.txt202 B
- ckt_hse-ud-test.conllu793 kB
- UD_Albanian-TSA
- stats.xml8 kB
- sq_tsa-ud-test.conllu61 kB
- README.md1 kB
- sq_tsa-ud-test.txt5 kB
- LICENSE.txt202 B
- UD_Javanese-CSUI
- stats.xml7 kB
- jv_csui-ud-test.txt77 kB
- README.md3 kB
- LICENSE.txt202 B
- jv_csui-ud-test.conllu936 kB
- UD_Old_East_Slavic-RNC
- README.md20 kB
- orv_rnc-ud-dev.txt87 kB
- orv_rnc-ud-dev.conllu945 kB
- orv_rnc-ud-test.conllu1 MB
- stats.xml17 kB
- orv_rnc-ud-train.txt175 kB
- LICENSE.txt202 B
- orv_rnc-ud-test.txt183 kB
- orv_rnc-ud-train.conllu1 MB
- UD_Old_Irish-DipSGG
- stats.xml8 kB
- README.md3 kB
- sga_dipsgg-ud-test.txt2 kB
- LICENSE.txt15 B
- sga_dipsgg-ud-test.conllu34 kB
- UD_Latin-LLCT
- la_llct-ud-dev.conllu2 MB
- README.md9 kB
- la_llct-ud-test.conllu2 MB
- la_llct-ud-train.conllu17 MB
- stats.xml13 kB
- la_llct-ud-dev.txt136 kB
- LICENSE.txt202 B
- la_llct-ud-test.txt136 kB
- la_llct-ud-train.txt1 MB
- UD_Japanese-BCCWJ
- ja_bccwj-ud-train.txt902 kB
- ja_bccwj-ud-train.conllu67 MB
- ja_bccwj-ud-dev.txt177 kB
- ja_bccwj-ud-test.conllu12 MB
- merge
- test_pos.pkl2 MB
- dev_pos.pkl2 MB
- script
- lib.py5 kB
- restore_word_unit_bccwj.py7 kB
- convert_core_bccwj_pkl.py746 B
- misc_mapping.pkl23 MB
- merge.sh1 kB
- train_pos.pkl13 MB
- stats.xml3 kB
- LICENSE.txt18 kB
- README.txt3 kB
- ja_bccwj-ud-test.txt165 kB
- ja_bccwj-ud-dev.conllu13 MB
- UD_Latin-ITTB
- la_ittb-ud-train.txt2 MB
- README.md11 kB
- la_ittb-ud-dev.txt168 kB
- la_ittb-ud-test.conllu2 MB
- la_ittb-ud-dev.conllu2 MB
- stats.xml17 kB
- LICENSE.txt19 kB
- la_ittb-ud-test.txt169 kB
- la_ittb-ud-train.conllu37 MB
- UD_Italian-ParlaMint
- stats.xml8 kB
- it_parlamint-ud-train.txt52 kB
- README.md2 kB
- it_parlamint-ud-train.conllu640 kB
- LICENSE.txt202 B
- it_parlamint-ud-test.conllu669 kB
- it_parlamint-ud-test.txt55 kB
- UD_Armenian-ArmTDP
- README.md4 kB
- hy_armtdp-ud-train.conllu5 MB
- hy_armtdp-ud-dev.conllu694 kB
- hy_armtdp-ud-dev.txt57 kB
- hy_armtdp-ud-test.txt51 kB
- hy_armtdp-ud-train.txt434 kB
- stats.xml24 kB
- hy_armtdp-ud-test.conllu656 kB
- LICENSE.txt202 B
- UD_Vietnamese-VTB
- README.md1 kB
- vi_vtb-ud-test.txt71 kB
- vi_vtb-ud-train.txt129 kB
- vi_vtb-ud-train.conllu924 kB
- vi_vtb-ud-dev.txt168 kB
- stats.xml6 kB
- LICENSE.txt19 kB
- vi_vtb-ud-test.conllu526 kB
- vi_vtb-ud-dev.conllu1 MB
- UD_Western_Sierra_Puebla_Nahuatl-ITML
- stats.xml12 kB
- nhi_itml-ud-test.txt51 kB
- README.md1 kB
- nhi_itml-ud-test.conllu1 MB
- LICENSE.txt202 B
- UD_Icelandic-IcePaHC
- is_icepahc-ud-dev.conllu11 MB
- is_icepahc-ud-test.txt738 kB
- README.md6 kB
- is_icepahc-ud-dev.txt735 kB
- is_icepahc-ud-train.conllu58 MB
- stats.xml11 kB
- LICENSE.txt202 B
- is_icepahc-ud-train.txt3 MB
- is_icepahc-ud-test.conllu11 MB
- UD_English-PUD
- ... too many files ...0 B
- Name
- ud-documentation-v2.12.tgz
- Size
- 100.29 MB
- Format
- application/x-gzip
- Description
- Documentation
- MD5
- 1b50998eb8c68d18934ccb86bbedf9b7
- ud-documentation-v2.12
- markdown-source
- _tl
- _jaa
- index.md10 kB
- feat
- Nmzr.md639 B
- Intension.md625 B
- Backgrounding.md780 B
- Aspect.md800 B
- Dist.md636 B
- OC.md639 B
- Cfm.md2 kB
- Voice.md618 B
- Away.md609 B
- Comt.md618 B
- Ch.md631 B
- Report.md616 B
- SecV.md636 B
- Middle.md615 B
- Sp.md611 B
- Tense.md721 B
- Rep.md736 B
- Polarity.md645 B
- Out.md606 B
- Mood.md1 kB
- Down.md610 B
- Poss.md621 B
- AC.md645 B
- Back.md609 B
- Decl.md716 B
- Red.md620 B
- Nom.md638 B
- Up.md603 B
- Coming.md615 B
- Cq.md632 B
- NCount.md663 B
- Evident.md929 B
- TenseEvid.md2 kB
- St.md614 B
- Redup.md632 B
- tokenization.md96 B
- _zh
- index.md8 kB
- syntax.md2 kB
- tokenization.md2 kB
- morphology.md2 kB
- feat
- PartType.md569 B
- dep-index.md372 B
- pos
- PRON.md3 kB
- VERB.md921 B
- ADV.md3 kB
- NUM.md921 B
- CCONJ.md743 B
- ADJ.md1 kB
- SCONJ.md1 kB
- SYM.md846 B
- DET.md2 kB
- NOUN.md1 kB
- PROPN.md975 B
- INTJ.md1 kB
- AUX_.md1 kB
- ADP.md2 kB
- PUNCT.md495 B
- X.md786 B
- PART.md2 kB
- dep
- nsubj.md717 B
- advcl.md3 kB
- obj.md3 kB
- vocative.md1 kB
- discourse-sp.md2 kB
- mark-prt.md3 kB
- obl-patient.md1001 B
- mark.md2 kB
- xcomp.md7 kB
- flat.md2 kB
- compound.md2 kB
- csubj.md1003 B
- reparandum.md1 kB
- dislocated-vo.md1 kB
- amod.md1 kB
- nmod.md2 kB
- nummod.md1 kB
- iobj.md1 kB
- nsubj-pass.md599 B
- acl.md3 kB
- case.md3 kB
- mark-rel.md2 kB
- punct.md4 kB
- advmod.md4 kB
- aux-pass.md1 kB
- obj-periph.md899 B
- case-loc.md1 kB
- clf.md4 kB
- ccomp.md7 kB
- parataxis.md4 kB
- goeswith.md1 kB
- appos.md2 kB
- compound-dir.md5 kB
- advmod-df.md2 kB
- cc.md1 kB
- csubj-pass.md868 B
- det.md1 kB
- obl-tmod.md2 kB
- discourse.md1 kB
- list.md2 kB
- obl-agent.md1 kB
- cop.md1 kB
- compound-ext.md4 kB
- compound-vv.md4 kB
- orphan.md4 kB
- aux_.md3 kB
- obl.md3 kB
- root.md2 kB
- dislocated.md4 kB
- compound-vo.md3 kB
- mark-adv.md636 B
- conj.md6 kB
- pos-index.md143 B
- _ta
- index.md3 kB
- dep
- nsubj-nc.md497 B
- obl-cmpr.md2 kB
- aux-neg.md1 kB
- obl-inst.md681 B
- advcl-cond.md1 kB
- obl-pmod.md351 B
- _as
- template-index.md1 kB
- _am
- index.md5 kB
- feat
- Voice.md3 kB
- Case.md3 kB
- _qpm
- index.md9 kB
- readme.md2 kB
- license.md402 B
- feat
- Definite.md2 kB
- Aspect.md2 kB
- Number.md2 kB
- Abbr.md1 kB
- Reflex.md2 kB
- Voice.md1 kB
- Foreign.md1 kB
- Degree.md5 kB
- Tense.md4 kB
- Gender.md2 kB
- Polarity.md2 kB
- VerbForm.md5 kB
- Mood.md2 kB
- Poss.md1 kB
- Person.md1 kB
- PronType.md5 kB
- NumType.md2 kB
- PartTypeQpm.md1 kB
- Animacy.md2 kB
- DeixisRef.md1 kB
- Case.md3 kB
- Variant.md881 B
- Number-psor.md895 B
- Deixis.md1 kB
- dep
- obj.md1 kB
- advcl.md616 B
- nsubj.md708 B
- vocative.md611 B
- xcomp.md1 kB
- compound.md508 B
- csubj.md452 B
- reparandum.md637 B
- amod.md942 B
- nmod.md633 B
- nummod.md568 B
- iobj.md513 B
- acl-relcl.md1 kB
- nmod-tmod.md831 B
- acl.md1 kB
- case.md838 B
- punct.md1 kB
- advmod.md1 kB
- aux-pass.md557 B
- ccomp.md1 kB
- parataxis.md2 kB
- nusbj-pass.md444 B
- obl-arg.md620 B
- appos.md1 kB
- cc.md1 kB
- obl-lmod.md402 B
- csubj-pass.md486 B
- fixed.md9 kB
- obl-tmod.md465 B
- compound-redup.md912 B
- obl-agent.md637 B
- advmod-emph.md1 kB
- orphan.md704 B
- aux_.md1 kB
- obl.md1 kB
- root.md889 B
- aux-q.md569 B
- conj.md1 kB
- pos
- PRON.md1 kB
- ADV.md5 kB
- VERB.md3 kB
- NUM.md1 kB
- CCONJ.md1 kB
- ADJ.md4 kB
- SCONJ.md1 kB
- DET.md8 kB
- NOUN.md910 B
- PROPN.md1 kB
- INTJ.md921 B
- ADP.md1 kB
- AUX_.md4 kB
- X.md1 kB
- PART.md3 kB
- contributors.md1 kB
- ext-format.md11 kB
- _bxr
- index.md4 kB
- dep
- advmod-neg.md565 B
- _sl
- index.md6 kB
- feat
- Definite.md1 kB
- Aspect.md1 kB
- Number.md1 kB
- Abbr.md521 B
- Gender-psor.md1 kB
- Reflex.md1 kB
- Foreign.md861 B
- Degree.md1 kB
- Tense.md1 kB
- Gender.md1 kB
- Polarity.md1 kB
- VerbForm.md3 kB
- Mood.md2 kB
- Person.md1 kB
- Poss.md869 B
- NumType.md1 kB
- PronType.md2 kB
- NumForm.md1 kB
- Animacy.md1 kB
- Case.md3 kB
- Variant.md1 kB
- Number-psor.md1 kB
- tokenization.md2 kB
- dep
- advcl.md2 kB
- obj.md2 kB
- nsubj.md1 kB
- vocative.md800 B
- cc-preconj.md920 B
- mark.md1 kB
- xcomp.md2 kB
- flat.md1 kB
- csubj.md2 kB
- reparandum.md563 B
- amod.md1 kB
- nmod.md2 kB
- nummod.md1 kB
- iobj.md1 kB
- acl.md2 kB
- case.md1 kB
- punct.md1 kB
- advmod.md3 kB
- ccomp.md1 kB
- parataxis.md4 kB
- goeswith.md892 B
- appos.md973 B
- cc.md2 kB
- fixed.md1 kB
- det.md1 kB
- discourse.md1 kB
- list.md823 B
- cop.md3 kB
- conj-extend.md747 B
- parataxis-discourse.md382 B
- orphan.md1 kB
- aux_.md1 kB
- obl.md4 kB
- root.md1 kB
- expl.md2 kB
- discourse-filler.md639 B
- dislocated.md970 B
- parataxis-restart.md757 B
- conj.md2 kB
- dep.md1 kB
- pos
- PRON.md1 kB
- ADV.md1 kB
- VERB.md1 kB
- CCONJ.md617 B
- NUM.md1 kB
- ADJ.md2 kB
- SCONJ.md733 B
- SYM.md1 kB
- DET.md2 kB
- NOUN.md629 B
- PROPN.md1 kB
- INTJ.md1 kB
- AUX_.md1 kB
- ADP.md1 kB
- PUNCT.md899 B
- X.md1 kB
- PART.md1 kB
- _da
- index.md4 kB
- pos-index.md132 B
- pos
- PRON.md1 kB
- ADV.md625 B
- VERB.md689 B
- CCONJ.md441 B
- NUM.md862 B
- ADJ.md800 B
- SCONJ.md466 B
- SYM.md330 B
- DET.md884 B
- NOUN.md352 B
- PROPN.md517 B
- INTJ.md438 B
- PUNCT.md386 B
- AUX_.md1 kB
- ADP.md334 B
- X.md564 B
- PART.md672 B
- _sk
- index.md14 kB
- _sla
- pos-index.md134 B
- pmltq.md5 kB
- introduction.md416 B
- pos
- PRON.md17 kB
- DET.md605 B
- _nap
- index.md3 kB
- _fy
- template-index.md1 kB
- _sa
- _qfn
- index.md2 kB
- _is
- index.md4 kB
- _shp
- template-index.md1 kB
- _bej
- index.md3 kB
- feat
- Definite.md420 B
- Aspect.md1 kB
- ReportedSpeech.md1 kB
- Number.md878 B
- Reflex.md772 B
- Foreign.md479 B
- Voice.md1 kB
- Degree.md1 kB
- Tense.md1 kB
- VerbType.md1 kB
- Singulative.md718 B
- Gender.md1 kB
- Polarity.md770 B
- VerbForm.md1001 B
- Mood.md948 B
- Poss.md684 B
- Person.md1 kB
- TokenType.md1 kB
- PronType.md1 kB
- NumType.md684 B
- Polite.md743 B
- VerbClass.md1 kB
- Case.md3 kB
- Deixis.md1 kB
- dep
- nsubj-aff.md741 B
- advcl.md738 B
- obj.md493 B
- nsubj.md662 B
- vocative.md559 B
- compound.md405 B
- reparandum.md560 B
- amod.md528 B
- conj-redup.md629 B
- dep-redup.md626 B
- nummod-det.md582 B
- nmod.md447 B
- acl-relcl.md650 B
- iobj.md815 B
- obl-mod.md379 B
- acl.md547 B
- nmod-poss.md405 B
- punct.md525 B
- advmod.md496 B
- case-aff.md628 B
- ccomp.md573 B
- parataxis.md724 B
- aux-aff.md675 B
- obl-arg.md466 B
- appos.md595 B
- cc.md723 B
- dep-comp.md697 B
- det.md444 B
- discourse.md543 B
- parataxis-mod.md609 B
- dep-aff.md702 B
- cop.md587 B
- acl-fixed.md526 B
- advmod-fixed.md585 B
- parataxis-coord.md447 B
- aux_.md532 B
- root.md546 B
- mark-aff.md706 B
- dep-conj.md672 B
- dislocated-subj.md484 B
- dislocated.md482 B
- pos
- PRON.md400 B
- ADV.md391 B
- VERB.md525 B
- CCONJ.md720 B
- NUM.md392 B
- ADJ.md475 B
- SCONJ.md778 B
- DET.md835 B
- NOUN.md425 B
- PROPN.md415 B
- INTJ.md367 B
- PUNCT.md523 B
- ADP.md521 B
- AUX_.md851 B
- X.md724 B
- PART.md534 B
- _lzh
- index.md3 kB
- dep
- discourse-sp.md1 kB
- flat-vv.md861 B
- template-index.md1 kB
- discussion.md1 kB
- _layouts
- home.html4 kB
- postag.html392 B
- feature.html453 B
- base.html4 kB
- relation.html414 B
- withembed.html141 B
- _nyn
- template-index.md1 kB
- _mag
- template-index.md1 kB
- _mdf
- index.md5 kB
- feat-index.md136 B
- feat
- Aspect.md1 kB
- AdvType.md1 kB
- Reflex.md867 B
- NameType.md2 kB
- NounType.md579 B
- VerbForm.md3 kB
- Mood.md4 kB
- Clitic.md2 kB
- Derivation.md2 kB
- NumType.md2 kB
- PartForm.md1 kB
- NumForm.md357 B
- Person-psor.md1 kB
- Connegative.md1 kB
- Valency.md883 B
- Variant.md1 kB
- Case.md6 kB
- PunctSide.md497 B
- Style.md370 B
- dep-index.md142 B
- dep
- advmod-freq.md652 B
- advmod-foc.md517 B
- obl-lmp.md1 kB
- nmod-poss.md487 B
- aux-cnd.md601 B
- advcl-eval.md584 B
- csubj-cop.md669 B
- obl-lto.md1 kB
- advmod-deg.md319 B
- advmod-lfrom.md758 B
- aux-opt.md752 B
- advmod-cmp.md532 B
- nmod-lmod.md732 B
- aux-neg.md1 kB
- nmod-appos.md935 B
- obl-cmp.md573 B
- nsubj-cop.md486 B
- advmod-mmod.md462 B
- nmod-bahuv.md578 B
- obl-inst.md681 B
- aux-q.md529 B
- advmod-tmod.md453 B
- advcl-cau.md651 B
- obl-lfrom.md924 B
- advcl-tcl.md757 B
- obl-freq.md700 B
- advmod-lto.md684 B
- advmod-cau.md624 B
- obl-cau.md618 B
- advmod-eval.md623 B
- nmod-gobj.md553 B
- nmod-tmod.md426 B
- aux-nec.md748 B
- _la
- .gitignore61 B
- index.md17 kB
- feat
- VerbForm.md27 kB
- Aspect.md16 kB
- AdvType.md3 kB
- NumValue.md2 kB
- Compound.md1 kB
- Variant.md2 kB
- PronType.md2 kB
- Form.md2 kB
- InflClass.md18 kB
- NumForm.md2 kB
- Degree.md13 kB
- NameType.md7 kB
- InflClass-nominal.md5 kB
- Proper.md2 kB
- dep
- nsubj-cleft.md3 kB
- obl-lmod.md5 kB
- iobj.md18 kB
- orphan-missing.md1 kB
- flat-gov.md1 kB
- conj-expl.md4 kB
- cop-outer.md1 kB
- advmod-lmod.md1 kB
- advcl-relcl.md5 kB
- advcl-cmp.md8 kB
- dislocated-ccomp.md2 kB
- obl-tmod.md2 kB
- dislocated-obj.md2 kB
- csubj-reported.md2 kB
- dislocated-csubj.md2 kB
- parataxis-rep.md2 kB
- csubj-cleft.md4 kB
- xcomp.md4 kB
- obl-cmp.md2 kB
- advmod-neg.md1 kB
- advmod-tmod.md1 kB
- parataxis-reporting.md1 kB
- dislocated-obl.md2 kB
- advcl-abs.md8 kB
- ccomp-reported.md1 kB
- csubj-relcl.md5 kB
- advcl-pred.md5 kB
- ccomp-relcl.md4 kB
- xcomp-relcl.md4 kB
- dislocated-advcl.md1 kB
- dislocated-nsubj.md1 kB
- template-index.md1 kB
- introduction.md4 kB
- _oc
- template-index.md1 kB
- _yue
- index.md2 kB
- pos-index.md145 B
- dep-index.md153 B
- dep
- obj.md3 kB
- advcl.md2 kB
- nsubj.md707 B
- vocative.md1 kB
- discourse-sp.md2 kB
- mark.md3 kB
- xcomp.md7 kB
- flat.md2 kB
- obl-patient.md918 B
- compound.md2 kB
- csubj.md977 B
- advcl-coverb.md2 kB
- reparandum.md1 kB
- dislocated-vo.md1 kB
- amod.md1 kB
- nmod.md2 kB
- nummod.md1 kB
- iobj.md1 kB
- clf-det.md1 kB
- nsubj-pass.md1 kB
- acl.md3 kB
- case.md3 kB
- mark-rel.md2 kB
- punct.md4 kB
- advmod.md4 kB
- aux-pass.md979 B
- obj-periph.md675 B
- case-loc.md1 kB
- clf.md4 kB
- ccomp.md7 kB
- parataxis.md4 kB
- goeswith.md1 kB
- appos.md2 kB
- compound-dir.md4 kB
- advmod-df.md2 kB
- cc.md1 kB
- csubj-pass.md842 B
- det.md1 kB
- obl-tmod.md2 kB
- compound-quant.md4 kB
- discourse.md4 kB
- list.md2 kB
- obl-agent.md1 kB
- cop.md1 kB
- nsubj-periph.md624 B
- compound-ext.md4 kB
- compound-vv.md4 kB
- orphan.md3 kB
- aux_.md3 kB
- obl.md3 kB
- root.md2 kB
- expl.md1 kB
- compound-vo.md3 kB
- dislocated.md4 kB
- mark-adv.md667 B
- conj.md5 kB
- pos
- PRON.md1 kB
- ADV.md3 kB
- VERB.md743 B
- CCONJ.md615 B
- NUM.md970 B
- ADJ.md1 kB
- SCONJ.md1 kB
- SYM.md850 B
- DET.md1 kB
- NOUN.md993 B
- PROPN.md825 B
- INTJ.md1 kB
- PUNCT.md495 B
- ADP.md1 kB
- AUX_.md1 kB
- X.md791 B
- PART.md2 kB
- _say
- index.md5 kB
- feat
- Mood.md738 B
- Aspect.md4 kB
- Tense.md1 kB
- _u-dep
- obj.md1 kB
- nsubj.md2 kB
- advcl.md2 kB
- vocative.md670 B
- det-numgov.md1 kB
- cc-preconj.md544 B
- mark.md1 kB
- flat.md9 kB
- compound-prt.md761 B
- xcomp.md6 kB
- compound.md1 kB
- csubj.md1 kB
- flat-foreign.md759 B
- expl-pv.md927 B
- reparandum.md457 B
- amod.md728 B
- flat-name.md1 kB
- nmod.md909 B
- nummod.md1 kB
- acl-relcl.md1 kB
- iobj.md11 kB
- nsubj-pass.md644 B
- nmod-tmod.md397 B
- expl-impers.md1 kB
- acl.md1 kB
- case.md5 kB
- nmod-poss.md533 B
- punct.md2 kB
- advmod.md1 kB
- aux-pass.md1 kB
- advmod-lmod.md415 B
- clf.md4 kB
- ccomp.md3 kB
- parataxis.md4 kB
- goeswith.md1 kB
- obl-arg.md2 kB
- appos.md4 kB
- compound-svc.md4 kB
- cc.md1 kB
- obl-lmod.md440 B
- csubj-pass.md760 B
- fixed.md1 kB
- det.md864 B
- obl-tmod.md442 B
- discourse.md917 B
- compound-redup.md1 kB
- list.md2 kB
- expl-pass.md616 B
- obl-agent.md1 kB
- cop.md4 kB
- advmod-emph.md1 kB
- det-nummod.md1 kB
- orphan.md1 kB
- aux_.md1 kB
- obl.md2 kB
- root.md1 kB
- nummod-gov.md1 kB
- csubj-outer.md1 kB
- nsubj-outer.md1 kB
- expl.md5 kB
- dislocated.md1 kB
- det-poss.md652 B
- compound-lvc.md1 kB
- dep.md599 B
- conj.md5 kB
- _pra
- index.md2 kB
- _fro
- dep
- obj-advmod.md951 B
- amod.md1 kB
- conj.md761 B
- cc.md793 B
- advmod.md1 kB
- obj-advneg.md948 B
- iobj.md1 kB
- obl-advmod.md851 B
- acl.md2 kB
- orphan.md1 kB
- nsubj-obj.md960 B
- ccomp.md1 kB
- dep
- _kpv
- index.md3 kB
- feat-index.md136 B
- feat
- Valency.md845 B
- VerbForm.md2 kB
- NounType.md541 B
- Variant.md1 kB
- Reflex.md896 B
- PronType.md1 kB
- NumType.md1 kB
- Case.md11 kB
- Person-psor.md1 kB
- PartForm.md972 B
- Connegative.md655 B
- Derivation.md5 kB
- Clitic.md1 kB
- dep-index.md142 B
- dep
- flat-num.md308 B
- aux-aspect.md572 B
- advmod-lfrom.md778 B
- cc-preconj.md759 B
- advmod-freq.md604 B
- obl-lfrom.md1006 B
- flat-foreign.md1 kB
- csubj.md436 B
- advmod-eval.md617 B
- advmod-lmp.md566 B
- nmod-lfrom.md619 B
- advcl-lcl.md810 B
- advmod-foc.md506 B
- nmod-lmod.md599 B
- obl-lmp.md900 B
- aux-nec.md716 B
- advcl-tcl.md731 B
- nmod-poss.md490 B
- advmod-lmod.md572 B
- nmod-subj.md592 B
- advmod-mmod.md540 B
- advcl-eval.md570 B
- advmod-tmod.md404 B
- nmod-prp.md505 B
- advmod-deg.md385 B
- aux-tense.md757 B
- aux-pot.md852 B
- aux-cnd.md518 B
- obl-lmod.md449 B
- obl-cmp.md803 B
- nsubj-cop.md587 B
- obl-agent.md479 B
- cop.md2 kB
- csubj-cop.md741 B
- advcl-lto.md850 B
- advmod-emph.md677 B
- nmod-comp.md782 B
- nmod-appos.md1 kB
- advmod-lto.md756 B
- advmod-cau.md546 B
- nmod-obj.md650 B
- obl-mcl.md651 B
- aux-neg.md1 kB
- obl-cau.md722 B
- obl-lto.md725 B
- pos
- PRON.md145 B
- VERB.md142 B
- ADV.md410 B
- NUM.md144 B
- CCONJ.md163 B
- ADJ.md146 B
- SCONJ.md164 B
- DET.md147 B
- NOUN.md352 B
- PROPN.md150 B
- INTJ.md150 B
- AUX_.md1 kB
- PUNCT.md150 B
- ADP.md147 B
- X.md140 B
- PART.md1 kB
- _gub
- index.md8 kB
- feat
- Aspect.md1 kB
- Prp.md532 B
- Number.md1 kB
- Voice.md1 kB
- Foreign.md685 B
- Degree.md586 B
- Nomzr.md1 kB
- Tense.md1 kB
- Int.md803 B
- Emph.md634 B
- Polarity.md839 B
- VerbForm.md767 B
- Mood.md1 kB
- Person.md1 kB
- Poss.md824 B
- Red.md799 B
- Foc.md733 B
- PronType.md1 kB
- Speech.md1 kB
- Detrans.md709 B
- Rel.md1 kB
- Clusivity.md760 B
- False.md720 B
- Evident.md1 kB
- Case.md2 kB
- NonFoc.md821 B
- Deo.md741 B
- dep
- obl.md721 B
- det.md452 B
- iobj.md782 B
- obl-subj.md663 B
- obl-obj.md663 B
- case.md906 B
- ccomp.md1 kB
- advcl.md871 B
- aux_.md1018 B
- nmod.md1007 B
- pos
- AUX_.md515 B
- ADP.md772 B
- ADV.md422 B
- _sjo
- index.md4 kB
- dep
- mark-plur.md335 B
- mark-rel.md468 B
- mark-adv.md1 kB
- _tr
- index.md3 kB
- feat-index.md145 B
- specific-syntax.md7 kB
- tokenization.md8 kB
- feat
- VerbForm.md2 kB
- Number-psor.md603 B
- Person.md2 kB
- Number.md2 kB
- Aspect.md3 kB
- Polarity.md1 kB
- Definite.md556 B
- Reflex.md630 B
- PronType.md1 kB
- NumType.md1 kB
- Case.md5 kB
- Degree.md892 B
- Person-psor.md782 B
- Evident.md1 kB
- Tense.md4 kB
- Voice.md7 kB
- Mood.md9 kB
- dep-index.md151 B
- pos
- PRON.md861 B
- ADV.md534 B
- VERB.md1 kB
- CCONJ.md492 B
- NUM.md901 B
- ADJ.md726 B
- SCONJ.md1 kB
- SYM.md326 B
- DET.md1 kB
- NOUN.md1 kB
- PROPN.md788 B
- INTJ.md539 B
- PUNCT.md565 B
- ADP.md1 kB
- AUX_.md872 B
- X.md331 B
- PART.md562 B
- dep
- advcl.md1 kB
- obj.md1 kB
- nsubj.md1 kB
- vocative.md362 B
- advcl-cond.md877 B
- discourse-q.md1 kB
- mark.md1 kB
- xcomp.md1 kB
- flat.md1 kB
- compound.md912 B
- flat-foreign.md517 B
- csubj.md628 B
- reparandum.md395 B
- amod.md681 B
- nmod.md783 B
- nummod.md632 B
- iobj.md354 B
- nsubj-pass.md504 B
- acl.md1 kB
- case.md1 kB
- punct.md311 B
- nmod-poss.md547 B
- advmod.md1 kB
- ccomp.md1 kB
- parataxis.md693 B
- dep-der.md1 kB
- goeswith.md423 B
- appos.md920 B
- cc.md1 kB
- csubj-pass.md635 B
- fixed.md934 B
- det.md609 B
- obl-tmod.md772 B
- discourse.md812 B
- list.md797 B
- compound-redup.md1 kB
- nsubj-cop.md579 B
- obl-agent.md830 B
- cop.md1 kB
- csubj-cop.md663 B
- advmod-emph.md655 B
- nmod-comp.md679 B
- orphan.md461 B
- aux_.md1 kB
- obj-cau.md1 kB
- obl.md1 kB
- root.md610 B
- nmod-part.md1 kB
- aux-q.md953 B
- dislocated.md1 kB
- compound-lvc.md1 kB
- obl-cau.md1 kB
- conj.md1 kB
- dep.md421 B
- pos-index.md132 B
- notes.md15 kB
- _data
- features.yaml26 kB
- postags.yaml12 kB
- relations.yaml51 kB
- validation.yaml41 B
- _be
- index.md9 kB
- feat
- Variant.md1 kB
- InflClass.md1 kB
- tokenization.md4 kB
- syntax.md508 B
- introduction.md2 kB
- _ajp
- index.md2 kB
- markdown-source
- ... too many files ...0 B
- Name
- ud-tools-v2.12.tgz
- Size
- 835.26 KB
- Format
- application/x-gzip
- Description
- Tools
- MD5
- 607ed66fed1f9410c7d54c8072f6fa0d
- ud-tools-v2.12
- check_text_wosp_match.sh814 B
- conll_convert_tags_to_uposf.pl1 kB
- conllu-sort-sentences-by-ids.pl1 kB
- check_sentence_ids.pl1 kB
- conllu-stats.py6 kB
- package_st_data.sh10 kB
- conllu-w2t.py2 kB
- file_util.pyc2 kB
- example-data
- long-token-to-text-wrong.txt333 B
- long-token-to-text-correct.txt332 B
- long-token-to-text.conllu2 kB
- tanl.conll471 B
- conllu-copy-basic-to-enhanced.pl1 kB
- evaluate_treebank.pl18 kB
- enhanced_classify_relations.pl26 kB
- package_ud_release.sh7 kB
- conllu-stats.pl107 kB
- conllu-dependency-stats.pl944 B
- check-space-after-paragraph.pl2 kB
- file_util.py2 kB
- conllu-quick-fix-id-sequence.pl2 kB
- conllu_copy_tokenization.pl10 kB
- check_release.pl31 kB
- conllu-formconvert.py3 kB
- find_duplicate_sentences.pl1 kB
- survey_misc.pl6 kB
- remove_duplicate_sentences.pl2 kB
- survey_feature_language.pl8 kB
- fix_format_of_deps.pl1 kB
- conllu_to_conllx.pl2 kB
- mwtoken-stats.pl1 kB
- LICENSE.txt17 kB
- restore_conllu_lines.pl1 kB
- Node.pm18 kB
- overlap.py2 kB
- collect_propn_sequences.pl3 kB
- __pycache__
- file_util.cpython-311.pyc4 kB
- file_util.cpython-37.pyc2 kB
- survey_features.pl11 kB
- fix-space-after-paragraph.pl4 kB
- survey_deprel_subtypes.pl8 kB
- udlib.pm61 kB
- compat
- argparse.pyc65 kB
- argparse.py85 kB
- __init__.pyc140 B
- __init__.py0 B
- v2-conversion
- convert.py3 kB
- README.md2 kB
- processors_en.py1 kB
- processors_universal.py5 kB
- nmod_obl_adjudication.py3 kB
- depgraph_utils.py6 kB
- text_without_spaces.pl2 kB
- conllu_copy_sentence_segmentation.pl7 kB
- generate_comparison_of_treebanks.pl2 kB
- remove_sense_suffixes_from_lemmas.pl1 kB
- csort.pm7 kB
- conllu_cut.pl2 kB
- enhanced_graph_properties.pl21 kB
- validate.py186 kB
- create_iso_639_3_symlinks.py175 kB
- conllu-quick-fix.pl20 kB
- eval.py42 kB
- conllu-break-cycles.pl3 kB
- survey_paradigms.pl20 kB
- test-cases
- nonvalid
- lowercase-postag.conllu141 B
- lowercase-feature-value-in-empty.conllu251 B
- empty-head.conllu114 B
- invalid-deps-id.conllu173 B
- misordered-feature.conllu243 B
- invalid-deps-syntax.conllu194 B
- missing-final-line.conllu155 B
- empty-field.conllu100 B
- head-not-0-deprel-root.conllu172 B
- ambiguous-feature.conllu175 B
- empty-sentence.conllu163 B
- trailing-tab.conllu127 B
- lowercase-postag-in-empty.conllu239 B
- head-0-deprel-not-root.conllu133 B
- malformed_deps.conllu683 B
- multiple-sent_id.conllu736 B
- lowercase-feature.conllu238 B
- head-not-empty-in-empty.conllu224 B
- duplicate-value.conllu137 B
- tanl-broken.conllu690 B
- misordered-layered-feature.conllu239 B
- whitespace_nonv.conllu274 B
- misplaced-comment-end.conllu429 B
- nonsequential-empty-node-id.conllu238 B
- dos-newlines.conllu698 B
- duplicate-layered-feature.conllu182 B
- cyclic-deps.conllu227 B
- invalid-head.conllu164 B
- id-with-extra-0.conllu140 B
- overlapping-multiword.conllu387 B
- duplicate-feature.conllu142 B
- token_with_cols_filled.conllu385 B
- self-cycle-deps.conllu164 B
- nonsequential-id.conllu176 B
- space-in-field.conllu127 B
- extra-empty-line.conllu287 B
- lowercase-feature-in-empty.conllu244 B
- non-proj.conllu109 B
- no-sent_id.conllu686 B
- misindexed-empty-node.conllu235 B
- id-starting-from-2.conllu247 B
- self-cycle-head.conllu190 B
- invalid-range.conllu375 B
- empty-node-without-dependent.conllu251 B
- multiword-with-pos.conllu407 B
- uppercase-deps-deprel.conllu206 B
- uppercase-deprel.conllu184 B
- invalid-deps-order.conllu409 B
- missing-space-after.conllu176 B
- extra-field.conllu130 B
- invalid-range-format.conllu380 B
- duplicate-id.conllu171 B
- deprel-not-empty-in-empty.conllu233 B
- misplaced-comment-mid.conllu401 B
- misordered-multiword.conllu392 B
- lowercase-value.conllu237 B
- valid
- maximal-empty-node.conllu273 B
- multiple-features.conllu295 B
- whitespace.conllu294 B
- id_test_part2.conllu375 B
- empty-nodes.conllu324 B
- id_test_part1.conllu375 B
- tanl.conllu673 B
- empty-file.conllu0 B
- minimal-empty-node.conllu239 B
- layered-features.conllu272 B
- nonvalid
- README.md12 kB
- save_evaluation_logs.sh962 B
- conllu-tenfold.pl2 kB
- conllu-remove-enhanced-deps.pl443 B
- mergept.pl2 kB
- Graph.pm12 kB
- normalize_unicode.pl511 B
- data
- deprel.shopen311 B
- edeprel.ta2 kB
- tokens_w_space.ud27 B
- edeprel.ar27 kB
- tokens_w_space.br443 B
- tokens_w_space.koi86 B
- docdeps.json242 kB
- tokens_w_space.kk859 B
- tokens_w_space.nl555 B
- cpos.ud79 B
- edeprels.json831 kB
- tokens_w_space.hit72 B
- edeprel.lt2 kB
- tokens_w_space.am82 B
- deprels.json734 kB
- tokens_w_space.sv131 B
- tokens_w_space.myv82 B
- tokens_w_space.mdf82 B
- tokens_w_space.pl366 B
- edeprel.uk5 kB
- feats.json1 MB
- tokens_w_space.akk246 B
- tokens_w_space.ja844 B
- tokens_w_space.vi3 B
- deprel.ud237 B
- data.json441 kB
- tokens_w_space.fro10 B
- tokens_w_space.kpv86 B
- tokens_w_space.shopen9 B
- feat_val.shopen2 kB
- tokens_w_space.kmr277 B
- docfeats.json1 MB
- tokens_w_space.fr10 B
- tokens_w_space.lv112 B
- tokens_w_space.sms151 B
- tokens_w_space.lt1 kB
- tokens_w_space.sjo2 kB
- README.md808 B
- tokens_w_space.apu123 B
- tokens_w_space.fi78 B
- tokens_w_space.sga86 B
- generate_treebank_hub.pl1 kB
- conllu_to_text.pl9 kB
- check_overlaps.pl1 kB
- conllu_align_tokens.pl6 kB
- survey_enhancements.pl7 kB
- enhanced_collapse_empty_nodes.pl8 kB
- check_files.pl3 kB
- klcpos3.pl1 kB