Files in this item
Download all files in item (650.18 MB)- Name
- ud-treebanks-v2.15.tgz
- Size
- 539.05 MB
- Format
- application/x-gzip
- Description
- Treebank data
- MD5
- 1ebca6a1cf594ea689c1687a56fbb9d4
- ud-treebanks-v2.15
- UD_English-PUD
- stats.xml9 kB
- en_pud-ud-test.conllu1 MB
- README.md6 kB
- LICENSE.txt19 kB
- en_pud-ud-test.txt109 kB
- UD_Latvian-Cairo
- stats.xml7 kB
- README.md2 kB
- lv_cairo-ud-test.conllu20 kB
- LICENSE.txt202 B
- lv_cairo-ud-test.txt982 B
- UD_Telugu-MTG
- te_mtg-ud-test.txt10 kB
- README.md1 kB
- te_mtg-ud-train.conllu435 kB
- te_mtg-ud-dev.conllu56 kB
- stats.xml3 kB
- te_mtg-ud-test.conllu61 kB
- LICENSE.txt202 B
- te_mtg-ud-train.txt72 kB
- te_mtg-ud-dev.txt9 kB
- UD_Finnish-PUD
- stats.xml17 kB
- README.txt2 kB
- fi_pud-ud-test.txt119 kB
- LICENSE.txt202 B
- fi_pud-ud-test.conllu1 MB
- UD_Neapolitan-RB
- stats.xml1 kB
- README.md1 kB
- LICENSE.txt202 B
- nap_rb-ud-test.conllu431 B
- nap_rb-ud-test.txt56 B
- UD_Icelandic-GC
- README.md1 kB
- is_gc-ud-train.txt485 kB
- is_gc-ud-dev.conllu949 kB
- is_gc-ud-train.conllu6 MB
- is_gc-ud-test.conllu915 kB
- stats.xml8 kB
- LICENSE.txt202 B
- is_gc-ud-test.txt64 kB
- is_gc-ud-dev.txt65 kB
- UD_Turkish-Atis
- tr_atis-ud-train.conllu2 MB
- README.md1 kB
- tr_atis-ud-dev.conllu351 kB
- tr_atis-ud-test.txt38 kB
- tr_atis-ud-dev.txt38 kB
- stats.xml11 kB
- LICENSE.txt202 B
- tr_atis-ud-train.txt289 kB
- tr_atis-ud-test.conllu356 kB
- UD_Chinese-Beginner
- stats.xml5 kB
- README.md3 kB
- zh_beginner-ud-test.txt73 kB
- zh_beginner-ud-test.conllu2 MB
- LICENSE.txt801 B
- UD_Komi_Zyrian-IKDP
- stats.xml16 kB
- README.md5 kB
- LICENSE.txt202 B
- kpv_ikdp-ud-test.txt20 kB
- kpv_ikdp-ud-test.conllu202 kB
- UD_Czech-CLTT
- cs_cltt-ud-dev.conllu1 MB
- cs_cltt-ud-test.txt81 kB
- README.md4 kB
- cs_cltt-ud-train.txt96 kB
- cs_cltt-ud-dev.txt76 kB
- cs_cltt-ud-train.conllu1 MB
- stats.xml13 kB
- LICENSE.txt265 B
- cs_cltt-ud-test.conllu1 MB
- UD_Czech-PUD
- stats.xml15 kB
- README.md3 kB
- LICENSE.txt202 B
- cs_pud-ud-test.txt114 kB
- cs_pud-ud-test.conllu2 MB
- UD_Swiss_German-UZH
- gsw_uzh-ud-test.txt7 kB
- stats.xml2 kB
- README.md3 kB
- LICENSE.txt202 B
- gsw_uzh-ud-test.conllu58 kB
- UD_Sinhala-STB
- stats.xml14 kB
- README.md1 kB
- si_stb-ud-test.txt11 kB
- LICENSE.txt202 B
- si_stb-ud-test.conllu109 kB
- UD_Kiche-IU
- stats.xml11 kB
- quc_iu-ud-test.conllu823 kB
- README.md1 kB
- quc_iu-ud-test.txt46 kB
- LICENSE.txt202 B
- UD_Akuntsu-TuDeT
- stats.xml7 kB
- aqz_tudet-ud-test.conllu95 kB
- README.md3 kB
- aqz_tudet-ud-test.txt7 kB
- LICENSE.txt202 B
- UD_German-GSD
- README.md9 kB
- de_gsd-ud-dev.conllu883 kB
- de_gsd-ud-dev.txt72 kB
- de_gsd-ud-train.txt1 MB
- de_gsd-ud-test.conllu1 MB
- stats.xml11 kB
- de_gsd-ud-train.conllu18 MB
- LICENSE.txt202 B
- de_gsd-ud-test.txt97 kB
- UD_Vietnamese-TueCL
- stats.xml9 kB
- vi_tuecl-ud-test.conllu115 kB
- README.md810 B
- vi_tuecl-ud-test.txt11 kB
- LICENSE.txt202 B
- UD_Japanese-PUD
- stats.xml3 kB
- ja_pud-ud-test.txt138 kB
- README.md5 kB
- ja_pud-ud-test.conllu6 MB
- LICENSE.txt19 kB
- UD_Italian-Valico
- stats.xml8 kB
- README.md3 kB
- LICENSE.txt202 B
- it_valico-ud-test.conllu520 kB
- it_valico-ud-test.txt31 kB
- UD_English-ESLSpok
- README.md3 kB
- en_eslspok-ud-train.conllu646 kB
- en_eslspok-ud-dev.conllu82 kB
- stats.xml3 kB
- en_eslspok-ud-test.txt9 kB
- LICENSE.txt202 B
- en_eslspok-ud-train.txt72 kB
- en_eslspok-ud-test.conllu85 kB
- en_eslspok-ud-dev.txt9 kB
- UD_Italian-Old
- it_old-ud-train.txt418 kB
- README.md4 kB
- it_old-ud-dev.conllu979 kB
- it_old-ud-test.conllu979 kB
- it_old-ud-test.txt52 kB
- it_old-ud-train.conllu7 MB
- stats.xml10 kB
- LICENSE.txt202 B
- it_old-ud-dev.txt53 kB
- UD_Chinese-PUD
- stats.xml5 kB
- README.md5 kB
- zh_pud-ud-test.conllu2 MB
- zh_pud-ud-test.txt101 kB
- LICENSE.txt19 kB
- UD_Teko-TuDeT
- stats.xml15 kB
- eme_tudet-ud-test.txt22 kB
- eme_tudet-ud-test.conllu254 kB
- README.md1 kB
- LICENSE.txt202 B
- UD_Buryat-BDT
- UD_Abaza-ATB
- stats.xml17 kB
- abq_atb-ud-test.conllu125 kB
- README.md1 kB
- abq_atb-ud-test.txt9 kB
- LICENSE.txt202 B
- UD_Turkish-FrameNet
- README.md1 kB
- tr_framenet-ud-dev.txt9 kB
- tr_framenet-ud-train.conllu1 MB
- tr_framenet-ud-dev.conllu108 kB
- stats.xml11 kB
- LICENSE.txt202 B
- tr_framenet-ud-test.conllu111 kB
- tr_framenet-ud-train.txt111 kB
- tr_framenet-ud-test.txt10 kB
- UD_Latin-PROIEL
- la_proiel-ud-dev.txt87 kB
- README.md2 kB
- la_proiel-ud-dev.conllu1 MB
- la_proiel-ud-test.txt88 kB
- stats.xml10 kB
- la_proiel-ud-train.conllu15 MB
- LICENSE.txt279 B
- la_proiel-ud-train.txt1 MB
- la_proiel-ud-test.conllu1 MB
- UD_English-GUMReddit
- README.md32 kB
- en_gumreddit-ud-train.txt23 kB
- en_gumreddit-ud-train.conllu1 MB
- en_gumreddit-ud-dev.conllu194 kB
- get_text.py28 kB
- en_gumreddit-ud-dev.txt3 kB
- stats.xml7 kB
- en_gumreddit-ud-test.txt3 kB
- LICENSE.txt313 B
- en_gumreddit-ud-test.conllu196 kB
- UD_Sanskrit-Vedic
- sa_vedic-ud-train.conllu22 MB
- README.md2 kB
- sa_vedic-ud-train.txt1 MB
- sa_vedic-ud-test.conllu2 MB
- sa_vedic-ud-dev.txt184 kB
- stats.xml10 kB
- sa_vedic-ud-test.txt160 kB
- LICENSE.txt202 B
- sa_vedic-ud-dev.conllu3 MB
- UD_Warlpiri-UFAL
- stats.xml6 kB
- README.md870 B
- LICENSE.txt202 B
- wbp_ufal-ud-test.conllu37 kB
- wbp_ufal-ud-test.txt2 kB
- UD_Icelandic-Modern
- README.md6 kB
- is_modern-ud-dev.txt48 kB
- is_modern-ud-dev.conllu700 kB
- is_modern-ud-train.conllu5 MB
- is_modern-ud-test.conllu832 kB
- is_modern-ud-train.txt361 kB
- is_modern-ud-test.txt59 kB
- stats.xml9 kB
- LICENSE.txt202 B
- UD_Turkish-IMST
- tr_imst-ud-test.txt64 kB
- README.md4 kB
- tr_imst-ud-train.conllu2 MB
- tr_imst-ud-test.conllu821 kB
- tr_imst-ud-dev.conllu873 kB
- tr_imst-ud-dev.txt69 kB
- stats.xml13 kB
- LICENSE.txt20 kB
- tr_imst-ud-train.txt242 kB
- UD_Japanese-GSDLUW
- ja_gsdluw-ud-train.conllu25 MB
- README.md8 kB
- ja_gsdluw-ud-dev.txt58 kB
- ja_gsdluw-ud-test.txt62 kB
- ja_gsdluw-ud-test.conllu2 MB
- stats.xml4 kB
- ja_gsdluw-ud-train.txt804 kB
- LICENSE.txt202 B
- ja_gsdluw-ud-dev.conllu1 MB
- UD_French-FQB
- stats.xml8 kB
- fr_fqb-ud-test.conllu1 MB
- fr_fqb-ud-test.txt117 kB
- README.md3 kB
- LICENSE.txt14 kB
- UD_French-PUD
- fr_pud-ud-test.txt130 kB
- stats.xml8 kB
- fr_pud-ud-test.conllu1 MB
- README.md5 kB
- LICENSE.txt19 kB
- UD_English-GUM
- en_gum-ud-test.txt120 kB
- README.md36 kB
- en_gum-ud-dev.txt114 kB
- en_gum-ud-train.conllu15 MB
- en_gum-ud-dev.conllu2 MB
- stats.xml11 kB
- en_gum-ud-test.conllu2 MB
- en_gum-ud-train.txt792 kB
- LICENSE.txt1 kB
- UD_Moksha-JR
- stats.xml26 kB
- README.md6 kB
- mdf_jr-ud-train.txt1 kB
- mdf_jr-ud-test.txt43 kB
- mdf_jr-ud-test.conllu485 kB
- mdf_jr-ud-train.conllu18 kB
- LICENSE.txt202 B
- UD_Azerbaijani-TueCL
- az_tuecl-ud-test.txt4 kB
- stats.xml3 kB
- README.md1 kB
- az_tuecl-ud-test.conllu63 kB
- LICENSE.txt202 B
- UD_Irish-Cadhan
- ga_cadhan-ud-test.txt24 kB
- stats.xml12 kB
- README.md5 kB
- ga_cadhan-ud-test.conllu343 kB
- LICENSE.txt202 B
- UD_Spanish_Sign_Language-LSE
- stats.xml2 kB
- README.md2 kB
- LICENSE.txt202 B
- ssp_lse-ud-test.conllu150 kB
- ssp_lse-ud-test.txt14 kB
- UD_French-ParTUT
- README.md5 kB
- fr_partut-ud-dev.conllu117 kB
- fr_partut-ud-train.conllu1 MB
- fr_partut-ud-test.txt14 kB
- fr_partut-ud-train.txt128 kB
- stats.xml8 kB
- LICENSE.txt18 kB
- fr_partut-ud-test.conllu165 kB
- fr_partut-ud-dev.txt9 kB
- UD_Spanish-GSD
- README.md6 kB
- es_gsd-ud-test.conllu737 kB
- es_gsd-ud-train.conllu22 MB
- es_gsd-ud-test.txt61 kB
- es_gsd-ud-train.txt1 MB
- es_gsd-ud-dev.conllu2 MB
- es_gsd-ud-dev.txt191 kB
- stats.xml12 kB
- LICENSE.txt202 B
- UD_Ancient_Greek-Perseus
- README.md4 kB
- grc_perseus-ud-dev.txt250 kB
- grc_perseus-ud-test.conllu1 MB
- grc_perseus-ud-test.txt231 kB
- stats.xml10 kB
- grc_perseus-ud-train.txt1 MB
- grc_perseus-ud-train.conllu14 MB
- LICENSE.txt279 B
- grc_perseus-ud-dev.conllu1 MB
- UD_Skolt_Sami-Giellagas
- stats.xml12 kB
- sms_giellagas-ud-test.conllu222 kB
- sms_giellagas-ud-test.txt16 kB
- README.md4 kB
- LICENSE.txt202 B
- sms_giellagas-ud-train.conllu16 kB
- sms_giellagas-ud-train.txt1 kB
- UD_Coptic-Scriptorium
- README.md12 kB
- cop_scriptorium-ud-test.conllu969 kB
- cop_scriptorium-ud-test.txt80 kB
- cop_scriptorium-ud-train.conllu3 MB
- cop_scriptorium-ud-dev.conllu1 MB
- stats.xml9 kB
- LICENSE.txt538 B
- cop_scriptorium-ud-dev.txt85 kB
- cop_scriptorium-ud-train.txt270 kB
- UD_Polish-LFG
- pl_lfg-ud-dev.txt74 kB
- pl_lfg-ud-train.txt596 kB
- README.md6 kB
- pl_lfg-ud-test.txt74 kB
- pl_lfg-ud-dev.conllu1 MB
- pl_lfg-ud-test.conllu1 MB
- stats.xml14 kB
- LICENSE.txt34 kB
- pl_lfg-ud-train.conllu11 MB
- UD_Romanian-ArT
- ro_art-ud-test.conllu44 kB
- stats.xml8 kB
- README.md1 kB
- ro_art-ud-test.txt2 kB
- LICENSE.txt202 B
- UD_Russian-GSD
- ru_gsd-ud-dev.conllu1 MB
- README.md1 kB
- ru_gsd-ud-test.conllu1003 kB
- ru_gsd-ud-dev.txt123 kB
- ru_gsd-ud-train.txt794 kB
- ru_gsd-ud-test.txt120 kB
- stats.xml13 kB
- LICENSE.txt202 B
- ru_gsd-ud-train.conllu6 MB
- UD_Komi_Zyrian-Lattice
- stats.xml25 kB
- README.md7 kB
- kpv_lattice-ud-test.txt78 kB
- LICENSE.txt202 B
- kpv_lattice-ud-train.txt1 kB
- kpv_lattice-ud-test.conllu724 kB
- kpv_lattice-ud-train.conllu14 kB
- UD_Chinese-PatentChar
- stats.xml2 kB
- zh_patentchar-ud-test.txt23 kB
- README.md1 kB
- zh_patentchar-ud-test.conllu368 kB
- LICENSE.txt202 B
- UD_Italian-ParTUT
- README.md4 kB
- it_partut-ud-dev.txt15 kB
- it_partut-ud-test.txt19 kB
- it_partut-ud-train.txt259 kB
- stats.xml9 kB
- it_partut-ud-test.conllu234 kB
- it_partut-ud-dev.conllu189 kB
- LICENSE.txt18 kB
- it_partut-ud-train.conllu3 MB
- UD_Yakut-YKTDT
- stats.xml10 kB
- README.md2 kB
- sah_yktdt-ud-test.txt15 kB
- LICENSE.txt202 B
- sah_yktdt-ud-test.conllu148 kB
- UD_Hungarian-Szeged
- hu_szeged-ud-train.conllu1 MB
- README.md4 kB
- hu_szeged-ud-test.txt72 kB
- hu_szeged-ud-train.txt137 kB
- hu_szeged-ud-test.conllu738 kB
- stats.xml16 kB
- hu_szeged-ud-dev.conllu823 kB
- LICENSE.txt30 B
- hu_szeged-ud-dev.txt83 kB
- UD_Portuguese-PetroGold
- README.md3 kB
- pt_petrogold-ud-test.txt154 kB
- pt_petrogold-ud-dev.conllu1 MB
- pt_petrogold-ud-train.conllu12 MB
- stats.xml9 kB
- pt_petrogold-ud-dev.txt115 kB
- LICENSE.txt202 B
- pt_petrogold-ud-train.txt1 MB
- pt_petrogold-ud-test.conllu1 MB
- UD_Lithuanian-ALKSNIS
- lt_alksnis-ud-train.txt317 kB
- README.md4 kB
- lt_alksnis-ud-test.conllu1 MB
- lt_alksnis-ud-train.conllu4 MB
- stats.xml13 kB
- lt_alksnis-ud-dev.conllu1 MB
- lt_alksnis-ud-test.txt69 kB
- LICENSE.txt202 B
- lt_alksnis-ud-dev.txt78 kB
- UD_Kyrgyz-TueCL
- stats.xml6 kB
- ky_tuecl-ud-test.txt9 kB
- README.md1 kB
- ky_tuecl-ud-test.conllu101 kB
- LICENSE.txt202 B
- UD_Umbrian-IKUVINA
- stats.xml6 kB
- xum_ikuvina-ud-test.conllu48 kB
- xum_ikuvina-ud-test.txt4 kB
- README.md1 kB
- LICENSE.txt202 B
- UD_Classical_Armenian-CAVaL
- README.md6 kB
- xcl_caval-ud-train.txt509 kB
- xcl_caval-ud-train.conllu8 MB
- xcl_caval-ud-test.txt83 kB
- xcl_caval-ud-test.conllu1 MB
- stats.xml14 kB
- xcl_caval-ud-dev.txt66 kB
- LICENSE.txt219 B
- xcl_caval-ud-dev.conllu1 MB
- UD_Livvi-KKPP
- stats.xml10 kB
- README.md4 kB
- olo_kkpp-ud-train.txt808 B
- olo_kkpp-ud-test.conllu103 kB
- olo_kkpp-ud-test.txt9 kB
- LICENSE.txt202 B
- olo_kkpp-ud-train.conllu15 kB
- UD_German-PUD
- stats.xml10 kB
- README.md5 kB
- LICENSE.txt19 kB
- de_pud-ud-test.conllu1 MB
- de_pud-ud-test.txt126 kB
- UD_Western_Armenian-ArmTDP
- README.md3 kB
- hyw_armtdp-ud-test.txt141 kB
- hyw_armtdp-ud-train.txt1006 kB
- hyw_armtdp-ud-dev.txt133 kB
- hyw_armtdp-ud-test.conllu1 MB
- hyw_armtdp-ud-dev.conllu1 MB
- stats.xml24 kB
- LICENSE.txt202 B
- hyw_armtdp-ud-train.conllu12 MB
- UD_Urdu-UDTB
- README.md2 kB
- ur_udtb-ud-train.txt853 kB
- ur_udtb-ud-test.txt117 kB
- ur_udtb-ud-train.conllu15 MB
- stats.xml11 kB
- ur_udtb-ud-test.conllu2 MB
- ur_udtb-ud-dev.txt115 kB
- LICENSE.txt247 B
- ur_udtb-ud-dev.conllu2 MB
- UD_Kaapor-TuDeT
- stats.xml4 kB
- README.md2 kB
- urb_tudet-ud-test.txt2 kB
- LICENSE.txt202 B
- urb_tudet-ud-test.conllu24 kB
- UD_Akkadian-PISANDUB
- stats.xml3 kB
- README.md871 B
- akk_pisandub-ud-test.txt15 kB
- LICENSE.txt202 B
- akk_pisandub-ud-test.conllu99 kB
- UD_Ottoman_Turkish-DUDU
- stats.xml10 kB
- README.md1 kB
- ota_dudu-ud-test.conllu63 kB
- ota_dudu-ud-test.txt5 kB
- LICENSE.txt202 B
- UD_Portuguese-GSD
- pt_gsd-ud-test.conllu1 MB
- README.md4 kB
- pt_gsd-ud-train.conllu12 MB
- pt_gsd-ud-train.txt1 MB
- pt_gsd-ud-dev.conllu1 MB
- pt_gsd-ud-test.txt153 kB
- stats.xml10 kB
- LICENSE.txt202 B
- pt_gsd-ud-dev.txt156 kB
- UD_Thai-PUD
- stats.xml4 kB
- README.md5 kB
- th_pud-ud-test.conllu2 MB
- LICENSE.txt19 kB
- th_pud-ud-test.txt281 kB
- UD_Czech-FicTree
- README.md4 kB
- cs_fictree-ud-test.conllu1 MB
- cs_fictree-ud-test.txt86 kB
- cs_fictree-ud-train.conllu13 MB
- cs_fictree-ud-dev.txt86 kB
- cs_fictree-ud-dev.conllu1 MB
- stats.xml14 kB
- LICENSE.txt219 B
- cs_fictree-ud-train.txt696 kB
- UD_Romanian-TueCL
- stats.xml11 kB
- ro_tuecl-ud-test.txt22 kB
- README.md2 kB
- LICENSE.txt202 B
- ro_tuecl-ud-test.conllu358 kB
- UD_Old_East_Slavic-Ruthenian
- README.md1 kB
- orv_ruthenian-ud-test.txt91 kB
- orv_ruthenian-ud-test.conllu916 kB
- orv_ruthenian-ud-train.txt833 kB
- orv_ruthenian-ud-train.conllu8 MB
- stats.xml18 kB
- orv_ruthenian-ud-dev.txt95 kB
- LICENSE.txt202 B
- orv_ruthenian-ud-dev.conllu1 MB
- UD_Czech-Poetry
- stats.xml13 kB
- cs_poetry-ud-test.txt32 kB
- README.md2 kB
- LICENSE.txt202 B
- cs_poetry-ud-test.conllu572 kB
- UD_Polish-PDB
- pl_pdb-ud-train.txt1 MB
- README.md5 kB
- pl_pdb-ud-dev.conllu3 MB
- pl_pdb-ud-test.txt203 kB
- pl_pdb-ud-train.conllu27 MB
- pl_pdb-ud-dev.txt210 kB
- stats.xml16 kB
- LICENSE.txt384 B
- pl_pdb-ud-test.conllu3 MB
- UD_Ancient_Hebrew-PTNK
- README.md3 kB
- hbo_ptnk-ud-dev.txt98 kB
- hbo_ptnk-ud-dev.conllu1 MB
- hbo_ptnk-ud-test.conllu1 MB
- hbo_ptnk-ud-train.txt172 kB
- stats.xml10 kB
- hbo_ptnk-ud-train.conllu1 MB
- LICENSE.txt202 B
- hbo_ptnk-ud-test.txt95 kB
- UD_North_Sami-Giella
- stats.xml10 kB
- README.md2 kB
- sme_giella-ud-train.txt107 kB
- sme_giella-ud-train.conllu1 MB
- LICENSE.txt202 B
- sme_giella-ud-test.conllu668 kB
- sme_giella-ud-test.txt70 kB
- UD_Korean-Kaist
- ko_kaist-ud-test.conllu3 MB
- README.md1 kB
- ko_kaist-ud-train.txt2 MB
- ko_kaist-ud-dev.txt233 kB
- ko_kaist-ud-test.txt255 kB
- ko_kaist-ud-dev.conllu2 MB
- stats.xml4 kB
- LICENSE.txt202 B
- ko_kaist-ud-train.conllu32 MB
- UD_Irish-TwittIrish
- ga_twittirish-ud-train.txt89 kB
- README.md3 kB
- ga_twittirish-ud-dev.conllu826 kB
- ga_twittirish-ud-test.txt85 kB
- ga_twittirish-ud-test.conllu770 kB
- stats.xml4 kB
- LICENSE.txt202 B
- ga_twittirish-ud-dev.txt95 kB
- ga_twittirish-ud-train.conllu782 kB
- UD_Ukrainian-IU
- README.md9 kB
- uk_iu-ud-train.txt900 kB
- uk_iu-ud-test.txt177 kB
- uk_iu-ud-test.conllu2 MB
- uk_iu-ud-dev.conllu1 MB
- uk_iu-ud-dev.txt128 kB
- stats.xml17 kB
- LICENSE.txt172 B
- uk_iu-ud-train.conllu12 MB
- UD_Latgalian-Cairo
- stats.xml7 kB
- ltg_cairo-ud-test.txt955 B
- README.md1 kB
- ltg_cairo-ud-test.conllu20 kB
- LICENSE.txt202 B
- UD_Norwegian-Nynorsk
- no_nynorsk-ud-dev.conllu1 MB
- README.md5 kB
- no_nynorsk-ud-test.txt135 kB
- no_nynorsk-ud-dev.txt166 kB
- stats.xml8 kB
- no_nynorsk-ud-test.conllu1 MB
- LICENSE.txt68 B
- no_nynorsk-ud-train.txt1 MB
- no_nynorsk-ud-train.conllu14 MB
- UD_Old_East_Slavic-Birchbark
- README.md4 kB
- orv_birchbark-ud-dev.txt90 kB
- orv_birchbark-ud-dev.conllu1 MB
- orv_birchbark-ud-train.txt66 kB
- orv_birchbark-ud-test.txt90 kB
- orv_birchbark-ud-test.conllu1 MB
- stats.xml14 kB
- LICENSE.txt202 B
- orv_birchbark-ud-train.conllu981 kB
- UD_Galician-PUD
- stats.xml9 kB
- gl_pud-ud-test.conllu1 MB
- gl_pud-ud-test.txt117 kB
- README.md4 kB
- LICENSE.txt202 B
- UD_Georgian-GLC
- ka_glc-ud-dev.txt179 kB
- README.md3 kB
- ka_glc-ud-test.txt185 kB
- ka_glc-ud-train.conllu5 MB
- ka_glc-ud-dev.conllu1 MB
- stats.xml27 kB
- LICENSE.txt202 B
- ka_glc-ud-test.conllu1 MB
- ka_glc-ud-train.txt750 kB
- UD_Romanian-SiMoNERo
- ro_simonero-ud-test.conllu1 MB
- README.md2 kB
- ro_simonero-ud-dev.conllu1 MB
- ro_simonero-ud-test.txt93 kB
- ro_simonero-ud-train.txt719 kB
- ro_simonero-ud-dev.txt91 kB
- ro_simonero-ud-train.conllu9 MB
- stats.xml11 kB
- LICENSE.txt202 B
- UD_Spanish-PUD
- stats.xml11 kB
- es_pud-ud-test.conllu1 MB
- README.md6 kB
- LICENSE.txt19 kB
- es_pud-ud-test.txt123 kB
- UD_Cebuano-GJA
- ceb_gja-ud-test.conllu104 kB
- stats.xml7 kB
- README.md1 kB
- LICENSE.txt202 B
- ceb_gja-ud-test.txt6 kB
- UD_Malayalam-UFAL
- stats.xml19 kB
- README.md866 B
- LICENSE.txt202 B
- ml_ufal-ud-test.txt47 kB
- ml_ufal-ud-test.conllu415 kB
- UD_Serbian-SET
- sr_set-ud-test.txt67 kB
- README.md1 kB
- sr_set-ud-train.conllu5 MB
- sr_set-ud-dev.txt68 kB
- stats.xml11 kB
- sr_set-ud-test.conllu847 kB
- sr_set-ud-train.txt432 kB
- LICENSE.txt230 B
- sr_set-ud-dev.conllu888 kB
- UD_Tatar-NMCTT
- stats.xml12 kB
- README.md1 kB
- tt_nmctt-ud-test.txt26 kB
- LICENSE.txt202 B
- tt_nmctt-ud-test.conllu220 kB
- UD_Hittite-HitTB
- stats.xml9 kB
- README.md1 kB
- hit_hittb-ud-test.conllu115 kB
- LICENSE.txt202 B
- hit_hittb-ud-test.txt10 kB
- UD_Chinese-HK
- stats.xml4 kB
- README.md4 kB
- LICENSE.txt202 B
- zh_hk-ud-test.conllu897 kB
- zh_hk-ud-test.txt41 kB
- UD_Maghrebi_Arabic_French-Arabizi
- qaf_arabizi-ud-dev.conllu222 kB
- README.md3 kB
- qaf_arabizi-ud-train.txt81 kB
- qaf_arabizi-ud-test.conllu220 kB
- qaf_arabizi-ud-dev.txt11 kB
- qaf_arabizi-ud-train.conllu1 MB
- stats.xml6 kB
- LICENSE.txt202 B
- qaf_arabizi-ud-test.txt11 kB
- UD_Japanese-GSD
- ja_gsd-ud-dev.txt58 kB
- README.md8 kB
- ja_gsd-ud-dev.conllu2 MB
- ja_gsd-ud-train.conllu38 MB
- stats.xml4 kB
- LICENSE.txt202 B
- ja_gsd-ud-test.conllu2 MB
- ja_gsd-ud-train.txt804 kB
- ja_gsd-ud-test.txt62 kB
- UD_English-ParTUT
- README.md4 kB
- en_partut-ud-train.txt229 kB
- en_partut-ud-test.conllu183 kB
- en_partut-ud-test.txt18 kB
- en_partut-ud-train.conllu2 MB
- stats.xml8 kB
- LICENSE.txt18 kB
- en_partut-ud-dev.conllu148 kB
- en_partut-ud-dev.txt13 kB
- UD_Czech-CAC
- cs_cac-ud-test.txt71 kB
- cs_cac-ud-test.conllu1 MB
- README.md7 kB
- cs_cac-ud-train.conllu49 MB
- cs_cac-ud-dev.txt72 kB
- cs_cac-ud-train.txt2 MB
- stats.xml18 kB
- LICENSE.txt265 B
- cs_cac-ud-dev.conllu1 MB
- UD_Arabic-PADT
- README.md6 kB
- ar_padt-ud-dev.conllu5 MB
- ar_padt-ud-train.conllu38 MB
- ar_padt-ud-train.txt1 MB
- ar_padt-ud-test.txt234 kB
- ar_padt-ud-test.conllu4 MB
- stats.xml11 kB
- ar_padt-ud-dev.txt241 kB
- LICENSE.txt19 kB
- UD_Upper_Sorbian-UFAL
- stats.xml11 kB
- hsb_ufal-ud-test.conllu730 kB
- README.md1 kB
- hsb_ufal-ud-train.conllu31 kB
- hsb_ufal-ud-test.txt64 kB
- LICENSE.txt202 B
- hsb_ufal-ud-train.txt2 kB
- UD_Swedish_Sign_Language-SSLC
- stats.xml2 kB
- README.md1 kB
- swl_sslc-ud-test.txt15 kB
- LICENSE.txt19 kB
- swl_sslc-ud-test.conllu79 kB
- UD_Czech-PDT
- cs_pdt-ud-train.conllu139 MB
- README.md13 kB
- cs_pdt-ud-test.conllu20 MB
- cs_pdt-ud-test.txt1 MB
- cs_pdt-ud-dev.txt989 kB
- cs_pdt-ud-dev.conllu19 MB
- stats.xml18 kB
- LICENSE.txt311 B
- cs_pdt-ud-train.txt7 MB
- UD_Bororo-BDT
- stats.xml13 kB
- README.md2 kB
- LICENSE.txt202 B
- bor_bdt-ud-test.txt38 kB
- bor_bdt-ud-test.conllu497 kB
- UD_Chinese-GSD
- README.md2 kB
- zh_gsd-ud-test.conllu1 MB
- zh_gsd-ud-train.conllu8 MB
- zh_gsd-ud-train.txt433 kB
- zh_gsd-ud-dev.txt55 kB
- zh_gsd-ud-dev.conllu1 MB
- stats.xml5 kB
- zh_gsd-ud-test.txt53 kB
- LICENSE.txt202 B
- UD_Catalan-AnCora
- README.md4 kB
- ca_ancora-ud-test.txt297 kB
- ca_ancora-ud-dev.conllu5 MB
- ca_ancora-ud-test.conllu5 MB
- ca_ancora-ud-train.conllu37 MB
- ca_ancora-ud-train.txt2 MB
- stats.xml11 kB
- ca_ancora-ud-dev.txt290 kB
- LICENSE.txt189 B
- UD_Xavante-XDT
- stats.xml7 kB
- xav_xdt-ud-test.txt8 kB
- README.md1 kB
- xav_xdt-ud-test.conllu129 kB
- LICENSE.txt202 B
- UD_Abkhaz-AbNC
- stats.xml36 kB
- README.md2 kB
- ab_abnc-ud-test.conllu943 kB
- ab_abnc-ud-test.txt66 kB
- LICENSE.txt202 B
- UD_Russian-PUD
- stats.xml12 kB
- README.md5 kB
- LICENSE.txt19 kB
- ru_pud-ud-test.txt209 kB
- ru_pud-ud-test.conllu1 MB
- UD_Arabic-PUD
- stats.xml9 kB
- README.md5 kB
- ar_pud-ud-test.txt168 kB
- LICENSE.txt19 kB
- ar_pud-ud-test.conllu2 MB
- UD_Tupinamba-TuDeT
- stats.xml15 kB
- README.md2 kB
- LICENSE.txt202 B
- tpn_tudet-ud-test.txt29 kB
- tpn_tudet-ud-test.conllu317 kB
- UD_Spanish-AnCora
- README.md5 kB
- es_ancora-ud-train.txt2 MB
- es_ancora-ud-test.conllu4 MB
- es_ancora-ud-dev.conllu4 MB
- es_ancora-ud-test.txt277 kB
- stats.xml12 kB
- es_ancora-ud-train.conllu40 MB
- es_ancora-ud-dev.txt276 kB
- LICENSE.txt189 B
- UD_Dutch-LassySmall
- nl_lassysmall-ud-train.conllu19 MB
- nl_lassysmall-ud-test.conllu2 MB
- nl_lassysmall-ud-test.txt162 kB
- nl_lassysmall-ud-train.txt1 MB
- nl_lassysmall-ud-dev.txt155 kB
- stats.xml8 kB
- LICENSE.txt392 B
- README.txt2 kB
- nl_lassysmall-ud-dev.conllu2 MB
- UD_Mbya_Guarani-Dooley
- stats.xml7 kB
- gun_dooley-ud-test.conllu560 kB
- README.md3 kB
- LICENSE.txt202 B
- gun_dooley-ud-test.txt23 kB
- UD_French-GSD
- fr_gsd-ud-train.conllu21 MB
- README.md7 kB
- fr_gsd-ud-dev.conllu2 MB
- fr_gsd-ud-dev.txt184 kB
- stats.xml11 kB
- fr_gsd-ud-test.conllu640 kB
- LICENSE.txt202 B
- fr_gsd-ud-test.txt49 kB
- fr_gsd-ud-train.txt1 MB
- UD_Assyrian-AS
- stats.xml7 kB
- aii_as-ud-test.conllu31 kB
- README.md1 kB
- aii_as-ud-test.txt4 kB
- LICENSE.txt202 B
- UD_Portuguese-PUD
- stats.xml7 kB
- README.md5 kB
- LICENSE.txt19 kB
- pt_pud-ud-test.txt119 kB
- pt_pud-ud-test.conllu1 MB
- UD_Arabic-NYUAD
- README.md2 kB
- ar_nyuad-ud-test.conllu5 MB
- stats.xml6 kB
- ar_nyuad-ud-dev.txt123 kB
- LICENSE.txt202 B
- ar_nyuad-ud-test.txt123 kB
- ar_nyuad-ud-train.txt982 kB
- ar_nyuad-ud-train.conllu44 MB
- ar_nyuad-ud-dev.conllu5 MB
- merge.jar91 kB
- UD_Bavarian-MaiBaam
- stats.xml3 kB
- bar_maibaam-ud-test.conllu962 kB
- README.md4 kB
- LICENSE.txt202 B
- bar_maibaam-ud-test.txt69 kB
- UD_French-Rhapsodie
- README.md1 kB
- fr_rhapsodie-ud-train.txt80 kB
- fr_rhapsodie-ud-train.conllu1 MB
- fr_rhapsodie-ud-test.conllu852 kB
- fr_rhapsodie-ud-dev.conllu913 kB
- fr_rhapsodie-ud-dev.txt53 kB
- fr_rhapsodie-ud-test.txt53 kB
- stats.xml10 kB
- LICENSE.txt202 B
- UD_Latin-LLCT
- la_llct-ud-dev.conllu2 MB
- README.md10 kB
- la_llct-ud-test.conllu2 MB
- la_llct-ud-train.conllu17 MB
- stats.xml13 kB
- la_llct-ud-dev.txt136 kB
- LICENSE.txt202 B
- la_llct-ud-train.txt1 MB
- la_llct-ud-test.txt136 kB
- UD_Latin-ITTB
- la_ittb-ud-train.txt2 MB
- README.md13 kB
- la_ittb-ud-dev.txt168 kB
- la_ittb-ud-test.conllu3 MB
- la_ittb-ud-dev.conllu3 MB
- stats.xml18 kB
- LICENSE.txt19 kB
- la_ittb-ud-test.txt169 kB
- la_ittb-ud-train.conllu39 MB
- UD_Cantonese-HK
- stats.xml4 kB
- yue_hk-ud-test.txt53 kB
- README.md4 kB
- LICENSE.txt202 B
- yue_hk-ud-test.conllu717 kB
- UD_Latin-CIRCSE
- stats.xml18 kB
- la_circse-ud-test.conllu2 MB
- README.md6 kB
- la_circse-ud-test.txt120 kB
- LICENSE.txt202 B
- UD_Albanian-STAF
- sq_staf-ud-test.conllu31 kB
- README.md1 kB
- sq_staf-ud-dev.txt1 kB
- sq_staf-ud-train.conllu248 kB
- sq_staf-ud-dev.conllu27 kB
- sq_staf-ud-train.txt14 kB
- stats.xml9 kB
- LICENSE.txt202 B
- sq_staf-ud-test.txt1 kB
- UD_Spanish-COSER
- stats.xml10 kB
- es_coser-ud-test.conllu589 kB
- README.md2 kB
- LICENSE.txt202 B
- es_coser-ud-test.txt33 kB
- UD_French-ParisStories
- fr_parisstories-ud-test.txt40 kB
- README.md5 kB
- fr_parisstories-ud-dev.conllu882 kB
- fr_parisstories-ud-test.conllu866 kB
- fr_parisstories-ud-train.txt90 kB
- fr_parisstories-ud-dev.txt40 kB
- stats.xml9 kB
- LICENSE.txt202 B
- fr_parisstories-ud-train.conllu1 MB
- UD_Italian-ISDT
- README.md10 kB
- it_isdt-ud-train.conllu18 MB
- it_isdt-ud-train.txt1 MB
- it_isdt-ud-dev.txt59 kB
- it_isdt-ud-test.txt52 kB
- it_isdt-ud-test.conllu717 kB
- stats.xml10 kB
- LICENSE.txt22 kB
- it_isdt-ud-dev.conllu814 kB
- UD_Gujarati-GujTB
- stats.xml7 kB
- gu_gujtb-ud-test.txt21 kB
- README.md2 kB
- gu_gujtb-ud-test.conllu121 kB
- LICENSE.txt202 B
- UD_Icelandic-IcePaHC
- is_icepahc-ud-dev.conllu11 MB
- is_icepahc-ud-test.txt738 kB
- README.md8 kB
- is_icepahc-ud-dev.txt735 kB
- is_icepahc-ud-train.conllu58 MB
- stats.xml11 kB
- LICENSE.txt202 B
- is_icepahc-ud-train.txt3 MB
- is_icepahc-ud-test.conllu11 MB
- UD_English-PUD
- ... too many files ...0 B
- Name
- ud-documentation-v2.15.tgz
- Size
- 110.23 MB
- Format
- application/x-gzip
- Description
- Documentation
- MD5
- 58aae6ccf3f4160ec08a223dd450850b
- ud-documentation-v2.15
- markdown-source
- ext-feat-index.md160 kB
- _tl
- _ka
- feat-index.md134 B
- dep-index.md140 B
- pos
- ADV.md1 kB
- VERB.md1 kB
- NUM.md1 kB
- SCONJ.md672 B
- NOUN.md789 B
- INTJ.md412 B
- ADP.md1 kB
- AUX_.md1 kB
- X.md645 B
- PART.md1015 B
- _wbp
- index.md3 kB
- feat
- Clitic.md1 kB
- _zh
- index.md8 kB
- syntax.md2 kB
- tokenization.md2 kB
- morphology.md2 kB
- feat
- PronType.md1 kB
- PartType.md570 B
- dep-index.md372 B
- pos
- PRON.md3 kB
- ADV.md3 kB
- VERB.md922 B
- NUM.md922 B
- CCONJ.md744 B
- ADJ.md1 kB
- SCONJ.md1 kB
- SYM.md847 B
- DET.md2 kB
- NOUN.md1 kB
- PROPN.md976 B
- INTJ.md1 kB
- PUNCT.md496 B
- ADP.md2 kB
- AUX_.md1 kB
- X.md787 B
- PART.md2 kB
- dep
- obj.md3 kB
- advcl.md3 kB
- nsubj.md718 B
- vocative.md1 kB
- discourse-sp.md2 kB
- mark-prt.md3 kB
- xcomp.md7 kB
- mark.md2 kB
- flat.md2 kB
- obl-patient.md1002 B
- compound.md2 kB
- csubj.md1004 B
- reparandum.md1 kB
- dislocated-vo.md1 kB
- amod.md1 kB
- nmod.md2 kB
- nummod.md1 kB
- iobj.md1 kB
- nsubj-pass.md600 B
- acl.md3 kB
- case.md3 kB
- mark-rel.md2 kB
- punct.md4 kB
- advmod.md4 kB
- case-loc.md1 kB
- obj-periph.md900 B
- aux-pass.md1 kB
- clf.md4 kB
- ccomp.md7 kB
- parataxis.md4 kB
- goeswith.md1 kB
- appos.md2 kB
- compound-dir.md5 kB
- advmod-df.md2 kB
- cc.md1 kB
- csubj-pass.md869 B
- obl-tmod.md2 kB
- det.md1 kB
- discourse.md1 kB
- list.md2 kB
- obl-agent.md1 kB
- cop.md1 kB
- compound-ext.md4 kB
- compound-vv.md4 kB
- orphan.md4 kB
- aux_.md3 kB
- obl.md3 kB
- root.md2 kB
- dislocated.md4 kB
- compound-vo.md3 kB
- mark-adv.md637 B
- conj.md6 kB
- pos-index.md143 B
- _pay
- _urj
- syntax.md2 kB
- feat-index.md146 B
- tokenization.md1 kB
- morphology.md4 kB
- feat
- VerbForm.md2 kB
- Person.md547 B
- Number.md599 B
- Aspect.md713 B
- Polarity.md523 B
- Poss.md460 B
- Definite.md436 B
- Reflex.md352 B
- PronType.md553 B
- NumType.md275 B
- Case.md1 kB
- Degree.md268 B
- Tense.md626 B
- Mood.md514 B
- Voice.md589 B
- introduction.md1 kB
- dep-index.md152 B
- dep
- amod.md1 kB
- acl-relcl.md1 kB
- cop.md411 B
- vocative.md922 B
- acl.md433 B
- appos.md1 kB
- punct.md2 kB
- case.md405 B
- compound.md579 B
- ccomp.md316 B
- advcl.md447 B
- aux_.md708 B
- pos
- PRON.md661 B
- ADV.md3 kB
- VERB.md1 kB
- CCONJ.md918 B
- NUM.md599 B
- ADJ.md693 B
- SCONJ.md423 B
- SYM.md533 B
- DET.md570 B
- NOUN.md490 B
- PROPN.md423 B
- INTJ.md301 B
- PUNCT.md263 B
- ADP.md780 B
- AUX_.md771 B
- X.md643 B
- PART.md537 B
- pos-index.md144 B
- _as
- template-index.md1 kB
- how_to_start.md9 kB
- _jv
- index.md7 kB
- dep
- nmod-tmod.md368 B
- nsubj-pass.md451 B
- case-adv.md912 B
- nmod-lmod.md629 B
- nmod-poss.md408 B
- obl-tmod.md437 B
- _vep
- _am
- index.md5 kB
- feat
- Voice.md3 kB
- Case.md3 kB
- _nhi
- _gn
- index.md11 kB
- feat
- ConjType.md644 B
- Aspect.md1 kB
- Number.md749 B
- Priv.md622 B
- AdvType.md1 kB
- Voice.md1 kB
- Corf.md451 B
- Nomzr.md2 kB
- Tense.md1 kB
- Int.md760 B
- Emph.md442 B
- Recip.md427 B
- Mood.md1 kB
- Person.md2 kB
- Poss.md1 kB
- Hum.md699 B
- Red.md690 B
- Foc.md661 B
- PronType.md1 kB
- Speech.md841 B
- Incorp.md651 B
- Rel.md2 kB
- Intens.md711 B
- Augm.md731 B
- Case.md1 kB
- NonFoc.md880 B
- Delib.md674 B
- Dev.md925 B
- dep
- obl-subj.md674 B
- advcl.md842 B
- obl-obj.md681 B
- template-index.md1 kB
- pos
- ADP.md798 B
- _mo
- template-index.md1 kB
- _v2_prelim
- coordination.md717 B
- features.md292 B
- index.md5 kB
- enhanced.md2 kB
- ellipsis.md6 kB
- tokenization.md1 kB
- conllu.md372 B
- core_dependents.md23 kB
- form_vs_function.md19 kB
- function_dependents.md3 kB
- _gd
- index.md14 kB
- feat
- Mood.md1 kB
- PronType.md1 kB
- Form.md1 kB
- Polarity.md805 B
- PartType.md2 kB
- dep
- obl-smod.md695 B
- nsubj.md2 kB
- flat-name.md1 kB
- flat.md2 kB
- compound.md2 kB
- mark-prt.md1 kB
- csubj-cop.md576 B
- case-voc.md464 B
- csubj-cleft.md1 kB
- fixed.md3 kB
- nmod.md1 kB
- obl.md2 kB
- flat-foreign.md829 B
- nsubj-pass.md2 kB
- aux-pass.md1 kB
- csubj-outer.md1 kB
- amod.md1 kB
- nsubj-outer.md1 kB
- xcomp-pred.md1 kB
- contributing.md13 kB
- introduction.md27 kB
- _da
- index.md4 kB
- pos-index.md132 B
- pos
- PRON.md1 kB
- VERB.md690 B
- ADV.md626 B
- NUM.md863 B
- CCONJ.md442 B
- ADJ.md801 B
- SCONJ.md467 B
- SYM.md331 B
- DET.md885 B
- NOUN.md353 B
- PROPN.md518 B
- INTJ.md439 B
- AUX_.md1 kB
- ADP.md335 B
- PUNCT.md387 B
- X.md565 B
- PART.md673 B
- tools.md28 kB
- _sk
- index.md14 kB
- _soj
- index.md2 kB
- _aln
- index.md3 kB
- dep
- aux-part.md1 kB
- template-index.md1 kB
- _ckt
- index.md2 kB
- dep
- acl-relat.md1 kB
- acl-attr.md682 B
- nmod-attr.md764 B
- aux-neg.md1 kB
- parataxis-rep.md669 B
- nmod-relat.md920 B
- _plugins
- file_exists.rb578 B
- _sa
- index.md4 kB
- feat
- Compound.md1 kB
- dep
- acl-pred.md546 B
- mark-sim.md486 B
- advcl-ccomp.md932 B
- acl-crel.md991 B
- obl-goal.md511 B
- acl-dpct.md496 B
- compound-name.md337 B
- advcl-cond.md972 B
- advcl-concess.md577 B
- obl-grad.md543 B
- obl-soc.md535 B
- acl-cont.md788 B
- compound-coord.md397 B
- advcl-consec.md857 B
- xcomp-result.md561 B
- nmod-appos.md819 B
- acl-attr.md959 B
- nsubj-cop.md1 kB
- advcl-caus.md774 B
- obl-benef.md843 B
- nmod-pred.md411 B
- obl-manner.md606 B
- obl-instr.md361 B
- case-sim.md490 B
- advcl-advers.md314 B
- advcl-lcl.md708 B
- advcl-tcl.md846 B
- ccomp-rel.md836 B
- acl-ptcp.md485 B
- obl-path.md585 B
- obl-source.md971 B
- advcl-manner.md913 B
- advcl-dpct.md1 kB
- advcl-fin.md640 B
- _cu
- _xpg
- index.md3 kB
- _it
- index.md11 kB
- feat-index.md134 B
- tokenization.md1 kB
- feat
- VerbForm.md1021 B
- Person.md1 kB
- Number.md629 B
- Poss.md553 B
- Gender.md572 B
- Definite.md500 B
- Foreign.md1 kB
- Reflex.md433 B
- PronType.md5 kB
- NumType.md1 kB
- Degree.md1 kB
- Mood.md1 kB
- Tense.md694 B
- Clitic.md570 B
- introduction.md7 kB
- dep-index.md140 B
- pos
- PRON.md1 kB
- VERB.md1019 B
- ADV.md1 kB
- NUM.md1 kB
- CCONJ.md674 B
- ADJ.md1 kB
- SCONJ.md1 kB
- SYM.md1 kB
- DET.md1 kB
- NOUN.md536 B
- PROPN.md565 B
- INTJ.md964 B
- PUNCT.md495 B
- ADP.md1 kB
- AUX_.md1 kB
- X.md807 B
- PART.md493 B
- dep
- advcl.md1 kB
- obj.md969 B
- nsubj.md1 kB
- vocative.md1 kB
- det-predet.md570 B
- csubj-relcl.md552 B
- advcl-pred.md592 B
- discourse-emo.md354 B
- flat-redup.md329 B
- ccomp-reported.md300 B
- mark.md976 B
- xcomp.md2 kB
- flat.md796 B
- parataxis-appos.md346 B
- compound.md991 B
- flat-foreign.md714 B
- csubj.md1 kB
- amod.md1 kB
- flat-name.md1 kB
- nmod.md925 B
- nummod.md1 kB
- parataxis-hashtag.md634 B
- iobj.md643 B
- acl-relcl.md1 kB
- nmod-lmod.md383 B
- nsubj-pass.md640 B
- expl-impers.md1 kB
- case.md1 kB
- acl.md2 kB
- parataxis-insert.md407 B
- punct.md1 kB
- advmod.md1 kB
- aux-pass.md2 kB
- advcl-relcl.md488 B
- advcl-cmp.md276 B
- ccomp.md2 kB
- parataxis.md1 kB
- advmod-tmod.md361 B
- goeswith.md367 B
- appos.md1008 B
- parataxis-nsubj.md402 B
- cc.md1 kB
- csubj-pass.md859 B
- fixed.md1 kB
- det.md629 B
- obl-tmod.md383 B
- ccomp-relcl.md626 B
- discourse.md866 B
- list.md844 B
- advmod-neg.md335 B
- obl-agent.md489 B
- expl-pass.md852 B
- cop.md2 kB
- parataxis-obj.md574 B
- parataxis-discourse.md383 B
- orphan.md821 B
- aux_.md1 kB
- obl.md1 kB
- root.md1003 B
- vocative-mention.md658 B
- nsubj-outer.md1 kB
- expl.md1 kB
- dislocated.md933 B
- det-poss.md653 B
- expl-poss.md3 kB
- dep.md615 B
- conj.md1 kB
- pos-index.md132 B
- _is
- index.md4 kB
- genres.md12 kB
- _bho
- index.md3 kB
- _hil
- template-index.md1 kB
- _qxp
- template-index.md1 kB
- addlanguage.sh1 kB
- _ro
- index.md9 kB
- template.docx33 kB
- feat
- Strength.md1 kB
- Variant.md1 kB
- PartType.md648 B
- Position.md1 kB
- Compound.md697 B
- upos-xpos-feats.txt33 kB
- dep-index.md140 B
- dep
- ccomp.md819 B
- iobj.md1 kB
- nsubj.md304 B
- det.md390 B
- cc.md879 B
- compound.md316 B
- ccomp-pmod.md375 B
- obj.md980 B
- obl-tmod464 B
- case.md1 kB
- vocative-mention.md725 B
- acl.md941 B
- nummod.md986 B
- orphan.md288 B
- csubj.md483 B
- nmod.md472 B
- advcl.md917 B
- advmod.md558 B
- cop.md1 kB
- advmod-tmod.md597 B
- obl-pmod.md352 B
- aux_.md565 B
- advcl-tcl.md613 B
- conj.md709 B
- nsubj-pass.md394 B
- csubj-pass.md410 B
- expl.md766 B
- aux-pass.md353 B
- amod.md379 B
- expl-poss.md823 B
- root.md738 B
- discourse-emo.md435 B
- mark.md376 B
- appos.md1 kB
- _got
- _mjl
- template-index.md1 kB
- _yrk
- template-index.md1 kB
- _eme
- index.md10 kB
- feat
- Nmzr.md2 kB
- Conces.md737 B
- Aspect.md2 kB
- Contrast.md833 B
- Voice.md2 kB
- Corf.md1 kB
- Subord.md1 kB
- Int.md986 B
- Excl.md751 B
- Emph.md1018 B
- VerbForm.md778 B
- Mood.md2 kB
- Also.md765 B
- Red.md663 B
- Imprs.md1 kB
- Foc.md717 B
- Rel.md1 kB
- Top.md702 B
- Accomp.md926 B
- Intens.md992 B
- Case.md3 kB
- Pred.md741 B
- _ca
- index.md27 kB
- pos-index.md132 B
- pos
- NOUN.md577 B
- INTJ.md1 kB
- ADV.md1 kB
- PUNCT.md491 B
- ADJ.md1 kB
- _orv
- gen_index
- clean_up_label_tables.pl1 kB
- list_obsolete_introductions.pl1 kB
- stests.yaml12 kB
- genre_symbols.json409 B
- syn_validation_run.py9 kB
- feature_index.html12 kB
- _corpus_data
- Norwegian-Nynorsk.json222 B
- Hindi.json222 B
- Norwegian-Bokmaal.json222 B
- Spanish-PUD.json216 B
- French.json222 B
- Swedish_Sign_Language.json207 B
- Hungarian.json219 B
- Latin.json218 B
- Romanian.json222 B
- Indonesian-PUD.json213 B
- Japanese.json220 B
- Turkish-PUD.json214 B
- Uyghur.json215 B
- Indonesian.json215 B
- Croatian.json221 B
- Arabic-PUD.json218 B
- Thai-PUD.json214 B
- Czech.json226 B
- Upper_Sorbian.json217 B
- Old_Church_Slavonic.json218 B
- Belarusian.json214 B
- Erzya.json199 B
- Swedish-LinES.json213 B
- Korean-PUD.json214 B
- Slovak.json222 B
- Russian.json218 B
- English-LinES.json213 B
- Japanese-KTC.json220 B
- Chinese-HK.json199 B
- Gothic.json218 B
- Catalan.json222 B
- Italian-PoSTWITA.json199 B
- Norwegian-NynorskLIA.json218 B
- Kazakh.json218 B
- Danish.json221 B
- Finnish-PUD.json220 B
- Latin-PROIEL.json222 B
- Turkish.json218 B
- Sanskrit.json214 B
- Marathi.json199 B
- English-ParTUT.json219 B
- Coptic.json216 B
- Urdu.json221 B
- Old_French.json199 B
- North_Sami.json218 B
- Dutch.json222 B
- Dargwa.json199 B
- French-Sequoia.json219 B
- English-PUD.json219 B
- Hebrew.json222 B
- Chinese.json222 B
- Polish.json218 B
- Ancient_Greek.json222 B
- Finnish-FTB.json222 B
- Chinese-CFL.json214 B
- German.json222 B
- Romansh.json199 B
- Galician-TreeGal.json218 B
- Maltese.json211 B
- Russian-SynTagRus.json231 B
- Arabic-NYUAD.json222 B
- Japanese-PUD.json218 B
- French-Spoken.json199 B
- Dutch-LassySmall.json221 B
- French-PUD.json217 B
- Latin-ITTB.json222 B
- Finnish.json227 B
- Faroese.json199 B
- Buryat.json217 B
- Spanish.json222 B
- Chinese-PUD.json215 B
- Telugu.json214 B
- Lithuanian-Alksnis.json199 B
- Czech-PUD.json219 B
- Bambara.json199 B
- Ukrainian.json218 B
- Russian-PUD.json214 B
- Irish.json219 B
- Korean.json216 B
- Bengali-DDS.json199 B
- English.json224 B
- Serbian.json218 B
- Swedish.json218 B
- Swedish-PUD.json218 B
- French-FTB.json222 B
- Greek.json218 B
- Bulgarian.json222 B
- Ancient_Greek-PROIEL.json222 B
- Hindi-PUD.json215 B
- Sorani.json199 B
- Basque.json221 B
- Bangla.json199 B
- Italian-ParTUT.json219 B
- Kurmanji.json217 B
- Arabic.json221 B
- Slovenian-SST.json218 B
- Tamil.json214 B
- Czech-CLTT.json219 B
- Somali.json199 B
- Naija.json199 B
- Slovenian.json221 B
- Estonian.json218 B
- Latvian.json218 B
- Korean-Sejong.json217 B
- French-ParTUT.json218 B
- Lithuanian.json214 B
- Afrikaans.json218 B
- Portuguese.json221 B
- Vietnamese.json217 B
- Amharic.json199 B
- Galician.json220 B
- German-PUD.json217 B
- Italian.json223 B
- Portuguese-PUD.json217 B
- Cantonese.json199 B
- Armenian.json199 B
- Czech-FicTree.json223 B
- English-ESL.json217 B
- Romansh-Sursilv.json199 B
- Spanish-AnCora.json222 B
- Czech-CAC.json223 B
- Portuguese-BR.json220 B
- Persian.json222 B
- Italian-PUD.json218 B
- generate_validation.sh475 B
- generate_feature_index.pl4 kB
- _la
- .gitignore61 B
- index.md17 kB
- feat
- VerbForm.md27 kB
- Aspect.md16 kB
- AdvType.md3 kB
- NumValue.md2 kB
- Compound.md1 kB
- Variant.md2 kB
- PronType.md2 kB
- Form.md2 kB
- InflClass.md18 kB
- NumForm.md2 kB
- Degree.md13 kB
- InflClass-nominal.md5 kB
- NameType.md7 kB
- Proper.md2 kB
- dep
- nsubj-cleft.md3 kB
- obl-lmod.md5 kB
- orphan-missing.md1 kB
- iobj.md18 kB
- flat-gov.md1 kB
- conj-expl.md4 kB
- cop-outer.md1 kB
- advmod-lmod.md1 kB
- advcl-relcl.md5 kB
- advcl-cmp.md8 kB
- flat-redup.md4 kB
- dislocated-ccomp.md2 kB
- obl-tmod.md2 kB
- dislocated-obj.md2 kB
- parataxis-rep.md2 kB
- dislocated-csubj.md2 kB
- csubj-reported.md2 kB
- xcomp.md4 kB
- csubj-cleft.md4 kB
- obl-cmp.md2 kB
- advmod-neg.md1 kB
- advmod-tmod.md1 kB
- parataxis-reporting.md1 kB
- dislocated-obl.md2 kB
- advcl-abs.md8 kB
- ccomp-reported.md1 kB
- csubj-relcl.md5 kB
- advcl-pred.md5 kB
- parataxis-speaker.md833 B
- ccomp-relcl.md4 kB
- xcomp-relcl.md4 kB
- dislocated-advcl.md1 kB
- dislocated-nsubj.md1 kB
- introduction.md4 kB
- template-index.md1 kB
- _oc
- template-index.md1 kB
- _usp
- template-index.md1 kB
- _bzd
- template-index.md1 kB
- _lad
- template-index.md1 kB
- _bar
- index.md9 kB
- _pbv
- template-index.md1 kB
- _bal
- index.md10 kB
- _qee
- template-index.md1 kB
- _pnt
- template-index.md1 kB
- _kab
- template-index.md1 kB
- _data
- features.yaml31 kB
- postags.yaml13 kB
- validation.yaml41 B
- relations.yaml58 kB
- _tr
- index.md3 kB
- feat-index.md145 B
- specific-syntax.md7 kB
- tokenization.md8 kB
- feat
- VerbForm.md2 kB
- Number-psor.md604 B
- Person.md2 kB
- Number.md2 kB
- Aspect.md3 kB
- Polarity.md1 kB
- Definite.md557 B
- PronType.md1 kB
- Reflex.md631 B
- NumType.md1 kB
- Case.md5 kB
- Degree.md893 B
- Person-psor.md783 B
- Evident.md1 kB
- Tense.md4 kB
- Mood.md9 kB
- Voice.md7 kB
- dep
- obj.md1 kB
- advcl.md1 kB
- nsubj.md1 kB
- vocative.md363 B
- discourse-q.md1 kB
- mark.md1 kB
- xcomp.md1 kB
- flat.md1 kB
- compound.md913 B
- flat-foreign.md518 B
- csubj.md629 B
- reparandum.md396 B
- amod.md682 B
- nmod.md784 B
- nummod.md633 B
- iobj.md355 B
- nsubj-pass.md505 B
- case.md1 kB
- acl.md1 kB
- punct.md312 B
- nmod-poss.md548 B
- advmod.md1 kB
- ccomp.md1 kB
- parataxis.md694 B
- dep-der.md1 kB
- goeswith.md424 B
- appos.md921 B
- cc.md1 kB
- csubj-pass.md636 B
- fixed.md935 B
- obl-tmod.md773 B
- det.md610 B
- discourse.md813 B
- list.md798 B
- compound-redup.md1 kB
- nsubj-cop.md580 B
- obl-agent.md831 B
- cop.md1 kB
- csubj-cop.md664 B
- nmod-comp.md680 B
- advmod-emph.md656 B
- orphan.md586 B
- aux_.md1 kB
- obj-cau.md1 kB
- obl.md1 kB
- root.md611 B
- nmod-part.md1 kB
- aux-q.md954 B
- dislocated.md1 kB
- obl-cau.md1 kB
- compound-lvc.md1 kB
- dep.md422 B
- conj.md1 kB
- dep-index.md151 B
- pos
- PRON.md862 B
- ADV.md535 B
- VERB.md1 kB
- CCONJ.md493 B
- NUM.md902 B
- ADJ.md727 B
- SCONJ.md1 kB
- SYM.md327 B
- DET.md1 kB
- NOUN.md1 kB
- PROPN.md789 B
- INTJ.md540 B
- ADP.md1 kB
- PUNCT.md566 B
- AUX_.md873 B
- X.md332 B
- PART.md563 B
- pos-index.md132 B
- notes.md15 kB
- _kk
- index.md5 kB
- pos-index.md132 B
- feat
- NumType.md1 kB
- dep-index.md140 B
- tokenization.md363 B
- dep
- iobj.md843 B
- ccomp.md1 kB
- nsubj.md957 B
- punct.md1 kB
- flat.md1 kB
- det.md881 B
- cc.md898 B
- compound.md1 kB
- obj.md1 kB
- case.md1 kB
- obl-own.md1 kB
- acl.md1 kB
- orphan.md875 B
- parataxis.md843 B
- nummod.md792 B
- xcomp.md875 B
- csubj.md499 B
- advcl.md777 B
- nmod.md1 kB
- advmod.md755 B
- cop.md1 kB
- vocative.md599 B
- aux_.md1 kB
- conj.md1 kB
- discourse.md931 B
- amod.md1 kB
- root.md547 B
- mark.md775 B
- appos.md622 B
- pos
- PRON.md797 B
- ADV.md536 B
- VERB.md509 B
- NUM.md557 B
- ADJ.md532 B
- SYM.md386 B
- DET.md549 B
- NOUN.md466 B
- PROPN.md501 B
- INTJ.md369 B
- AUX_.md859 B
- PUNCT.md349 B
- ADP.md433 B
- _be
- index.md9 kB
- feat
- Variant.md1 kB
- InflClass.md1 kB
- tokenization.md4 kB
- syntax.md508 B
- introduction.md2 kB
- parallel.md5 kB
- _apu
- markdown-source
- ... too many files ...0 B
- Name
- ud-tools-v2.15.tgz
- Size
- 929.36 KB
- Format
- application/x-gzip
- Description
- Tools
- MD5
- b718bbb27d27a8d58a205a03ab7b5718
- ud-tools-v2.15
- survey_misc.pl6 kB
- conllu_quick_fix_id_sequence.pl2 kB
- Node.pm18 kB
- conllu_copy_tokenization.pl11 kB
- generate_treebank_hub.pl1 kB
- restore_conllu_lines.pl1 kB
- remove_sense_suffixes_from_lemmas.pl1 kB
- text_without_spaces.pl2 kB
- package_st_data.sh10 kB
- conllu-w2t.py2 kB
- conllu_remove_enhanced_deps.pl443 B
- klcpos3.pl1 kB
- __pycache__
- file_util.cpython-311.pyc4 kB
- file_util.cpython-37.pyc2 kB
- udlib.pm60 kB
- data
- deprel.shopen311 B
- edeprel.ta2 kB
- tokens_w_space.ud27 B
- tokens_w_space.br443 B
- tokens_w_space.koi86 B
- docdeps.json285 kB
- tokens_w_space.kk859 B
- tokens_w_space.nl612 B
- cpos.ud79 B
- edeprels.json1008 kB
- tokens_w_space.hit72 B
- tokens_w_space.ltg110 B
- tokens_w_space.am82 B
- tokens_w_space.sv131 B
- deprels.json897 kB
- tokens_w_space.myv82 B
- tokens_w_space.mdf82 B
- tokens_w_space.pl366 B
- feats.json1 MB
- edeprel.uk5 kB
- tokens_w_space.akk246 B
- tokens_w_space.ja844 B
- tokens_w_space.vi3 B
- deprel.ud237 B
- data.json491 kB
- tokens_w_space.fro10 B
- tokens_w_space.kpv86 B
- tokens_w_space.shopen9 B
- tokens_w_space.kmr353 B
- feat_val.shopen2 kB
- docfeats.json1 MB
- tokens_w_space.sms151 B
- tokens_w_space.fr10 B
- tokens_w_space.lv178 B
- tokens_w_space.lt1 kB
- tokens_w_space.sjo2 kB
- README.md808 B
- tokens_w_space.apu123 B
- tokens_w_space.fi78 B
- tokens_w_space.sga86 B
- conllu_quick_fix.pl20 kB
- survey_paradigms.pl20 kB
- Graph.pm12 kB
- file_util.pyc2 kB
- mergept.pl2 kB
- validate.py187 kB
- check-space-after-paragraph.pl2 kB
- conllu_to_text.pl9 kB
- README.md12 kB
- csort.pm7 kB
- check_files.pl3 kB
- enhanced_classify_relations.pl26 kB
- conllu-formconvert.py3 kB
- conllu_align_tokens.pl6 kB
- survey_deprel_subtypes.pl8 kB
- survey_features.pl11 kB
- scan_local_repos.pl3 kB
- example-data
- long-token-to-text-wrong.txt333 B
- long-token-to-text-correct.txt332 B
- long-token-to-text.conllu2 kB
- tanl.conll471 B
- compat
- argparse.pyc65 kB
- argparse.py85 kB
- __init__.pyc140 B
- __init__.py0 B
- conll_convert_tags_to_uposf.pl1 kB
- check_sentence_ids.pl1 kB
- v2-conversion
- convert.py3 kB
- README.md2 kB
- processors_en.py1 kB
- processors_universal.py5 kB
- depgraph_utils.py6 kB
- nmod_obl_adjudication.py3 kB
- conllu_break_cycles.pl3 kB
- check_overlaps.pl1 kB
- survey_language_families.pl3 kB
- conllu_cut.pl2 kB
- conllu_copy_sentence_segmentation.pl12 kB
- file_util.py2 kB
- evaluate_treebank.pl18 kB
- eval.py42 kB
- fix-space-after-paragraph.pl4 kB
- generate_comparison_of_treebanks.pl2 kB
- find_duplicate_sentences.pl1 kB
- remove_duplicate_sentences.pl2 kB
- conllu_copy_annotation.pl4 kB
- check_release.pl37 kB
- package_ud_release.sh7 kB
- LICENSE.txt17 kB
- conllu-tenfold.pl2 kB
- enhanced_collapse_empty_nodes.pl8 kB
- conllu_to_conllx.pl2 kB
- survey_enhancements.pl9 kB
- survey_feature_language.pl8 kB
- fix_format_of_deps.pl1 kB
- mwtoken-stats.pl1 kB
- conllu_copy_basic_to_enhanced.pl1 kB
- save_evaluation_logs.sh962 B
- conllu-stats.pl107 kB
- normalize_unicode.pl511 B
- conllu_sort_sentences_by_ids.pl1 kB
- create_iso_639_3_symlinks.py175 kB
- test-cases
- nonvalid
- lowercase-postag.conllu141 B
- lowercase-feature-value-in-empty.conllu251 B
- empty-head.conllu114 B
- invalid-deps-id.conllu173 B
- misordered-feature.conllu243 B
- invalid-deps-syntax.conllu194 B
- missing-final-line.conllu155 B
- empty-field.conllu100 B
- head-not-0-deprel-root.conllu172 B
- empty-sentence.conllu163 B
- ambiguous-feature.conllu175 B
- trailing-tab.conllu127 B
- lowercase-postag-in-empty.conllu239 B
- head-0-deprel-not-root.conllu133 B
- multiple-sent_id.conllu736 B
- malformed_deps.conllu683 B
- head-not-empty-in-empty.conllu224 B
- lowercase-feature.conllu238 B
- duplicate-value.conllu137 B
- tanl-broken.conllu690 B
- misordered-layered-feature.conllu239 B
- whitespace_nonv.conllu274 B
- misplaced-comment-end.conllu429 B
- nonsequential-empty-node-id.conllu238 B
- dos-newlines.conllu698 B
- cyclic-deps.conllu227 B
- invalid-head.conllu164 B
- duplicate-layered-feature.conllu182 B
- id-with-extra-0.conllu140 B
- duplicate-feature.conllu142 B
- overlapping-multiword.conllu387 B
- token_with_cols_filled.conllu385 B
- self-cycle-deps.conllu164 B
- nonsequential-id.conllu176 B
- space-in-field.conllu127 B
- extra-empty-line.conllu287 B
- lowercase-feature-in-empty.conllu244 B
- non-proj.conllu109 B
- no-sent_id.conllu686 B
- id-starting-from-2.conllu247 B
- misindexed-empty-node.conllu235 B
- self-cycle-head.conllu190 B
- invalid-range.conllu375 B
- empty-node-without-dependent.conllu251 B
- uppercase-deps-deprel.conllu206 B
- multiword-with-pos.conllu407 B
- uppercase-deprel.conllu184 B
- invalid-deps-order.conllu409 B
- missing-space-after.conllu176 B
- extra-field.conllu130 B
- duplicate-id.conllu171 B
- invalid-range-format.conllu380 B
- deprel-not-empty-in-empty.conllu233 B
- misplaced-comment-mid.conllu401 B
- misordered-multiword.conllu392 B
- lowercase-value.conllu237 B
- valid
- maximal-empty-node.conllu273 B
- multiple-features.conllu295 B
- whitespace.conllu294 B
- id_test_part2.conllu375 B
- empty-nodes.conllu324 B
- id_test_part1.conllu375 B
- tanl.conllu673 B
- empty-file.conllu0 B
- minimal-empty-node.conllu239 B
- layered-features.conllu272 B
- nonvalid
- collect_propn_sequences.pl3 kB
- enhanced_graph_properties.pl21 kB
- check_text_wosp_match.sh750 B
- conllu-dependency-stats.pl944 B
- overlap.py2 kB