Files in this item
Download all files in item (534.14 MB)- Name
- ud-treebanks-v2.9.tgz
- Size
- 441.62 MB
- Format
- application/x-gzip
- Description
- Treebank data
- MD5
- 2d5d04a1868093977cef42c92c870153
- ud-treebanks-v2.9
- UD_Italian-PUD
- stats.xml8 kB
- it_pud-ud-test.txt123 kB
- README.md5 kB
- it_pud-ud-test.conllu1 MB
- LICENSE.txt19 kB
- UD_Telugu-MTG
- te_mtg-ud-test.txt10 kB
- te_mtg-ud-train.conllu494 kB
- te_mtg-ud-dev.conllu64 kB
- stats.xml3 kB
- te_mtg-ud-test.conllu70 kB
- LICENSE.txt202 B
- README.txt1 kB
- te_mtg-ud-dev.txt9 kB
- te_mtg-ud-train.txt72 kB
- UD_Swedish-Talbanken
- sv_talbanken-ud-test.txt122 kB
- README.md7 kB
- sv_talbanken-ud-train.txt402 kB
- stats.xml9 kB
- LICENSE.txt20 kB
- sv_talbanken-ud-train.conllu5 MB
- sv_talbanken-ud-dev.conllu834 kB
- sv_talbanken-ud-dev.txt58 kB
- sv_talbanken-ud-test.conllu1 MB
- UD_Finnish-OOD
- fi_ood-ud-test.txt134 kB
- stats.xml18 kB
- README.md1 kB
- fi_ood-ud-test.conllu1 MB
- LICENSE.txt202 B
- UD_Neapolitan-RB
- stats.xml1 kB
- README.md1 kB
- LICENSE.txt202 B
- nap_rb-ud-test.conllu431 B
- nap_rb-ud-test.txt56 B
- UD_Soi-AHA
- stats.xml3 kB
- soj_aha-ud-test.txt386 B
- README.md1 kB
- LICENSE.txt202 B
- soj_aha-ud-test.conllu4 kB
- UD_Turkish-Atis
- tr_atis-ud-train.conllu2 MB
- README.md1 kB
- tr_atis-ud-dev.conllu349 kB
- tr_atis-ud-test.txt38 kB
- tr_atis-ud-dev.txt38 kB
- stats.xml10 kB
- LICENSE.txt202 B
- tr_atis-ud-train.txt289 kB
- tr_atis-ud-test.conllu353 kB
- UD_Czech-CLTT
- cs_cltt-ud-dev.conllu483 kB
- README.md2 kB
- cs_cltt-ud-test.txt29 kB
- cs_cltt-ud-train.txt195 kB
- cs_cltt-ud-dev.txt33 kB
- cs_cltt-ud-train.conllu2 MB
- stats.xml13 kB
- LICENSE.txt265 B
- cs_cltt-ud-test.conllu416 kB
- UD_Swiss_German-UZH
- stats.xml2 kB
- gsw_uzh-ud-test.txt7 kB
- README.md3 kB
- LICENSE.txt202 B
- gsw_uzh-ud-test.conllu58 kB
- UD_Czech-PUD
- stats.xml16 kB
- README.md3 kB
- LICENSE.txt202 B
- cs_pud-ud-test.txt114 kB
- cs_pud-ud-test.conllu2 MB
- UD_Kiche-IU
- stats.xml11 kB
- quc_iu-ud-test.conllu823 kB
- README.md1 kB
- quc_iu-ud-test.txt46 kB
- LICENSE.txt202 B
- UD_Akuntsu-TuDeT
- stats.xml5 kB
- aqz_tudet-ud-test.conllu26 kB
- README.md3 kB
- aqz_tudet-ud-test.txt2 kB
- LICENSE.txt202 B
- UD_German-GSD
- README.md8 kB
- de_gsd-ud-dev.conllu876 kB
- de_gsd-ud-dev.txt72 kB
- de_gsd-ud-train.txt1 MB
- de_gsd-ud-test.conllu1 MB
- stats.xml10 kB
- de_gsd-ud-train.conllu18 MB
- LICENSE.txt202 B
- de_gsd-ud-test.txt97 kB
- UD_Komi_Permyak-UH
- stats.xml14 kB
- README.md6 kB
- koi_uh-ud-test.conllu99 kB
- LICENSE.txt202 B
- koi_uh-ud-test.txt8 kB
- UD_Faroese-FarPaHC
- fo_farpahc-ud-dev.conllu465 kB
- fo_farpahc-ud-dev.txt42 kB
- README.md4 kB
- fo_farpahc-ud-test.conllu459 kB
- fo_farpahc-ud-train.txt105 kB
- fo_farpahc-ud-train.conllu1 MB
- stats.xml5 kB
- fo_farpahc-ud-test.txt42 kB
- LICENSE.txt202 B
- UD_Japanese-PUD
- ja_pud-ud-test.txt138 kB
- stats.xml3 kB
- README.md5 kB
- ja_pud-ud-test.conllu4 MB
- LICENSE.txt19 kB
- UD_Lithuanian-HSE
- lt_hse-ud-dev.txt6 kB
- README.md2 kB
- lt_hse-ud-test.conllu88 kB
- lt_hse-ud-train.txt20 kB
- lt_hse-ud-test.txt6 kB
- lt_hse-ud-train.conllu255 kB
- stats.xml10 kB
- LICENSE.txt202 B
- lt_hse-ud-dev.conllu87 kB
- UD_Japanese-PUDLUW
- stats.xml4 kB
- README.md5 kB
- ja_pudluw-ud-test.txt138 kB
- LICENSE.txt202 B
- ja_pudluw-ud-test.conllu2 MB
- UD_Chinese-PUD
- stats.xml4 kB
- README.md5 kB
- zh_pud-ud-test.conllu1 MB
- zh_pud-ud-test.txt101 kB
- LICENSE.txt19 kB
- UD_Latin-UDante
- la_udante-ud-train.conllu2 MB
- README.md7 kB
- la_udante-ud-dev.conllu1 MB
- la_udante-ud-train.txt170 kB
- stats.xml19 kB
- la_udante-ud-test.txt78 kB
- la_udante-ud-dev.txt67 kB
- LICENSE.txt202 B
- la_udante-ud-test.conllu1 MB
- UD_Buryat-BDT
- stats.xml12 kB
- README.txt1 kB
- bxr_bdt-ud-train.conllu10 kB
- bxr_bdt-ud-train.txt1 kB
- LICENSE.txt202 B
- bxr_bdt-ud-test.txt114 kB
- bxr_bdt-ud-test.conllu699 kB
- UD_Slovenian-SST
- stats.xml11 kB
- sl_sst-ud-test.txt53 kB
- README.txt4 kB
- sl_sst-ud-train.conllu1 MB
- sl_sst-ud-test.conllu880 kB
- LICENSE.txt441 B
- sl_sst-ud-train.txt103 kB
- UD_Latin-PROIEL
- la_proiel-ud-dev.txt87 kB
- README.md2 kB
- la_proiel-ud-dev.conllu1 MB
- la_proiel-ud-test.txt88 kB
- stats.xml10 kB
- la_proiel-ud-train.conllu15 MB
- LICENSE.txt279 B
- la_proiel-ud-train.txt1 MB
- la_proiel-ud-test.conllu1 MB
- UD_Warlpiri-UFAL
- stats.xml6 kB
- README.md870 B
- LICENSE.txt202 B
- wbp_ufal-ud-test.conllu37 kB
- wbp_ufal-ud-test.txt2 kB
- UD_Turkish-IMST
- tr_imst-ud-test.txt65 kB
- README.md2 kB
- tr_imst-ud-train.conllu2 MB
- tr_imst-ud-test.conllu801 kB
- tr_imst-ud-dev.conllu797 kB
- tr_imst-ud-dev.txt64 kB
- stats.xml13 kB
- LICENSE.txt20 kB
- tr_imst-ud-train.txt246 kB
- UD_French-FQB
- stats.xml7 kB
- fr_fqb-ud-test.conllu1 MB
- fr_fqb-ud-test.txt117 kB
- README.md3 kB
- LICENSE.txt14 kB
- UD_Welsh-CCG
- cy_ccg-ud-test.txt79 kB
- cy_ccg-ud-test.conllu1 MB
- README.md1 kB
- cy_ccg-ud-dev.txt43 kB
- cy_ccg-ud-train.txt71 kB
- cy_ccg-ud-train.conllu967 kB
- cy_ccg-ud-dev.conllu595 kB
- stats.xml8 kB
- LICENSE.txt202 B
- UD_Chinese-GSDSimp
- zh_gsdsimp-ud-test.txt53 kB
- README.md2 kB
- zh_gsdsimp-ud-dev.conllu680 kB
- zh_gsdsimp-ud-train.txt433 kB
- zh_gsdsimp-ud-train.conllu5 MB
- stats.xml5 kB
- LICENSE.txt202 B
- zh_gsdsimp-ud-dev.txt55 kB
- zh_gsdsimp-ud-test.conllu647 kB
- UD_Slovenian-SSJ
- sl_ssj-ud-dev.conllu1 MB
- sl_ssj-ud-train.txt619 kB
- sl_ssj-ud-test.conllu1 MB
- sl_ssj-ud-train.conllu9 MB
- sl_ssj-ud-dev.txt79 kB
- stats.xml12 kB
- LICENSE.txt543 B
- README.txt5 kB
- sl_ssj-ud-test.txt78 kB
- UD_Old_East_Slavic-TOROT
- README.md3 kB
- orv_torot-ud-test.txt150 kB
- orv_torot-ud-train.txt1 MB
- orv_torot-ud-train.conllu11 MB
- orv_torot-ud-dev.conllu1 MB
- orv_torot-ud-dev.txt151 kB
- orv_torot-ud-test.conllu1 MB
- stats.xml12 kB
- LICENSE.txt197 B
- UD_Japanese-BCCWJLUW
- README.md3 kB
- ja_bccwjluw-ud-test.txt133 kB
- ja_bccwjluw-ud-dev.conllu7 MB
- ja_bccwjluw-ud-test.conllu7 MB
- ja_bccwjluw-ud-train.txt711 kB
- ja_bccwjluw-ud-dev.txt144 kB
- merge
- test_pos.pkl1 MB
- dev_pos.pkl2 MB
- script
- lib.py5 kB
- restore_word_unit_bccwj.py7 kB
- convert_core_bccwj_pkl.py746 B
- misc_mapping.pkl315 B
- merge.sh1 kB
- train_pos.pkl10 MB
- stats.xml2 kB
- LICENSE.txt202 B
- ja_bccwjluw-ud-train.conllu37 MB
- UD_French-PUD
- fr_pud-ud-test.txt130 kB
- stats.xml8 kB
- fr_pud-ud-test.conllu1 MB
- README.md5 kB
- LICENSE.txt19 kB
- UD_Russian-SynTagRus
- README.md4 kB
- ru_syntagrus-ud-dev.txt1 MB
- ru_syntagrus-ud-test.txt1 MB
- ru_syntagrus-ud-dev.conllu14 MB
- ru_syntagrus-ud-train.conllu110 MB
- ru_syntagrus-ud-train.txt12 MB
- ru_syntagrus-ud-test.conllu14 MB
- stats.xml14 kB
- LICENSE.txt188 B
- UD_Manx-Cadhan
- stats.xml7 kB
- README.md2 kB
- LICENSE.txt656 B
- gv_cadhan-ud-test.txt82 kB
- gv_cadhan-ud-test.conllu1 MB
- UD_Moksha-JR
- stats.xml24 kB
- README.md5 kB
- mdf_jr-ud-test.txt33 kB
- mdf_jr-ud-test.conllu343 kB
- LICENSE.txt202 B
- UD_Munduruku-TuDeT
- stats.xml7 kB
- README.md2 kB
- LICENSE.txt202 B
- myu_tudet-ud-test.conllu39 kB
- myu_tudet-ud-test.txt2 kB
- UD_Indonesian-GSD
- README.md6 kB
- id_gsd-ud-test.txt69 kB
- id_gsd-ud-dev.conllu1020 kB
- id_gsd-ud-train.conllu7 MB
- stats.xml8 kB
- LICENSE.txt202 B
- id_gsd-ud-test.conllu950 kB
- id_gsd-ud-dev.txt73 kB
- id_gsd-ud-train.txt573 kB
- UD_Tagalog-TRG
- tl_trg-ud-test.txt3 kB
- stats.xml7 kB
- tl_trg-ud-test.conllu59 kB
- README.md1 kB
- LICENSE.txt202 B
- UD_Turkish-PUD
- stats.xml12 kB
- README.md6 kB
- tr_pud-ud-test.conllu1 MB
- tr_pud-ud-test.txt119 kB
- LICENSE.txt19 kB
- UD_French-ParTUT
- README.md5 kB
- fr_partut-ud-dev.conllu116 kB
- fr_partut-ud-train.conllu1 MB
- fr_partut-ud-test.txt14 kB
- fr_partut-ud-train.txt128 kB
- stats.xml8 kB
- LICENSE.txt18 kB
- fr_partut-ud-test.conllu164 kB
- fr_partut-ud-dev.txt9 kB
- UD_Turkish-Tourism
- tr_tourism-ud-test.conllu715 kB
- README.md1 kB
- tr_tourism-ud-dev.conllu758 kB
- tr_tourism-ud-train.conllu5 MB
- stats.xml13 kB
- LICENSE.txt202 B
- tr_tourism-ud-train.txt478 kB
- tr_tourism-ud-dev.txt70 kB
- tr_tourism-ud-test.txt67 kB
- UD_Spanish-GSD
- README.md4 kB
- es_gsd-ud-test.conllu714 kB
- es_gsd-ud-train.conllu22 MB
- es_gsd-ud-test.txt61 kB
- es_gsd-ud-train.txt1 MB
- es_gsd-ud-dev.conllu2 MB
- es_gsd-ud-dev.txt191 kB
- stats.xml10 kB
- LICENSE.txt202 B
- UD_Tagalog-Ugnayan
- stats.xml3 kB
- README.md1 kB
- tl_ugnayan-ud-test.txt5 kB
- tl_ugnayan-ud-test.conllu53 kB
- LICENSE.txt219 B
- UD_Mbya_Guarani-Thomas
- stats.xml8 kB
- README.md3 kB
- gun_thomas-ud-test.txt7 kB
- LICENSE.txt202 B
- gun_thomas-ud-test.conllu90 kB
- UD_Italian-TWITTIRO
- README.md3 kB
- it_twittiro-ud-test.conllu184 kB
- it_twittiro-ud-test.txt15 kB
- it_twittiro-ud-train.conllu1 MB
- it_twittiro-ud-train.txt120 kB
- stats.xml9 kB
- it_twittiro-ud-dev.conllu188 kB
- it_twittiro-ud-dev.txt15 kB
- LICENSE.txt202 B
- UD_Polish-LFG
- pl_lfg-ud-dev.txt74 kB
- README.md6 kB
- pl_lfg-ud-train.txt596 kB
- pl_lfg-ud-test.txt74 kB
- pl_lfg-ud-dev.conllu1 MB
- pl_lfg-ud-test.conllu1 MB
- stats.xml14 kB
- LICENSE.txt34 kB
- pl_lfg-ud-train.conllu11 MB
- UD_Romanian-ArT
- stats.xml8 kB
- ro_art-ud-test.conllu44 kB
- README.md1 kB
- LICENSE.txt202 B
- ro_art-ud-test.txt2 kB
- UD_Indonesian-CSUI
- stats.xml7 kB
- README.md3 kB
- id_csui-ud-train.txt108 kB
- id_csui-ud-test.txt59 kB
- LICENSE.txt202 B
- id_csui-ud-test.conllu589 kB
- id_csui-ud-train.conllu1 MB
- UD_Dutch-Alpino
- nl_alpino-ud-test.conllu902 kB
- nl_alpino-ud-train.conllu14 MB
- nl_alpino-ud-train.txt1016 kB
- nl_alpino-ud-dev.conllu942 kB
- nl_alpino-ud-dev.txt62 kB
- stats.xml7 kB
- LICENSE.txt19 kB
- README.txt5 kB
- nl_alpino-ud-test.txt64 kB
- UD_Romanian-Nonstandard
- ro_nonstandard-ud-test.txt104 kB
- README.md9 kB
- ro_nonstandard-ud-dev.txt91 kB
- ro_nonstandard-ud-dev.conllu1 MB
- ro_nonstandard-ud-test.conllu1 MB
- ro_nonstandard-ud-train.txt2 MB
- ro_nonstandard-ud-train.conllu44 MB
- stats.xml12 kB
- LICENSE.txt202 B
- UD_Livvi-KKPP
- stats.xml10 kB
- README.md4 kB
- olo_kkpp-ud-train.txt808 B
- olo_kkpp-ud-test.txt9 kB
- olo_kkpp-ud-test.conllu103 kB
- LICENSE.txt202 B
- olo_kkpp-ud-train.conllu15 kB
- UD_German-PUD
- stats.xml9 kB
- README.md5 kB
- LICENSE.txt19 kB
- de_pud-ud-test.txt126 kB
- de_pud-ud-test.conllu1 MB
- UD_Western_Armenian-ArmTDP
- README.md3 kB
- hyw_armtdp-ud-test.txt97 kB
- hyw_armtdp-ud-train.txt755 kB
- hyw_armtdp-ud-dev.txt103 kB
- hyw_armtdp-ud-test.conllu1 MB
- hyw_armtdp-ud-dev.conllu1 MB
- stats.xml24 kB
- hyw_armtdp-ud-train.conllu9 MB
- LICENSE.txt202 B
- UD_Urdu-UDTB
- README.md2 kB
- ur_udtb-ud-train.txt853 kB
- ur_udtb-ud-test.txt117 kB
- ur_udtb-ud-train.conllu11 MB
- ur_udtb-ud-test.conllu1 MB
- stats.xml10 kB
- ur_udtb-ud-dev.txt115 kB
- LICENSE.txt247 B
- ur_udtb-ud-dev.conllu1 MB
- UD_Estonian-EDT
- et_edt-ud-test.txt312 kB
- et_edt-ud-train.txt2 MB
- README.md4 kB
- et_edt-ud-test.conllu3 MB
- et_edt-ud-dev.conllu3 MB
- et_edt-ud-train.conllu24 MB
- stats.xml13 kB
- LICENSE.txt279 B
- et_edt-ud-dev.txt284 kB
- UD_Kaapor-TuDeT
- stats.xml4 kB
- README.md2 kB
- urb_tudet-ud-test.txt2 kB
- LICENSE.txt202 B
- urb_tudet-ud-test.conllu24 kB
- UD_Finnish-FTB
- fi_ftb-ud-train.conllu10 MB
- README.md3 kB
- fi_ftb-ud-test.txt116 kB
- fi_ftb-ud-test.conllu1 MB
- stats.xml17 kB
- LICENSE.txt43 kB
- fi_ftb-ud-dev.conllu1 MB
- fi_ftb-ud-train.txt904 kB
- fi_ftb-ud-dev.txt111 kB
- UD_Galician-TreeGal
- stats.xml9 kB
- README.md5 kB
- gl_treegal-ud-test.txt50 kB
- gl_treegal-ud-train.conllu1 MB
- LICENSE.txt14 kB
- gl_treegal-ud-train.txt76 kB
- gl_treegal-ud-test.conllu670 kB
- UD_Portuguese-GSD
- pt_gsd-ud-test.conllu1 MB
- README.md3 kB
- pt_gsd-ud-train.conllu11 MB
- pt_gsd-ud-train.txt1 MB
- pt_gsd-ud-dev.conllu1 MB
- pt_gsd-ud-test.txt153 kB
- stats.xml5 kB
- LICENSE.txt202 B
- pt_gsd-ud-dev.txt156 kB
- UD_Thai-PUD
- stats.xml4 kB
- th_pud-ud-test.conllu1 MB
- README.md5 kB
- LICENSE.txt19 kB
- th_pud-ud-test.txt281 kB
- UD_Hindi_English-HIENCS
- README.md3 kB
- qhe_hiencs-ud-train.conllu681 kB
- qhe_hiencs-ud-test.conllu104 kB
- qhe_hiencs-ud-test.txt6 kB
- qhe_hiencs-ud-train.txt39 kB
- qhe_hiencs-ud-dev.conllu107 kB
- merge
- train-annot.json1 MB
- tweet_ids_dev.txt4 kB
- EMOTICONS3 kB
- EDITS6 kB
- test-annot.json229 kB
- tweet_ids_test.txt4 kB
- NONBREAKING_PREFIXES812 B
- DOMAINS293 B
- tweet_ids_train.txt26 kB
- dev-annot.json236 kB
- stats.xml2 kB
- LICENSE.txt202 B
- crawl_tweets.py18 kB
- qhe_hiencs-ud-dev.txt6 kB
- UD_Czech-FicTree
- README.md3 kB
- cs_fictree-ud-test.conllu1 MB
- cs_fictree-ud-test.txt86 kB
- cs_fictree-ud-train.conllu13 MB
- cs_fictree-ud-dev.txt86 kB
- cs_fictree-ud-dev.conllu1 MB
- stats.xml15 kB
- LICENSE.txt219 B
- cs_fictree-ud-train.txt696 kB
- UD_Italian-PoSTWITA
- it_postwita-ud-test.conllu759 kB
- README.md3 kB
- it_postwita-ud-train.txt526 kB
- it_postwita-ud-dev.conllu732 kB
- it_postwita-ud-train.conllu5 MB
- stats.xml9 kB
- LICENSE.txt18 kB
- it_postwita-ud-dev.txt64 kB
- it_postwita-ud-test.txt67 kB
- UD_Low_Saxon-LSDC
- stats.xml10 kB
- README.md4 kB
- nds_lsdc-ud-test.conllu193 kB
- LICENSE.txt202 B
- nds_lsdc-ud-test.txt10 kB
- UD_Finnish-TDT
- fi_tdt-ud-train.txt1 MB
- fi_tdt-ud-train.conllu12 MB
- fi_tdt-ud-test.conllu1 MB
- stats.xml20 kB
- fi_tdt-ud-test.txt154 kB
- LICENSE.txt24 kB
- README.txt3 kB
- fi_tdt-ud-dev.conllu1 MB
- fi_tdt-ud-dev.txt136 kB
- UD_Swedish-PUD
- stats.xml8 kB
- README.md3 kB
- LICENSE.txt202 B
- sv_pud-ud-test.txt115 kB
- sv_pud-ud-test.conllu1 MB
- UD_Polish-PDB
- pl_pdb-ud-train.txt1 MB
- README.md5 kB
- pl_pdb-ud-dev.conllu3 MB
- pl_pdb-ud-test.txt203 kB
- pl_pdb-ud-train.conllu27 MB
- pl_pdb-ud-dev.txt210 kB
- stats.xml17 kB
- LICENSE.txt384 B
- pl_pdb-ud-test.conllu3 MB
- UD_Amharic-ATT
- stats.xml7 kB
- am_att-ud-test.txt53 kB
- README.md1 kB
- am_att-ud-test.conllu995 kB
- LICENSE.txt202 B
- UD_Korean-Kaist
- ko_kaist-ud-test.conllu1 MB
- README.md1 kB
- ko_kaist-ud-train.txt2 MB
- ko_kaist-ud-dev.txt233 kB
- ko_kaist-ud-test.txt255 kB
- ko_kaist-ud-dev.conllu1 MB
- stats.xml4 kB
- LICENSE.txt202 B
- ko_kaist-ud-train.conllu17 MB
- UD_Bambara-CRB
- stats.xml6 kB
- README.md2 kB
- LICENSE.txt202 B
- bm_crb-ud-test.txt51 kB
- bm_crb-ud-test.conllu873 kB
- UD_Ukrainian-IU
- README.md9 kB
- uk_iu-ud-train.txt895 kB
- uk_iu-ud-test.txt176 kB
- uk_iu-ud-test.conllu2 MB
- uk_iu-ud-dev.conllu1 MB
- uk_iu-ud-dev.txt128 kB
- stats.xml17 kB
- LICENSE.txt172 B
- uk_iu-ud-train.conllu12 MB
- UD_English-ESL
- en_esl-ud-dev.conllu319 kB
- README.md4 kB
- en_esl-ud-train.txt153 kB
- en_esl-ud-train.conllu2 MB
- merge.py905 B
- en_esl-ud-test.txt18 kB
- stats.xml3 kB
- en_esl-ud-dev.txt18 kB
- LICENSE.txt19 kB
- en_esl-ud-test.conllu321 kB
- UD_Persian-Seraji
- fa_seraji-ud-dev.conllu989 kB
- README.md5 kB
- fa_seraji-ud-test.txt134 kB
- fa_seraji-ud-train.conllu7 MB
- stats.xml9 kB
- fa_seraji-ud-test.conllu1021 kB
- fa_seraji-ud-train.txt995 kB
- LICENSE.txt110 B
- fa_seraji-ud-dev.txt133 kB
- UD_Indonesian-PUD
- stats.xml8 kB
- README.md8 kB
- id_pud-ud-test.txt117 kB
- LICENSE.txt19 kB
- id_pud-ud-test.conllu1 MB
- UD_Belarusian-HSE
- be_hse-ud-test.txt180 kB
- README.md6 kB
- be_hse-ud-train.txt2 MB
- be_hse-ud-dev.conllu1 MB
- be_hse-ud-train.conllu26 MB
- be_hse-ud-test.conllu1 MB
- stats.xml15 kB
- LICENSE.txt1021 B
- be_hse-ud-dev.txt164 kB
- UD_Guajajara-TuDeT
- stats.xml8 kB
- gub_tudet-ud-test.txt10 kB
- README.md2 kB
- gub_tudet-ud-test.conllu156 kB
- LICENSE.txt202 B
- UD_Norwegian-NynorskLIA
- no_nynorsklia-ud-test.txt42 kB
- no_nynorsklia-ud-dev.conllu593 kB
- no_nynorsklia-ud-test.conllu594 kB
- stats.xml8 kB
- LICENSE.txt202 B
- README.txt1 kB
- no_nynorsklia-ud-dev.txt42 kB
- no_nynorsklia-ud-train.txt147 kB
- no_nynorsklia-ud-train.conllu2 MB
- UD_Italian-VIT
- it_vit-ud-test.conllu1 MB
- README.md4 kB
- it_vit-ud-dev.conllu1 MB
- it_vit-ud-train.conllu13 MB
- it_vit-ud-dev.txt150 kB
- it_vit-ud-test.txt130 kB
- stats.xml10 kB
- LICENSE.txt202 B
- it_vit-ud-train.txt1 MB
- UD_Spanish-PUD
- stats.xml8 kB
- es_pud-ud-test.conllu1 MB
- README.md5 kB
- LICENSE.txt19 kB
- es_pud-ud-test.txt123 kB
- UD_Scottish_Gaelic-ARCOSG
- gd_arcosg-ud-train.txt315 kB
- README.md7 kB
- gd_arcosg-ud-test.conllu607 kB
- gd_arcosg-ud-dev.txt52 kB
- gd_arcosg-ud-test.txt51 kB
- gd_arcosg-ud-train.conllu3 MB
- stats.xml9 kB
- LICENSE.txt202 B
- gd_arcosg-ud-dev.conllu614 kB
- UD_Chinese-HK
- stats.xml3 kB
- README.md4 kB
- LICENSE.txt202 B
- zh_hk-ud-test.conllu482 kB
- zh_hk-ud-test.txt41 kB
- UD_Afrikaans-AfriBooms
- af_afribooms-ud-test.conllu618 kB
- af_afribooms-ud-train.conllu2 MB
- af_afribooms-ud-test.txt57 kB
- stats.xml8 kB
- LICENSE.txt202 B
- README.txt1 kB
- af_afribooms-ud-dev.txt30 kB
- af_afribooms-ud-dev.conllu321 kB
- af_afribooms-ud-train.txt195 kB
- UD_Japanese-GSD
- ja_gsd-ud-dev.txt58 kB
- README.md8 kB
- ja_gsd-ud-dev.conllu1 MB
- ja_gsd-ud-train.conllu26 MB
- stats.xml4 kB
- LICENSE.txt202 B
- ja_gsd-ud-test.conllu2 MB
- ja_gsd-ud-train.txt804 kB
- ja_gsd-ud-test.txt62 kB
- UD_Kangri-KDTB
- stats.xml2 kB
- xnr_kdtb-ud-test.conllu132 kB
- README.md1 kB
- LICENSE.txt202 B
- xnr_kdtb-ud-test.txt29 kB
- UD_Czech-CAC
- cs_cac-ud-test.conllu1 MB
- cs_cac-ud-test.txt71 kB
- README.md5 kB
- cs_cac-ud-train.conllu51 MB
- cs_cac-ud-dev.txt72 kB
- cs_cac-ud-train.txt2 MB
- stats.xml19 kB
- LICENSE.txt265 B
- cs_cac-ud-dev.conllu1 MB
- UD_Faroese-OFT
- stats.xml7 kB
- README.md1 kB
- fo_oft-ud-test.txt58 kB
- fo_oft-ud-test.conllu783 kB
- LICENSE.txt822 B
- UD_Ancient_Greek-PROIEL
- README.md2 kB
- grc_proiel-ud-dev.txt159 kB
- grc_proiel-ud-train.conllu19 MB
- grc_proiel-ud-test.conllu1 MB
- grc_proiel-ud-test.txt154 kB
- stats.xml13 kB
- LICENSE.txt279 B
- grc_proiel-ud-train.txt2 MB
- grc_proiel-ud-dev.conllu1 MB
- UD_English-Pronouns
- stats.xml5 kB
- README.md9 kB
- en_pronouns-ud-test.conllu138 kB
- LICENSE.txt202 B
- en_pronouns-ud-test.txt7 kB
- UD_Czech-PDT
- cs_pdt-ud-train.conllu127 MB
- README.md8 kB
- cs_pdt-ud-test.conllu18 MB
- cs_pdt-ud-test.txt1 MB
- cs_pdt-ud-dev.txt989 kB
- cs_pdt-ud-dev.conllu17 MB
- stats.xml20 kB
- LICENSE.txt19 kB
- cs_pdt-ud-train.txt7 MB
- UD_Chinese-GSD
- README.md2 kB
- zh_gsd-ud-test.conllu647 kB
- zh_gsd-ud-train.conllu5 MB
- zh_gsd-ud-train.txt433 kB
- zh_gsd-ud-dev.txt55 kB
- zh_gsd-ud-dev.conllu680 kB
- stats.xml5 kB
- zh_gsd-ud-test.txt53 kB
- LICENSE.txt202 B
- UD_Old_Church_Slavonic-PROIEL
- cu_proiel-ud-train.txt369 kB
- README.md2 kB
- cu_proiel-ud-test.txt99 kB
- cu_proiel-ud-dev.conllu1 MB
- cu_proiel-ud-test.conllu1 MB
- cu_proiel-ud-train.conllu3 MB
- stats.xml12 kB
- LICENSE.txt279 B
- cu_proiel-ud-dev.txt97 kB
- UD_Arabic-PUD
- stats.xml9 kB
- README.md5 kB
- ar_pud-ud-test.txt168 kB
- LICENSE.txt19 kB
- ar_pud-ud-test.conllu1 MB
- UD_Icelandic-PUD
- stats.xml9 kB
- is_pud-ud-test.txt119 kB
- README.md3 kB
- LICENSE.txt202 B
- is_pud-ud-test.conllu1 MB
- UD_Erzya-JR
- myv_jr-ud-test.txt177 kB
- stats.xml30 kB
- README.txt6 kB
- LICENSE.txt202 B
- myv_jr-ud-test.conllu1 MB
- UD_Dutch-LassySmall
- nl_lassysmall-ud-train.conllu5 MB
- nl_lassysmall-ud-test.conllu925 kB
- nl_lassysmall-ud-test.txt67 kB
- nl_lassysmall-ud-train.txt420 kB
- nl_lassysmall-ud-dev.txt61 kB
- stats.xml7 kB
- LICENSE.txt392 B
- README.txt2 kB
- nl_lassysmall-ud-dev.conllu887 kB
- UD_Nayini-AHA
- stats.xml4 kB
- README.md1 kB
- LICENSE.txt202 B
- nyq_aha-ud-test.txt538 B
- nyq_aha-ud-test.conllu6 kB
- UD_French-GSD
- fr_gsd-ud-train.conllu21 MB
- README.md7 kB
- fr_gsd-ud-dev.conllu2 MB
- fr_gsd-ud-dev.txt184 kB
- stats.xml9 kB
- fr_gsd-ud-test.conllu624 kB
- LICENSE.txt202 B
- fr_gsd-ud-test.txt49 kB
- fr_gsd-ud-train.txt1 MB
- UD_Portuguese-Bosque
- README.md6 kB
- pt_bosque-ud-dev.txt140 kB
- pt_bosque-ud-test.conllu1 MB
- pt_bosque-ud-dev.conllu1 MB
- pt_bosque-ud-test.txt136 kB
- pt_bosque-ud-train.txt845 kB
- pt_bosque-ud-train.conllu10 MB
- stats.xml11 kB
- LICENSE.txt269 B
- UD_Frisian_Dutch-Fame
- stats.xml3 kB
- README.md3 kB
- qfn_fame-ud-test.conllu232 kB
- LICENSE.txt202 B
- qfn_fame-ud-test.txt19 kB
- UD_Kurmanji-MG
- stats.xml9 kB
- README.txt1 kB
- kmr_mg-ud-train.conllu17 kB
- LICENSE.txt202 B
- kmr_mg-ud-test.txt49 kB
- kmr_mg-ud-train.txt1 kB
- kmr_mg-ud-test.conllu729 kB
- UD_Javanese-CSUI
- stats.xml7 kB
- jv_csui-ud-test.txt12 kB
- README.md2 kB
- LICENSE.txt202 B
- jv_csui-ud-test.conllu141 kB
- UD_Portuguese-PUD
- stats.xml7 kB
- README.md5 kB
- LICENSE.txt19 kB
- pt_pud-ud-test.txt119 kB
- pt_pud-ud-test.conllu1 MB
- UD_Arabic-NYUAD
- README.md2 kB
- ar_nyuad-ud-test.conllu5 MB
- stats.xml6 kB
- LICENSE.txt202 B
- ar_nyuad-ud-dev.txt123 kB
- ar_nyuad-ud-train.txt982 kB
- ar_nyuad-ud-train.conllu44 MB
- ar_nyuad-ud-test.txt123 kB
- ar_nyuad-ud-dev.conllu5 MB
- merge.jar91 kB
- UD_Old_East_Slavic-RNC
- stats.xml15 kB
- orv_rnc-ud-train.conllu1 MB
- orv_rnc-ud-test.conllu1 MB
- README.md3 kB
- LICENSE.txt202 B
- orv_rnc-ud-test.txt177 kB
- orv_rnc-ud-train.txt149 kB
- UD_Chinese-CFL
- stats.xml4 kB
- zh_cfl-ud-test.conllux395 kB
- zh_cfl-ud-test.conllu375 kB
- README.txt7 kB
- zh_cfl-ud-test.txt30 kB
- LICENSE.txt202 B
- UD_French-Rhapsodie
- README.md1 kB
- fr_rhapsodie-ud-train.txt80 kB
- fr_rhapsodie-ud-train.conllu1 MB
- fr_rhapsodie-ud-test.conllu847 kB
- fr_rhapsodie-ud-dev.conllu908 kB
- fr_rhapsodie-ud-dev.txt53 kB
- fr_rhapsodie-ud-test.txt53 kB
- stats.xml8 kB
- LICENSE.txt202 B
- UD_English-EWT
- en_ewt-ud-dev.conllu1 MB
- en_ewt-ud-test.txt123 kB
- en_ewt-ud-train.conllu13 MB
- README.md8 kB
- en_ewt-ud-train.txt989 kB
- en_ewt-ud-dev.txt123 kB
- stats.xml10 kB
- LICENSE.txt19 kB
- en_ewt-ud-test.conllu1 MB
- UD_Latin-LLCT
- la_llct-ud-dev.conllu2 MB
- README.md6 kB
- la_llct-ud-test.conllu2 MB
- la_llct-ud-train.conllu16 MB
- stats.xml12 kB
- la_llct-ud-dev.txt136 kB
- LICENSE.txt202 B
- la_llct-ud-test.txt136 kB
- la_llct-ud-train.txt1 MB
- UD_Japanese-BCCWJ
- ja_bccwj-ud-train.conllu60 MB
- ja_bccwj-ud-train.txt902 kB
- ja_bccwj-ud-dev.txt177 kB
- ja_bccwj-ud-test.conllu11 MB
- merge
- dev_pos.pkl2 MB
- test_pos.pkl2 MB
- script
- lib.py5 kB
- restore_word_unit_bccwj.py7 kB
- convert_core_bccwj_pkl.py746 B
- merge.sh1 kB
- misc_mapping.pkl5 kB
- train_pos.pkl13 MB
- stats.xml2 kB
- LICENSE.txt18 kB
- README.txt3 kB
- ja_bccwj-ud-test.txt165 kB
- ja_bccwj-ud-dev.conllu11 MB
- UD_Latin-ITTB
- la_ittb-ud-train.txt2 MB
- README.md9 kB
- la_ittb-ud-dev.txt168 kB
- la_ittb-ud-test.conllu2 MB
- la_ittb-ud-dev.conllu2 MB
- stats.xml17 kB
- LICENSE.txt19 kB
- la_ittb-ud-test.txt169 kB
- la_ittb-ud-train.conllu35 MB
- UD_Armenian-ArmTDP
- README.md4 kB
- hy_armtdp-ud-train.conllu5 MB
- hy_armtdp-ud-dev.conllu694 kB
- hy_armtdp-ud-dev.txt57 kB
- hy_armtdp-ud-test.txt51 kB
- hy_armtdp-ud-train.txt434 kB
- stats.xml24 kB
- hy_armtdp-ud-test.conllu657 kB
- LICENSE.txt202 B
- UD_Vietnamese-VTB
- vi_vtb-ud-test.txt72 kB
- README.md1 kB
- vi_vtb-ud-train.txt127 kB
- vi_vtb-ud-train.conllu939 kB
- vi_vtb-ud-dev.txt69 kB
- stats.xml3 kB
- LICENSE.txt19 kB
- vi_vtb-ud-test.conllu545 kB
- vi_vtb-ud-dev.conllu522 kB
- UD_Cantonese-HK
- yue_hk-ud-test.txt53 kB
- stats.xml4 kB
- README.md4 kB
- LICENSE.txt202 B
- yue_hk-ud-test.conllu693 kB
- UD_Beja-NSC
- stats.xml7 kB
- README.md2 kB
- bej_nsc-ud-test.txt4 kB
- bej_nsc-ud-test.conllu153 kB
- LICENSE.txt202 B
- UD_Italian-ISDT
- README.md10 kB
- it_isdt-ud-dev.txt59 kB
- it_isdt-ud-train.txt1 MB
- it_isdt-ud-train.conllu18 MB
- it_isdt-ud-test.txt52 kB
- it_isdt-ud-test.conllu717 kB
- stats.xml10 kB
- LICENSE.txt22 kB
- it_isdt-ud-dev.conllu814 kB
- UD_Hebrew-HTB
- he_htb-ud-test.txt75 kB
- he_htb-ud-dev.txt71 kB
- he_htb-ud-train.conllu9 MB
- he_htb-ud-train.txt833 kB
- he_htb-ud-dev.conllu847 kB
- stats.xml11 kB
- LICENSE.txt249 B
- README.txt4 kB
- he_htb-ud-test.conllu909 kB
- UD_Bengali-BRU
- stats.xml8 kB
- README.md1 kB
- bn_bru-ud-test.txt3 kB
- LICENSE.txt202 B
- bn_bru-ud-test.conllu38 kB
- UD_Italian-PUD
- ... too many files ...0 B
- Name
- ud-documentation-v2.9.tgz
- Size
- 91.97 MB
- Format
- application/x-gzip
- Description
- Documentation
- MD5
- 8f2ae73f46c35f19cdacb13a2442ea8b
- ud-documentation-v2.9
- html
- misc
- new-documentation.html15 kB
- brainstorming-pisa-09-18-2017.html13 kB
- sme
- gv
- ar
- index.html12 kB
- img
- stars45.png1 kB
- stars50.png1 kB
- brat.png116 kB
- conllueditor_tree.png31 kB
- tred.png7 kB
- img_trans.gif43 B
- stars00.png1 kB
- stars.png3 kB
- stars05.png1 kB
- stars10.png1 kB
- dga.png6 kB
- palmyra.png404 kB
- stars15.png2 kB
- stars20.png1 kB
- stars25.png2 kB
- udpipe.png20 kB
- stars30.png1 kB
- stars35.png2 kB
- stars40.png1 kB
- arborator.PNG20 kB
- gh-edit.png47 kB
- structure.html5 kB
- qpm
- template-index.html8 kB
- af
- index.html11 kB
- feat
- Degree.html9 kB
- VerbType.html8 kB
- AdjType.html7 kB
- PartType.html9 kB
- Subcat.html8 kB
- bxr
- index.html11 kB
- dep
- advmod-neg.html7 kB
- cy
- template-index.html8 kB
- index.html15 kB
- feat
- Tense.html9 kB
- Number.html8 kB
- Person.html9 kB
- Poss.html7 kB
- Mood.html9 kB
- Gender.html8 kB
- Mutation.html11 kB
- Degree.html8 kB
- VerbForm.html8 kB
- dep
- nmod-agent.html7 kB
- nmod-redup.html8 kB
- case-pred.html7 kB
- obl-agent.html7 kB
- conjugation.md4 kB
- pos
- AUX_.html8 kB
- ADP.html9 kB
- ADV.html8 kB
- NUM.html8 kB
- INTJ.html7 kB
- ADJ.html8 kB
- PUNCT.html7 kB
- DET.html7 kB
- SCONJ.html7 kB
- SYM.html7 kB
- X.html7 kB
- PART.html7 kB
- CCONJ.html7 kB
- PROPN.html8 kB
- VERB.html9 kB
- NOUN.html9 kB
- PRON.html9 kB
- sla
- nap
- index.html10 kB
- qfn
- index.html10 kB
- cs
- tokenization.html14 kB
- pos
- PUNCT.html8 kB
- SCONJ.html8 kB
- INTJ.html9 kB
- SYM.html9 kB
- NOUN.html9 kB
- PART.html10 kB
- CONJ.html417 B
- VERB.html11 kB
- fr
- tokenization.html12 kB
- morphology.html6 kB
- syntax.html6 kB
- feat
- Person-psor.html7 kB
- Polarity.html7 kB
- Tense.html8 kB
- PronType.html11 kB
- Number.html8 kB
- Number-psor.html7 kB
- Person.html9 kB
- Mood.html9 kB
- Voice.html7 kB
- Gender.html7 kB
- Reflex.html7 kB
- NumType.html8 kB
- index.html7 kB
- VerbForm.html8 kB
- Definite.html7 kB
- specific-syntax.html18 kB
- pos
- DET.html8 kB
- PRON.html7 kB
- ADP.html7 kB
- PROPN.html8 kB
- VERB.html8 kB
- CCONJ.html7 kB
- SYM.html7 kB
- ADV.html7 kB
- SCONJ.html7 kB
- ADJ.html7 kB
- index.html6 kB
- AUX_.html8 kB
- X.html7 kB
- NUM.html8 kB
- PART.html7 kB
- NOUN.html8 kB
- PUNCT.html7 kB
- INTJ.html7 kB
- CONJ.html417 B
- dep
- flat-foreign.html7 kB
- acl-relcl.html8 kB
- parataxis-parenth.html6 kB
- fixed.html8 kB
- case.html8 kB
- aux-caus.html7 kB
- nummod.html8 kB
- aux-tense.html6 kB
- flat-name.html6 kB
- appos.html8 kB
- advcl-cleft.html7 kB
- nmod.html8 kB
- reparandum.html7 kB
- cc.html8 kB
- nmod-appos.html8 kB
- iobj.html8 kB
- parataxis-insert.html7 kB
- compound.html8 kB
- root.html8 kB
- expl.html10 kB
- obj-agent.html7 kB
- ccomp.html8 kB
- mark.html9 kB
- nsubj-pass.html7 kB
- obl-agent.html7 kB
- expl-comp.html6 kB
- expl-pass.html6 kB
- obl-arg.md579 B
- acl.html9 kB
- obj-lvc.html6 kB
- obl-mod.html6 kB
- obj.html8 kB
- csubj.html8 kB
- obl.html8 kB
- index.html68 kB
- dep-comp.html6 kB
- iobj-agent.html7 kB
- aux-pass.html7 kB
- expl-subj.html6 kB
- amod.html8 kB
- remnant.html421 B
- cop.html8 kB
- aux_.html9 kB
- advmod.html8 kB
- dislocated.html8 kB
- punct.html7 kB
- conj.html7 kB
- csubj-pass.html7 kB
- goeswith.html8 kB
- name.html413 B
- xcomp.html8 kB
- dep.html7 kB
- parataxis.html8 kB
- discourse.html8 kB
- det.html8 kB
- vocative.html7 kB
- nsubj.html8 kB
- advcl.html8 kB
- flat.html8 kB
- orphan.html7 kB
- nsubj-caus.html7 kB
- index.html9 kB
- overview
- introduction.html13 kB
- lt
- index.html15 kB
- feat
- Variant.html9 kB
- NumForm.html7 kB
- shp
- template-index.html8 kB
- bej
- index.html10 kB
- feat
- Definite.html7 kB
- Polite.html7 kB
- Tense.html8 kB
- Polarity.html7 kB
- Singulative.html7 kB
- ReportedSpeech.html7 kB
- Number.html8 kB
- Voice.html9 kB
- VerbType.html8 kB
- Reflex.html8 kB
- Person.html9 kB
- Case.html11 kB
- TokenType.html8 kB
- VerbForm.html8 kB
- Foreign.html6 kB
- PronType.html8 kB
- NumType.html7 kB
- Mood.html8 kB
- VerbClass.html7 kB
- Deixis.html7 kB
- Degree.html9 kB
- Aspect.html9 kB
- Gender.html8 kB
- Poss.html7 kB
- dep
- nummod-det.html6 kB
- acl-relcl.html7 kB
- acl-fixed.html6 kB
- obl-arg.html6 kB
- appos.html7 kB
- nmod.html7 kB
- reparandum.html7 kB
- mark-aff.html6 kB
- cc.html8 kB
- nsubj-aff.html6 kB
- dep-redup.html6 kB
- iobj.html8 kB
- root.html7 kB
- compound.html7 kB
- nmod-poss.html7 kB
- ccomp.html7 kB
- case-aff.html6 kB
- acl.html7 kB
- obl-mod.html6 kB
- dep-conj.html6 kB
- obj.html7 kB
- dep-comp.html6 kB
- advmod-fixed.html6 kB
- amod.html7 kB
- dislocated-subj.html6 kB
- aux_.html7 kB
- cop.html8 kB
- dislocated.html7 kB
- advmod.html7 kB
- punct.html7 kB
- parataxis-coord.html6 kB
- parataxis.html7 kB
- dep-aff.html6 kB
- aux-aff.html6 kB
- vocative.html7 kB
- discourse.html7 kB
- det.html7 kB
- nsubj.html8 kB
- parataxis-mod.html6 kB
- advcl.html8 kB
- conj-redup.html6 kB
- pos
- AUX_.html8 kB
- ADP.html7 kB
- CONJ.html421 B
- NUM.html7 kB
- ADV.html7 kB
- PUNCT.html7 kB
- INTJ.html7 kB
- ADJ.html8 kB
- DET.html8 kB
- SCONJ.html8 kB
- X.html7 kB
- PART.html7 kB
- CCONJ.html8 kB
- PROPN.html7 kB
- PRON.html7 kB
- NOUN.html8 kB
- VERB.html8 kB
- lzh
- template-index.html8 kB
- index.html14 kB
- dep
- discourse-sp.html7 kB
- flat-vv.html6 kB
- sandbox.html16 kB
- nyn
- template-index.html8 kB
- mag
- template-index.html8 kB
- logos
- by.svg9 kB
- by-nc-sa.svg22 kB
- logo-ud.png10 kB
- by-sa.svg16 kB
- by-nc-nd.svg18 kB
- F.svg3 kB
- LGPLLR.svg1 kB
- gpl.svg3 kB
- D.svg3 kB
- L.svg3 kB
- cc-zero.svg8 kB
- tools.html39 kB
- mdf
- index.html11 kB
- feat
- NameType.html9 kB
- Person-psor.html8 kB
- Variant.html8 kB
- Clitic.html9 kB
- Valency.html7 kB
- NounType.html7 kB
- Connegative.html8 kB
- NumForm.html6 kB
- Derivation.html8 kB
- Style.html6 kB
- Case.html16 kB
- Mood.html12 kB
- Reflex.html8 kB
- NumType.html10 kB
- index.html7 kB
- dep
- advmod-foc.html6 kB
- obl-lfrom.html7 kB
- nmod-lmod.html6 kB
- aux-opt.html6 kB
- obl-lto.html7 kB
- advcl-tcl.html7 kB
- aux-neg.html8 kB
- advmod-deg.html6 kB
- obl-cau.html6 kB
- advmod-cau.html6 kB
- obl-lmp.html7 kB
- obl-inst.html6 kB
- nmod-comp.html6 kB
- index.html9 kB
- advmod-tmod.html6 kB
- advcl-cau.html6 kB
- advmod-mmod.html6 kB
- nmod-appos.html7 kB
- advmod-eval.html6 kB
- aux-nec.html6 kB
- aux-q.html6 kB
- aux-cnd.html6 kB
- advmod-lfrom.html6 kB
- nmod-bahuv.html6 kB
- advmod-lto.html6 kB
- obl-comp.html6 kB
- obl-freq.html6 kB
- nmod-tmod.html6 kB
- csubj-cop.html7 kB
- advmod-freq.html6 kB
- nsubj-cop.html7 kB
- fa
- morphology.html5 kB
- newbie.html9 kB
- olo
- yue
- template-index.html8 kB
- dep
- compound-vv.html10 kB
- dislocated-vo.html7 kB
- advmod-df.html9 kB
- case.html11 kB
- advcl-coverb.html9 kB
- nummod.html8 kB
- compound-quant.html10 kB
- appos.html10 kB
- nmod.html9 kB
- reparandum.html8 kB
- cc.html8 kB
- iobj.html8 kB
- list.html9 kB
- root.html9 kB
- compound.html10 kB
- discourse-sp.html8 kB
- nsubj-periph.html6 kB
- expl.html8 kB
- compound-vo.html10 kB
- obl-patient.html7 kB
- ccomp.html16 kB
- mark.html10 kB
- nsubj-pass.html8 kB
- obl-agent.html8 kB
- obj-periph.html6 kB
- mark-adv.html6 kB
- acl.html11 kB
- obj.html10 kB
- clf.html10 kB
- csubj.html8 kB
- obl.html10 kB
- index.html11 kB
- aux-pass.html7 kB
- mark-rel.html8 kB
- amod.html8 kB
- compound-dir.html11 kB
- aux_.html11 kB
- cop.html8 kB
- advmod.html12 kB
- dislocated.html11 kB
- case-loc.html7 kB
- conj.html12 kB
- csubj-pass.html7 kB
- punct.html12 kB
- goeswith.html8 kB
- xcomp.html16 kB
- parataxis.html11 kB
- vocative.html8 kB
- discourse.html12 kB
- det.html9 kB
- obl-tmod.html9 kB
- nsubj.html8 kB
- compound-ext.html10 kB
- advcl.html10 kB
- flat.html9 kB
- orphan.html11 kB
- pos
- DET.html9 kB
- PRON.html10 kB
- ADP.html9 kB
- PROPN.html8 kB
- VERB.html8 kB
- ADV.html11 kB
- CCONJ.html8 kB
- SYM.html7 kB
- SCONJ.html8 kB
- ADJ.html9 kB
- index.html6 kB
- AUX_.html8 kB
- X.html7 kB
- NUM.html8 kB
- PART.html10 kB
- NOUN.html8 kB
- PUNCT.html7 kB
- INTJ.html8 kB
- u
- feat
- VerbForm.html14 kB
- Gender-obj.html8 kB
- Case.html36 kB
- all.html306 kB
- PronType.html15 kB
- Foreign.html7 kB
- Gender-erg.html8 kB
- Definiteness.html433 B
- Polite.html11 kB
- Polite-abs.html9 kB
- Person-subj.html10 kB
- AdvType.html8 kB
- Animacy.html12 kB
- Evident.html8 kB
- Number-psor.html7 kB
- Gender-subj.html9 kB
- VerbType.html10 kB
- Typo.html7 kB
- Clusivity.html7 kB
- Polarity.html10 kB
- NumType.html14 kB
- Person-dat.html9 kB
- Polite-erg.html9 kB
- PartType.html8 kB
- Number.html15 kB
- NounClass.html25 kB
- Style.html11 kB
- Number-dat.html10 kB
- Echo.html7 kB
- Tense.html14 kB
- PrepCase.html7 kB
- Gender.html11 kB
- Negative.html437 B
- ConjType.html7 kB
- Clusivity-psor.html8 kB
- index.html18 kB
- Hyph.html7 kB
- Gender-dat.html8 kB
- NumValue.html7 kB
- Person.html11 kB
- Person-abs.html9 kB
- Number-subj.html10 kB
- Aspect.html13 kB
- Degree.html10 kB
- Abbr.html7 kB
- Subcat.html8 kB
- Person-psor.html8 kB
- Voice.html14 kB
- NameType.html10 kB
- Person-erg.html11 kB
- PunctType.html10 kB
- Number-abs.html10 kB
- Person-obj.html9 kB
- Negativeness.html437 B
- Evidentiality.html425 B
- Reflex.html8 kB
- Clusivity-obj.html8 kB
- Mood.html16 kB
- Number-psed.html9 kB
- Polite-dat.html9 kB
- Deixis.html12 kB
- Definite.html12 kB
- Number-obj.html10 kB
- Poss.html8 kB
- NounType.html7 kB
- Gender-psor.html8 kB
- NumForm.html8 kB
- PunctSide.html7 kB
- Clusivity-subj.html8 kB
- DeixisRef.html8 kB
- Number-erg.html10 kB
- AdpType.html7 kB
- dep
- flat-foreign.html7 kB
- advmod-lmod.html6 kB
- acl-relcl.html7 kB
- fixed.html9 kB
- advmod-emph.html8 kB
- case.html13 kB
- nummod.html8 kB
- flat-name.html8 kB
- cc-preconj.html6 kB
- obl-arg.html9 kB
- appos.html12 kB
- compound-svc.html10 kB
- nmod.html8 kB
- nmod-tmod.html6 kB
- reparandum.html7 kB
- cc.html8 kB
- iobj.html10 kB
- det-numgov.html7 kB
- list.html9 kB
- nummod-gov.html7 kB
- root.html8 kB
- compound.html10 kB
- expl.html13 kB
- nmod-poss.html7 kB
- ccomp.html9 kB
- mark.html8 kB
- nsubj-pass.html7 kB
- obl-lmod.html6 kB
- obl-agent.html7 kB
- det-poss.html6 kB
- expl-pass.html6 kB
- det-nummod.html7 kB
- acl.html9 kB
- all.html160 kB
- obj.html9 kB
- clf.html11 kB
- csubj.html8 kB
- index.html14 kB
- obl.html9 kB
- aux-pass.html8 kB
- compound-lvc.html7 kB
- amod.html8 kB
- compound-redup.html7 kB
- expl-pv.html7 kB
- compound-prt.html7 kB
- aux_.html8 kB
- cop.html13 kB
- advmod.html9 kB
- dislocated.html8 kB
- conj.html11 kB
- csubj-pass.html7 kB
- expl-impers.html7 kB
- punct.html9 kB
- goeswith.html7 kB
- xcomp.html13 kB
- dep.html7 kB
- parataxis.html13 kB
- vocative.html8 kB
- discourse.html8 kB
- det.html8 kB
- nsubj.html10 kB
- obl-tmod.html6 kB
- advcl.html8 kB
- flat.html19 kB
- orphan.html8 kB
- overview
- tokenization.html9 kB
- syntax.html31 kB
- morphology.html23 kB
- complex-syntax.html23 kB
- enhanced-syntax.html47 kB
- feat-layers.html22 kB
- specific-syntax.html34 kB
- typos.html19 kB
- simple-syntax.html34 kB
- nominal-syntax.html9 kB
- pos
- DET.html13 kB
- PRON.html10 kB
- ADP.html8 kB
- PROPN.html9 kB
- VERB.html9 kB
- CCONJ.html8 kB
- SYM.html8 kB
- ADV.html10 kB
- SCONJ.html9 kB
- ADJ.html10 kB
- index.html7 kB
- AUX_.html9 kB
- X.html7 kB
- all.html46 kB
- NUM.html9 kB
- PART.html9 kB
- NOUN.html8 kB
- PUNCT.html8 kB
- INTJ.html8 kB
- feat
- format.html36 kB
- ky
- template-index.html8 kB
- pra
- template-index.html8 kB
- fro
- index.html10 kB
- feat
- index.html7 kB
- Morph.html7 kB
- dep
- obl-advmod.html7 kB
- nummod.html7 kB
- appos.html9 kB
- mark-advmod.html6 kB
- nmod.html8 kB
- obj-advneg.html7 kB
- cc.html8 kB
- iobj.html8 kB
- expl.html8 kB
- obj-obl.html7 kB
- nsubj-obj.html7 kB
- ccomp.html9 kB
- mark.html8 kB
- acl.html9 kB
- cc-nc.html6 kB
- nsubj-advmod.html7 kB
- obj.html9 kB
- csubj.html8 kB
- index.html10 kB
- obl.html8 kB
- obj-advmod.html7 kB
- amod.html8 kB
- remnant.html425 B
- advmod-obl.html6 kB
- cop.html8 kB
- aux_.html9 kB
- dislocated.html8 kB
- advmod.html9 kB
- conj.html8 kB
- xcomp.html8 kB
- vocative.html8 kB
- det.html8 kB
- nsubj.html9 kB
- case-det.html6 kB
- advcl.html9 kB
- orphan.html8 kB
- pos
- ADP.html7 kB
- AUX_.html8 kB
- NUM.html8 kB
- ADV.html7 kB
- INTJ.html7 kB
- ADJ.html8 kB
- DET.html8 kB
- SCONJ.html7 kB
- CCONJ.html7 kB
- PROPN.html7 kB
- index.html6 kB
- NOUN.html7 kB
- PRON.html8 kB
- VERB.html8 kB
- kpv
- index.html10 kB
- feat
- Person-psor.html7 kB
- PartForm.html7 kB
- Clitic.html8 kB
- Connegative.html7 kB
- NounType.html7 kB
- Valency.html7 kB
- PronType.html9 kB
- Derivation.html16 kB
- Case.html22 kB
- Reflex.html8 kB
- NumType.html10 kB
- index.html7 kB
- VerbForm.html11 kB
- dep
- flat-foreign.html7 kB
- aux-cnd.html6 kB
- advcl-eval.html6 kB
- nmod-prp.html6 kB
- advmod-lmod.html6 kB
- advmod-lto.html6 kB
- advmod-emph.html6 kB
- aux-tense.html6 kB
- cc-preconj.html7 kB
- obl-lto.html6 kB
- advcl-lto.html6 kB
- advcl-tcl.html7 kB
- advmod-deg.html6 kB
- nmod-appos.html7 kB
- aux-pot.html6 kB
- aux-nec.html6 kB
- nmod-comp.html6 kB
- nmod-lfrom.html6 kB
- flat-num.html6 kB
- aux-neg.html7 kB
- advmod-foc.html6 kB
- advmod-tmod.html6 kB
- advmod-cau.html6 kB
- advmod-mmod.html6 kB
- obl-lmod.html6 kB
- obl-cau.html6 kB
- obl-agent.html7 kB
- nmod-subj.html6 kB
- advmod-freq.html6 kB
- advmod-lmp.html6 kB
- csubj-cop.html7 kB
- csubj.html7 kB
- nsubj-cop.html7 kB
- index.html9 kB
- obl-mcl.html6 kB
- obl-lmp.html7 kB
- cop.html10 kB
- obl-lfrom.html7 kB
- nmod-lmod.html6 kB
- nmod-obj.html6 kB
- advmod-lfrom.html6 kB
- advmod-eval.html6 kB
- aux-aspect.html6 kB
- pos
- AUX_.html9 kB
- ADP.html7 kB
- ADV.html7 kB
- NUM.html7 kB
- PUNCT.html7 kB
- ADJ.html7 kB
- INTJ.html7 kB
- DET.html7 kB
- SCONJ.html7 kB
- X.html7 kB
- PART.html9 kB
- CCONJ.html7 kB
- PROPN.html7 kB
- NOUN.html7 kB
- PRON.html7 kB
- VERB.html7 kB
- gub
- index.html21 kB
- feat
- Tense.html8 kB
- Polarity.html8 kB
- Clusivity.html7 kB
- Voice.html8 kB
- Number.html9 kB
- OblTop.html7 kB
- Person.html9 kB
- Case.html9 kB
- Emph.html7 kB
- Red.html7 kB
- VerbForm.html8 kB
- Rel.html8 kB
- Evident.html8 kB
- Nomzr.html9 kB
- Foreign.html7 kB
- PronType.html9 kB
- Dimin.html7 kB
- Mood.html8 kB
- Detrans.html7 kB
- Aspect.html8 kB
- bn
- index.html17 kB
- README.md176 B
- en
- tokenization.html6 kB
- morphology.html8 kB
- migration-guidelines.html46 kB
- feat
- ExtPos.html9 kB
- Tense.html9 kB
- PronType.html11 kB
- Case.html8 kB
- Number.html10 kB
- Person.html9 kB
- Poss.html7 kB
- Mood.html9 kB
- Voice.html7 kB
- Gender.html7 kB
- NumType.html10 kB
- index.html7 kB
- Reflex.html7 kB
- Degree.html9 kB
- VerbForm.html10 kB
- Definite.html7 kB
- specific-syntax.html62 kB
- pos
- DET.html7 kB
- PRON.html8 kB
- ADP.html7 kB
- PROPN.html7 kB
- VERB.html7 kB
- CCONJ.html7 kB
- SYM.html7 kB
- ADV.html7 kB
- SCONJ.html8 kB
- ADJ.html7 kB
- index.html6 kB
- AUX_.html7 kB
- X.html7 kB
- NUM.html7 kB
- PART.html8 kB
- NOUN.html7 kB
- PUNCT.html7 kB
- INTJ.html7 kB
- CONJ.html417 B
- dep
- flat-foreign.html7 kB
- nmod-npmod.html7 kB
- acl-relcl.html7 kB
- fixed.html15 kB
- case.html8 kB
- nummod.html7 kB
- cc-preconj.html6 kB
- appos.html7 kB
- nmod.html8 kB
- nmod-tmod.html6 kB
- reparandum.html7 kB
- cc.html8 kB
- iobj.html7 kB
- list.html7 kB
- root.html7 kB
- compound.html9 kB
- expl.html7 kB
- obl-npmod.html7 kB
- nmod-poss.html7 kB
- ccomp.html8 kB
- mark.html8 kB
- nsubj-pass.html7 kB
- acl.html8 kB
- obj.html7 kB
- csubj.html7 kB
- index.html9 kB
- aux-pass.html7 kB
- amod.html8 kB
- compound-prt.html7 kB
- cop.html10 kB
- aux_.html8 kB
- advmod.html7 kB
- dislocated.html7 kB
- conj.html7 kB
- csubj-pass.html7 kB
- punct.html7 kB
- goeswith.html7 kB
- xcomp.html8 kB
- dep.html6 kB
- parataxis.html8 kB
- vocative.html7 kB
- det.html7 kB
- det-predet.html6 kB
- discourse.html7 kB
- obl-tmod.html6 kB
- nsubj.html10 kB
- advcl.html8 kB
- flat.html9 kB
- orphan.html9 kB
- index.html11 kB
- overview
- introduction.html11 kB
- sjo
- index.html13 kB
- dep
- mark-rel.html6 kB
- mark-plur.html6 kB
- mark-adv.html7 kB
- tt
- index.html10 kB
- feat
- Polarity.html8 kB
- Tense.html8 kB
- PronType.html9 kB
- Aspect.html9 kB
- Case.html14 kB
- Number.html10 kB
- Number-psor.html7 kB
- Person.html11 kB
- Mood.html12 kB
- Voice.html12 kB
- Reflex.html7 kB
- NumType.html9 kB
- Degree.html8 kB
- VerbForm.html12 kB
- dep
- compound-lvc.html6 kB
- pos
- DET.html8 kB
- PRON.html8 kB
- ADP.html9 kB
- PROPN.html8 kB
- VERB.html8 kB
- CCONJ.html7 kB
- SYM.html7 kB
- ADV.html8 kB
- SCONJ.html8 kB
- ADJ.html8 kB
- AUX_.html8 kB
- X.html7 kB
- NUM.html8 kB
- PART.html7 kB
- NOUN.html9 kB
- PUNCT.html8 kB
- INTJ.html8 kB
- CONJ.html417 B
- nl
- index.html29 kB
- overview
- introduction.html7 kB
- wo
- ajp
- index.html9 kB
- he
- misc
- html
- ... too many files ...0 B
- Name
- ud-tools-v2.9.tgz
- Size
- 559.19 KB
- Format
- application/x-gzip
- Description
- Tools
- MD5
- 3591a4120be718b03c5f44a73a2bdc28
- ud-tools-v2.9
- check_text_wosp_match.sh814 B
- conll_convert_tags_to_uposf.pl1 kB
- check_sentence_ids.pl1 kB
- conllu-sort-sentences-by-ids.pl1 kB
- package_st_data.sh10 kB
- conllu-stats.py6 kB
- runtests.sh1 kB
- conllu-w2t.py2 kB
- file_util.pyc2 kB
- example-data
- long-token-to-text-wrong.txt333 B
- long-token-to-text-correct.txt332 B
- long-token-to-text.conllu2 kB
- tanl.conll471 B
- validate_repo_metadata.py4 kB
- conllu-copy-basic-to-enhanced.pl1 kB
- evaluate_treebank.pl18 kB
- iwpt20_xud_eval.py36 kB
- enhanced_classify_relations.pl26 kB
- package_ud_release.sh7 kB
- conllu-stats.pl107 kB
- conllu-dependency-stats.pl944 B
- check-space-after-paragraph.pl2 kB
- file_util.py2 kB
- udlib.pm~20 kB
- conllu-quick-fix-id-sequence.pl2 kB
- conllu-formconvert.py3 kB
- find_duplicate_sentences.pl1 kB
- survey_misc.pl6 kB
- remove_duplicate_sentences.pl2 kB
- validate_all.sh943 B
- fix_format_of_deps.pl1 kB
- conllu_to_conllx.pl2 kB
- LICENSE.txt17 kB
- restore_conllu_lines.pl1 kB
- mwtoken-stats.pl1 kB
- Node.pm18 kB
- overlap.py2 kB
- collect_propn_sequences.pl3 kB
- survey_features.pl11 kB
- __pycache__
- file_util.cpython-37.pyc2 kB
- fix-space-after-paragraph.pl4 kB
- udlib.pm22 kB
- survey_deprel_subtypes.pl8 kB
- compat
- argparse.pyc65 kB
- argparse.py85 kB
- __init__.pyc140 B
- __init__.py0 B
- validate-python2-obsolete.py36 kB
- v2-conversion
- convert.py3 kB
- README.md2 kB
- processors_en.py1 kB
- processors_universal.py5 kB
- depgraph_utils.py6 kB
- nmod_obl_adjudication.py3 kB
- text_without_spaces.pl2 kB
- remove_sense_suffixes_from_lemmas.pl1 kB
- generate_comparison_of_treebanks.pl2 kB
- csort.pm7 kB
- enhanced_graph_properties.pl21 kB
- package_ud_release.sh~6 kB
- validate.py119 kB
- create_iso_639_3_symlinks.py175 kB
- conllu-quick-fix.pl20 kB
- test-cases
- nonvalid
- lowercase-postag.conllu141 B
- lowercase-feature-value-in-empty.conllu251 B
- empty-head.conllu114 B
- invalid-deps-id.conllu173 B
- invalid-deps-syntax.conllu194 B
- misordered-feature.conllu243 B
- missing-final-line.conllu155 B
- empty-field.conllu100 B
- head-not-0-deprel-root.conllu172 B
- ambiguous-feature.conllu175 B
- empty-sentence.conllu163 B
- trailing-tab.conllu127 B
- lowercase-postag-in-empty.conllu239 B
- multiple-sent_id.conllu736 B
- malformed_deps.conllu683 B
- head-0-deprel-not-root.conllu133 B
- head-not-empty-in-empty.conllu224 B
- lowercase-feature.conllu238 B
- duplicate-value.conllu137 B
- tanl-broken.conllu690 B
- misordered-layered-feature.conllu239 B
- whitespace_nonv.conllu274 B
- misplaced-comment-end.conllu429 B
- nonsequential-empty-node-id.conllu238 B
- dos-newlines.conllu698 B
- duplicate-layered-feature.conllu182 B
- cyclic-deps.conllu227 B
- invalid-head.conllu164 B
- id-with-extra-0.conllu140 B
- duplicate-feature.conllu142 B
- overlapping-multiword.conllu387 B
- token_with_cols_filled.conllu385 B
- self-cycle-deps.conllu164 B
- space-in-field.conllu127 B
- nonsequential-id.conllu176 B
- extra-empty-line.conllu287 B
- lowercase-feature-in-empty.conllu244 B
- non-proj.conllu109 B
- no-sent_id.conllu686 B
- id-starting-from-2.conllu247 B
- misindexed-empty-node.conllu235 B
- self-cycle-head.conllu190 B
- invalid-range.conllu375 B
- uppercase-deps-deprel.conllu206 B
- multiword-with-pos.conllu407 B
- empty-node-without-dependent.conllu251 B
- uppercase-deprel.conllu184 B
- invalid-deps-order.conllu409 B
- missing-space-after.conllu176 B
- extra-field.conllu130 B
- invalid-range-format.conllu380 B
- duplicate-id.conllu171 B
- deprel-not-empty-in-empty.conllu233 B
- misplaced-comment-mid.conllu401 B
- misordered-multiword.conllu392 B
- lowercase-value.conllu237 B
- valid
- maximal-empty-node.conllu273 B
- whitespace.conllu294 B
- multiple-features.conllu295 B
- id_test_part2.conllu375 B
- empty-nodes.conllu324 B
- id_test_part1.conllu375 B
- tanl.conllu673 B
- empty-file.conllu0 B
- minimal-empty-node.conllu239 B
- layered-features.conllu272 B
- nonvalid
- README.md11 kB
- save_evaluation_logs.sh962 B
- conllu-remove-enhanced-deps.pl443 B
- conllu-tenfold.pl2 kB
- mergept.pl2 kB
- normalize_unicode.pl511 B
- Graph.pm12 kB
- data
- deprel.shopen311 B
- edeprel.ta2 kB
- tokens_w_space.ud27 B
- edeprel.ar27 kB
- edeprel.akk22 B
- tokens_w_space.br457 B
- edeprel.sv4 kB
- tokens_w_space.koi86 B
- docdeps.json208 kB
- edeprel.pl21 kB
- tokens_w_space.kk1 kB
- tokens_w_space.nl158 B
- edeprel.sk3 kB
- cpos.ud79 B
- edeprel.cs28 kB
- edeprel.lv1023 B
- edeprel.it3 kB
- edeprel.fr430 B
- edeprel.lt2 kB
- edeprel.ru14 kB
- tokens_w_space.am82 B
- deprels.json641 kB
- tokens_w_space.sv131 B
- edeprel.fi8 kB
- tokens_w_space.myv82 B
- tokens_w_space.mdf82 B
- tokens_w_space.pl366 B
- edeprel.uk5 kB
- feats.json874 kB
- tokens_w_space.akk246 B
- tokens_w_space.gun0 B
- tokens_w_space.vi3 B
- edeprel.ud4 B
- deprel.ud237 B
- tokens_w_space.kpv86 B
- tokens_w_space.fro10 B
- data.json319 kB
- edeprel.ojp6 B
- tokens_w_space.shopen9 B
- feat_val.shopen2 kB
- edeprel.et10 kB
- tokens_w_space.kmr277 B
- docfeats.json937 kB
- tokens_w_space.fr10 B
- tokens_w_space.lv112 B
- tokens_w_space.sms151 B
- edeprel.en5 kB
- tokens_w_space.sjo1 kB
- tokens_w_space.lt1 kB
- README.md905 B
- edeprel.bg2 kB
- edeprel.be6 kB
- tokens_w_space.apu123 B
- edeprel.nl6 kB
- tokens_w_space.fi78 B
- edeprel.lzh76 B
- generate_treebank_hub.pl1 kB
- check_overlaps.pl1 kB
- conllu_to_text.pl9 kB
- survey_enhancements.pl7 kB
- conllu_align_tokens.pl6 kB
- enhanced_collapse_empty_nodes.pl8 kB
- check_files.pl66 kB
- klcpos3.pl1 kB