Files in this item
Download all files in item (565.97 MB)- Name
- ud-treebanks-v2.10.tgz
- Size
- 470.62 MB
- Format
- application/x-gzip
- Description
- Treebank data
- MD5
- 11e388bc743839ce6f2bdd66957f41e6
- ud-treebanks-v2.10
- UD_English-PUD
- stats.xml8 kB
- en_pud-ud-test.conllu1 MB
- README.md6 kB
- en_pud-ud-test.txt109 kB
- LICENSE.txt19 kB
- UD_Telugu-MTG
- te_mtg-ud-test.txt10 kB
- te_mtg-ud-train.conllu494 kB
- te_mtg-ud-dev.conllu64 kB
- stats.xml3 kB
- te_mtg-ud-test.conllu70 kB
- LICENSE.txt202 B
- README.txt1 kB
- te_mtg-ud-train.txt72 kB
- te_mtg-ud-dev.txt9 kB
- UD_Finnish-PUD
- stats.xml17 kB
- README.txt2 kB
- fi_pud-ud-test.txt119 kB
- LICENSE.txt202 B
- fi_pud-ud-test.conllu1 MB
- UD_Makurap-TuDeT
- stats.xml4 kB
- README.md1 kB
- mpu_tudet-ud-test.txt798 B
- LICENSE.txt202 B
- mpu_tudet-ud-test.conllu9 kB
- UD_Swedish-Talbanken
- sv_talbanken-ud-test.txt122 kB
- README.md7 kB
- sv_talbanken-ud-train.txt402 kB
- stats.xml9 kB
- LICENSE.txt20 kB
- sv_talbanken-ud-train.conllu5 MB
- sv_talbanken-ud-dev.conllu834 kB
- sv_talbanken-ud-dev.txt58 kB
- sv_talbanken-ud-test.conllu1 MB
- UD_Romanian-RRT
- README.md5 kB
- ro_rrt-ud-dev.txt98 kB
- ro_rrt-ud-train.conllu13 MB
- stats.xml12 kB
- LICENSE.txt66 B
- ro_rrt-ud-dev.conllu1 MB
- ro_rrt-ud-test.conllu1 MB
- ro_rrt-ud-train.txt1 MB
- ro_rrt-ud-test.txt94 kB
- UD_Czech-CLTT
- cs_cltt-ud-dev.conllu483 kB
- cs_cltt-ud-test.txt29 kB
- README.md2 kB
- cs_cltt-ud-train.txt195 kB
- cs_cltt-ud-dev.txt33 kB
- stats.xml13 kB
- cs_cltt-ud-train.conllu2 MB
- LICENSE.txt265 B
- cs_cltt-ud-test.conllu416 kB
- UD_Gothic-PROIEL
- got_proiel-ud-train.conllu3 MB
- README.md2 kB
- got_proiel-ud-test.txt64 kB
- got_proiel-ud-dev.conllu930 kB
- got_proiel-ud-train.txt221 kB
- stats.xml9 kB
- LICENSE.txt279 B
- got_proiel-ud-dev.txt62 kB
- got_proiel-ud-test.conllu946 kB
- UD_Kiche-IU
- stats.xml11 kB
- quc_iu-ud-test.conllu823 kB
- README.md1 kB
- quc_iu-ud-test.txt46 kB
- LICENSE.txt202 B
- UD_Swedish-LinES
- sv_lines-ud-train.conllu4 MB
- sv_lines-ud-dev.conllu1 MB
- sv_lines-ud-train.txt302 kB
- sv_lines-ud-dev.txt101 kB
- sv_lines-ud-test.conllu1 MB
- stats.xml9 kB
- sv_lines-ud-test.txt92 kB
- LICENSE.txt18 kB
- README.txt7 kB
- UD_German-GSD
- README.md8 kB
- de_gsd-ud-dev.conllu881 kB
- de_gsd-ud-dev.txt72 kB
- de_gsd-ud-train.txt1 MB
- de_gsd-ud-test.conllu1 MB
- stats.xml11 kB
- de_gsd-ud-train.conllu18 MB
- LICENSE.txt202 B
- de_gsd-ud-test.txt97 kB
- UD_Komi_Permyak-UH
- stats.xml14 kB
- README.md6 kB
- koi_uh-ud-test.conllu99 kB
- LICENSE.txt202 B
- koi_uh-ud-test.txt8 kB
- UD_Pomak-Philotis
- README.md2 kB
- qpm_philotis-ud-train.conllu5 MB
- qpm_philotis-ud-test.txt45 kB
- qpm_philotis-ud-train.txt357 kB
- qpm_philotis-ud-dev.txt45 kB
- qpm_philotis-ud-test.conllu695 kB
- qpm_philotis-ud-dev.conllu691 kB
- stats.xml12 kB
- LICENSE.txt417 B
- UD_Lithuanian-HSE
- lt_hse-ud-dev.txt6 kB
- README.md2 kB
- lt_hse-ud-test.conllu88 kB
- lt_hse-ud-train.txt20 kB
- lt_hse-ud-test.txt6 kB
- lt_hse-ud-train.conllu255 kB
- stats.xml10 kB
- LICENSE.txt202 B
- lt_hse-ud-dev.conllu87 kB
- UD_Japanese-PUDLUW
- stats.xml4 kB
- README.md5 kB
- ja_pudluw-ud-test.txt138 kB
- LICENSE.txt202 B
- ja_pudluw-ud-test.conllu4 MB
- UD_Turkish_German-SAGT
- qtd_sagt-ud-train.conllu770 kB
- qtd_sagt-ud-test.txt77 kB
- README.md6 kB
- qtd_sagt-ud-train.txt55 kB
- qtd_sagt-ud-dev.conllu988 kB
- qtd_sagt-ud-test.conllu1 MB
- qtd_sagt-ud-dev.txt71 kB
- stats.xml15 kB
- LICENSE.txt202 B
- UD_Chinese-PUD
- stats.xml4 kB
- zh_pud-ud-test.conllu1 MB
- README.md5 kB
- zh_pud-ud-test.txt101 kB
- LICENSE.txt19 kB
- UD_Tamil-TTB
- README.md4 kB
- ta_ttb-ud-dev.txt24 kB
- ta_ttb-ud-dev.conllu225 kB
- ta_ttb-ud-train.conllu1 MB
- ta_ttb-ud-train.txt123 kB
- stats.xml16 kB
- ta_ttb-ud-test.conllu353 kB
- ta_ttb-ud-test.txt37 kB
- LICENSE.txt280 B
- UD_Teko-TuDeT
- stats.xml7 kB
- eme_tudet-ud-test.conllu22 kB
- eme_tudet-ud-test.txt1 kB
- README.md1 kB
- LICENSE.txt202 B
- UD_English-LinES
- en_lines-ud-test.conllu1013 kB
- en_lines-ud-train.conllu3 MB
- en_lines-ud-test.txt83 kB
- en_lines-ud-dev.conllu1 MB
- stats.xml8 kB
- en_lines-ud-train.txt272 kB
- README.txt7 kB
- LICENSE.txt18 kB
- en_lines-ud-dev.txt91 kB
- UD_Latin-UDante
- la_udante-ud-train.conllu2 MB
- README.md8 kB
- la_udante-ud-dev.conllu1 MB
- la_udante-ud-train.txt170 kB
- stats.xml19 kB
- la_udante-ud-test.txt78 kB
- la_udante-ud-dev.txt67 kB
- LICENSE.txt202 B
- la_udante-ud-test.conllu1 MB
- UD_Buryat-BDT
- stats.xml12 kB
- README.txt1 kB
- bxr_bdt-ud-train.conllu10 kB
- bxr_bdt-ud-train.txt1 kB
- LICENSE.txt202 B
- bxr_bdt-ud-test.conllu699 kB
- bxr_bdt-ud-test.txt114 kB
- UD_Italian-MarkIT
- it_markit-ud-dev.txt54 kB
- README.md1 kB
- it_markit-ud-train.txt103 kB
- it_markit-ud-test.txt52 kB
- stats.xml8 kB
- it_markit-ud-train.conllu1 MB
- LICENSE.txt188 B
- it_markit-ud-test.conllu644 kB
- it_markit-ud-dev.conllu649 kB
- UD_English-GUMReddit
- README.md23 kB
- en_gumreddit-ud-train.txt23 kB
- en_gumreddit-ud-train.conllu1 MB
- en_gumreddit-ud-dev.conllu168 kB
- get_text.py26 kB
- stats.xml6 kB
- en_gumreddit-ud-dev.txt3 kB
- en_gumreddit-ud-test.txt3 kB
- LICENSE.txt313 B
- en_gumreddit-ud-test.conllu169 kB
- UD_Guarani-OldTuDeT
- stats.xml8 kB
- README.md2 kB
- gn_oldtudet-ud-test.txt1 kB
- LICENSE.txt202 B
- gn_oldtudet-ud-test.conllu18 kB
- UD_Norwegian-Bokmaal
- README.md6 kB
- no_bokmaal-ud-dev.txt195 kB
- no_bokmaal-ud-train.txt1 MB
- no_bokmaal-ud-test.txt161 kB
- no_bokmaal-ud-train.conllu14 MB
- stats.xml9 kB
- no_bokmaal-ud-test.conllu1 MB
- no_bokmaal-ud-dev.conllu2 MB
- LICENSE.txt68 B
- UD_French-FQB
- stats.xml8 kB
- fr_fqb-ud-test.conllu1 MB
- README.md3 kB
- fr_fqb-ud-test.txt117 kB
- LICENSE.txt14 kB
- UD_South_Levantine_Arabic-MADAR
- stats.xml4 kB
- README.md2 kB
- ajp_madar-ud-test.conllu42 kB
- LICENSE.txt202 B
- ajp_madar-ud-test.txt5 kB
- UD_Welsh-CCG
- cy_ccg-ud-test.txt79 kB
- cy_ccg-ud-test.conllu1 MB
- README.md1 kB
- cy_ccg-ud-dev.txt42 kB
- cy_ccg-ud-train.txt89 kB
- cy_ccg-ud-train.conllu1 MB
- cy_ccg-ud-dev.conllu591 kB
- stats.xml8 kB
- LICENSE.txt202 B
- UD_Chinese-GSDSimp
- zh_gsdsimp-ud-test.txt53 kB
- README.md2 kB
- zh_gsdsimp-ud-dev.conllu680 kB
- zh_gsdsimp-ud-train.txt433 kB
- zh_gsdsimp-ud-train.conllu5 MB
- stats.xml5 kB
- LICENSE.txt202 B
- zh_gsdsimp-ud-dev.txt55 kB
- zh_gsdsimp-ud-test.conllu647 kB
- UD_Galician-CTG
- gl_ctg-ud-dev.conllu1 MB
- gl_ctg-ud-test.conllu1 MB
- gl_ctg-ud-dev.txt155 kB
- gl_ctg-ud-train.conllu4 MB
- gl_ctg-ud-test.txt156 kB
- stats.xml3 kB
- gl_ctg-ud-train.txt413 kB
- LICENSE.txt173 B
- README.txt2 kB
- UD_Old_East_Slavic-TOROT
- README.md3 kB
- orv_torot-ud-test.txt150 kB
- orv_torot-ud-train.txt1 MB
- orv_torot-ud-train.conllu11 MB
- orv_torot-ud-dev.conllu1 MB
- orv_torot-ud-dev.txt151 kB
- orv_torot-ud-test.conllu1 MB
- stats.xml12 kB
- LICENSE.txt197 B
- UD_Armenian-BSUT
- README.md2 kB
- hy_bsut-ud-dev.txt119 kB
- hy_bsut-ud-dev.conllu1 MB
- hy_bsut-ud-train.txt220 kB
- hy_bsut-ud-train.conllu2 MB
- stats.xml23 kB
- LICENSE.txt202 B
- hy_bsut-ud-test.conllu1 MB
- hy_bsut-ud-test.txt109 kB
- UD_French-PUD
- fr_pud-ud-test.txt130 kB
- stats.xml8 kB
- fr_pud-ud-test.conllu1 MB
- README.md5 kB
- LICENSE.txt19 kB
- UD_Indonesian-GSD
- README.md6 kB
- id_gsd-ud-test.txt69 kB
- id_gsd-ud-dev.conllu969 kB
- id_gsd-ud-train.conllu7 MB
- stats.xml8 kB
- LICENSE.txt202 B
- id_gsd-ud-test.conllu903 kB
- id_gsd-ud-dev.txt73 kB
- id_gsd-ud-train.txt573 kB
- UD_Wolof-WTB
- wo_wtb-ud-train.txt100 kB
- README.md2 kB
- wo_wtb-ud-test.conllu637 kB
- wo_wtb-ud-dev.conllu625 kB
- stats.xml11 kB
- wo_wtb-ud-train.conllu1 MB
- wo_wtb-ud-dev.txt43 kB
- LICENSE.txt202 B
- wo_wtb-ud-test.txt44 kB
- UD_Turkish-Tourism
- README.md1 kB
- tr_tourism-ud-test.conllu715 kB
- tr_tourism-ud-dev.conllu747 kB
- tr_tourism-ud-train.conllu5 MB
- stats.xml13 kB
- LICENSE.txt202 B
- tr_tourism-ud-train.txt477 kB
- tr_tourism-ud-dev.txt69 kB
- tr_tourism-ud-test.txt67 kB
- UD_Spanish-GSD
- README.md4 kB
- es_gsd-ud-train.conllu22 MB
- es_gsd-ud-test.conllu714 kB
- es_gsd-ud-test.txt61 kB
- es_gsd-ud-train.txt1 MB
- es_gsd-ud-dev.conllu2 MB
- es_gsd-ud-dev.txt191 kB
- stats.xml10 kB
- LICENSE.txt202 B
- UD_Persian-PerDT
- fa_perdt-ud-train.conllu28 MB
- README.md4 kB
- fa_perdt-ud-dev.conllu1 MB
- fa_perdt-ud-dev.txt206 kB
- fa_perdt-ud-test.txt198 kB
- fa_perdt-ud-train.txt3 MB
- stats.xml7 kB
- LICENSE.txt19 kB
- fa_perdt-ud-test.conllu1 MB
- UD_Tagalog-Ugnayan
- stats.xml3 kB
- README.md1 kB
- tl_ugnayan-ud-test.txt5 kB
- tl_ugnayan-ud-test.conllu53 kB
- LICENSE.txt219 B
- UD_Italian-TWITTIRO
- README.md3 kB
- it_twittiro-ud-test.conllu184 kB
- it_twittiro-ud-test.txt15 kB
- it_twittiro-ud-train.txt120 kB
- it_twittiro-ud-train.conllu1 MB
- stats.xml9 kB
- it_twittiro-ud-dev.conllu188 kB
- it_twittiro-ud-dev.txt15 kB
- LICENSE.txt202 B
- UD_English-Atis
- en_atis-ud-test.conllu334 kB
- README.md1 kB
- en_atis-ud-train.conllu2 MB
- en_atis-ud-test.txt36 kB
- en_atis-ud-train.txt271 kB
- en_atis-ud-dev.txt36 kB
- stats.xml6 kB
- LICENSE.txt202 B
- en_atis-ud-dev.conllu332 kB
- UD_Coptic-Scriptorium
- README.md11 kB
- cop_scriptorium-ud-test.conllu955 kB
- cop_scriptorium-ud-test.txt80 kB
- cop_scriptorium-ud-train.conllu2 MB
- cop_scriptorium-ud-dev.conllu1012 kB
- stats.xml8 kB
- LICENSE.txt538 B
- cop_scriptorium-ud-dev.txt85 kB
- cop_scriptorium-ud-train.txt234 kB
- UD_Polish-LFG
- pl_lfg-ud-dev.txt74 kB
- pl_lfg-ud-train.txt596 kB
- README.md6 kB
- pl_lfg-ud-test.txt74 kB
- pl_lfg-ud-dev.conllu1 MB
- pl_lfg-ud-test.conllu1 MB
- stats.xml14 kB
- LICENSE.txt34 kB
- pl_lfg-ud-train.conllu11 MB
- UD_Russian-GSD
- ru_gsd-ud-dev.conllu1 MB
- README.md1 kB
- ru_gsd-ud-test.conllu1003 kB
- ru_gsd-ud-dev.txt123 kB
- ru_gsd-ud-train.txt794 kB
- ru_gsd-ud-test.txt120 kB
- stats.xml13 kB
- ru_gsd-ud-train.conllu6 MB
- LICENSE.txt202 B
- UD_Komi_Zyrian-Lattice
- stats.xml25 kB
- README.md7 kB
- LICENSE.txt202 B
- kpv_lattice-ud-test.txt79 kB
- kpv_lattice-ud-test.conllu741 kB
- UD_Estonian-EWT
- et_ewt-ud-train.txt306 kB
- README.md3 kB
- et_ewt-ud-dev.txt54 kB
- et_ewt-ud-dev.conllu693 kB
- et_ewt-ud-test.conllu920 kB
- et_ewt-ud-test.txt76 kB
- et_ewt-ud-train.conllu3 MB
- stats.xml12 kB
- LICENSE.txt202 B
- UD_Yakut-YKTDT
- stats.xml9 kB
- README.md2 kB
- sah_yktdt-ud-test.txt6 kB
- LICENSE.txt202 B
- sah_yktdt-ud-test.conllu51 kB
- UD_Indonesian-CSUI
- stats.xml7 kB
- README.md3 kB
- id_csui-ud-train.txt108 kB
- id_csui-ud-test.txt59 kB
- LICENSE.txt202 B
- id_csui-ud-train.conllu1 MB
- id_csui-ud-test.conllu589 kB
- UD_Lithuanian-ALKSNIS
- lt_alksnis-ud-train.txt317 kB
- README.md4 kB
- lt_alksnis-ud-test.conllu1 MB
- lt_alksnis-ud-train.conllu4 MB
- lt_alksnis-ud-dev.conllu1 MB
- lt_alksnis-ud-test.txt69 kB
- stats.xml13 kB
- LICENSE.txt202 B
- lt_alksnis-ud-dev.txt78 kB
- UD_Dutch-Alpino
- nl_alpino-ud-test.conllu902 kB
- nl_alpino-ud-train.conllu14 MB
- nl_alpino-ud-train.txt1016 kB
- nl_alpino-ud-dev.conllu942 kB
- nl_alpino-ud-dev.txt62 kB
- stats.xml7 kB
- LICENSE.txt19 kB
- README.txt5 kB
- nl_alpino-ud-test.txt64 kB
- UD_Romanian-Nonstandard
- ro_nonstandard-ud-test.txt104 kB
- README.md9 kB
- ro_nonstandard-ud-dev.txt91 kB
- ro_nonstandard-ud-dev.conllu1 MB
- ro_nonstandard-ud-test.conllu1 MB
- ro_nonstandard-ud-train.txt2 MB
- ro_nonstandard-ud-train.conllu44 MB
- stats.xml12 kB
- LICENSE.txt202 B
- UD_Apurina-UFPA
- stats.xml8 kB
- README.md2 kB
- LICENSE.txt202 B
- apu_ufpa-ud-test.conllu95 kB
- apu_ufpa-ud-test.txt4 kB
- UD_Livvi-KKPP
- stats.xml10 kB
- olo_kkpp-ud-train.txt808 B
- README.md4 kB
- olo_kkpp-ud-test.conllu103 kB
- olo_kkpp-ud-test.txt9 kB
- LICENSE.txt202 B
- olo_kkpp-ud-train.conllu15 kB
- UD_German-PUD
- stats.xml9 kB
- README.md5 kB
- LICENSE.txt19 kB
- de_pud-ud-test.txt126 kB
- de_pud-ud-test.conllu1 MB
- UD_Turkish-Kenet
- tr_kenet-ud-dev.txt122 kB
- README.md1 kB
- tr_kenet-ud-train.conllu9 MB
- tr_kenet-ud-test.txt123 kB
- tr_kenet-ud-dev.conllu1 MB
- stats.xml13 kB
- LICENSE.txt202 B
- tr_kenet-ud-train.txt989 kB
- tr_kenet-ud-test.conllu1 MB
- UD_Akkadian-PISANDUB
- stats.xml3 kB
- README.md871 B
- akk_pisandub-ud-test.txt15 kB
- LICENSE.txt202 B
- akk_pisandub-ud-test.conllu99 kB
- UD_Galician-TreeGal
- stats.xml9 kB
- README.md5 kB
- gl_treegal-ud-test.txt50 kB
- gl_treegal-ud-train.conllu1 MB
- LICENSE.txt14 kB
- gl_treegal-ud-train.txt76 kB
- gl_treegal-ud-test.conllu670 kB
- UD_Thai-PUD
- stats.xml4 kB
- th_pud-ud-test.conllu1 MB
- README.md5 kB
- LICENSE.txt19 kB
- th_pud-ud-test.txt281 kB
- UD_Latin-Perseus
- stats.xml8 kB
- la_perseus-ud-train.conllu1 MB
- README.md3 kB
- la_perseus-ud-test.conllu961 kB
- la_perseus-ud-test.txt61 kB
- LICENSE.txt279 B
- la_perseus-ud-train.txt104 kB
- UD_Old_Turkish-Tonqq
- stats.xml2 kB
- otk_tonqq-ud-test.txt1 kB
- README.md1 kB
- otk_tonqq-ud-test.conllu10 kB
- LICENSE.txt6 kB
- UD_Hindi_English-HIENCS
- README.md3 kB
- qhe_hiencs-ud-train.conllu681 kB
- qhe_hiencs-ud-test.conllu104 kB
- qhe_hiencs-ud-test.txt6 kB
- qhe_hiencs-ud-train.txt39 kB
- qhe_hiencs-ud-dev.conllu107 kB
- merge
- tweet_ids_dev.txt4 kB
- train-annot.json1 MB
- EMOTICONS3 kB
- EDITS6 kB
- test-annot.json229 kB
- NONBREAKING_PREFIXES812 B
- DOMAINS293 B
- tweet_ids_test.txt4 kB
- tweet_ids_train.txt26 kB
- dev-annot.json236 kB
- stats.xml2 kB
- LICENSE.txt202 B
- crawl_tweets.py18 kB
- qhe_hiencs-ud-dev.txt6 kB
- UD_Italian-PoSTWITA
- it_postwita-ud-test.conllu759 kB
- it_postwita-ud-train.txt526 kB
- README.md3 kB
- it_postwita-ud-dev.conllu732 kB
- it_postwita-ud-train.conllu5 MB
- stats.xml9 kB
- LICENSE.txt18 kB
- it_postwita-ud-dev.txt64 kB
- it_postwita-ud-test.txt67 kB
- UD_Latvian-LVTB
- README.md6 kB
- lv_lvtb-ud-dev.txt197 kB
- lv_lvtb-ud-test.conllu3 MB
- lv_lvtb-ud-dev.conllu3 MB
- lv_lvtb-ud-test.txt216 kB
- stats.xml13 kB
- lv_lvtb-ud-train.txt1 MB
- LICENSE.txt19 kB
- lv_lvtb-ud-train.conllu23 MB
- UD_Low_Saxon-LSDC
- stats.xml10 kB
- README.md4 kB
- nds_lsdc-ud-test.conllu209 kB
- LICENSE.txt202 B
- nds_lsdc-ud-test.txt11 kB
- UD_Karelian-KKPP
- stats.xml10 kB
- krl_kkpp-ud-test.conllu220 kB
- README.md2 kB
- LICENSE.txt202 B
- krl_kkpp-ud-test.txt21 kB
- UD_Polish-PDB
- pl_pdb-ud-train.txt1 MB
- README.md5 kB
- pl_pdb-ud-dev.conllu3 MB
- pl_pdb-ud-test.txt203 kB
- pl_pdb-ud-train.conllu27 MB
- pl_pdb-ud-dev.txt210 kB
- stats.xml17 kB
- LICENSE.txt384 B
- pl_pdb-ud-test.conllu3 MB
- UD_Croatian-SET
- hr_set-ud-dev.conllu1 MB
- README.md5 kB
- hr_set-ud-dev.txt130 kB
- hr_set-ud-train.conllu11 MB
- hr_set-ud-train.txt901 kB
- stats.xml11 kB
- hr_set-ud-test.txt143 kB
- LICENSE.txt233 B
- hr_set-ud-test.conllu1 MB
- UD_Ancient_Hebrew-PTNK
- README.md1 kB
- hbo_ptnk-ud-dev.txt98 kB
- hbo_ptnk-ud-dev.conllu841 kB
- hbo_ptnk-ud-test.conllu841 kB
- hbo_ptnk-ud-train.txt172 kB
- stats.xml10 kB
- hbo_ptnk-ud-train.conllu1 MB
- LICENSE.txt202 B
- hbo_ptnk-ud-test.txt95 kB
- UD_North_Sami-Giella
- stats.xml10 kB
- README.md2 kB
- sme_giella-ud-train.txt107 kB
- sme_giella-ud-train.conllu1 MB
- LICENSE.txt202 B
- sme_giella-ud-test.conllu668 kB
- sme_giella-ud-test.txt70 kB
- UD_Khunsari-AHA
- stats.xml4 kB
- README.md1 kB
- kfm_aha-ud-test.conllu6 kB
- LICENSE.txt202 B
- kfm_aha-ud-test.txt542 B
- UD_Maltese-MUDT
- mt_mudt-ud-dev.txt55 kB
- README.md6 kB
- mt_mudt-ud-train.conllu1020 kB
- mt_mudt-ud-test.txt59 kB
- mt_mudt-ud-dev.conllu454 kB
- stats.xml3 kB
- LICENSE.txt202 B
- mt_mudt-ud-train.txt123 kB
- mt_mudt-ud-test.conllu489 kB
- UD_Madi-Jarawara
- stats.xml5 kB
- jaa_jarawara-ud-test.conllu7 kB
- README.md1 kB
- jaa_jarawara-ud-test.txt542 B
- LICENSE.txt202 B
- UD_Persian-Seraji
- fa_seraji-ud-dev.conllu989 kB
- README.md5 kB
- fa_seraji-ud-test.txt134 kB
- fa_seraji-ud-train.conllu7 MB
- fa_seraji-ud-test.conllu1021 kB
- stats.xml9 kB
- fa_seraji-ud-train.txt995 kB
- LICENSE.txt110 B
- fa_seraji-ud-dev.txt133 kB
- UD_Indonesian-PUD
- stats.xml8 kB
- README.md8 kB
- id_pud-ud-test.txt117 kB
- LICENSE.txt19 kB
- id_pud-ud-test.conllu1 MB
- UD_Belarusian-HSE
- be_hse-ud-test.txt180 kB
- README.md6 kB
- be_hse-ud-train.txt2 MB
- be_hse-ud-dev.conllu1 MB
- be_hse-ud-train.conllu26 MB
- be_hse-ud-test.conllu1 MB
- stats.xml15 kB
- LICENSE.txt1021 B
- be_hse-ud-dev.txt164 kB
- UD_Norwegian-Nynorsk
- no_nynorsk-ud-dev.conllu1 MB
- README.md4 kB
- no_nynorsk-ud-test.txt135 kB
- no_nynorsk-ud-dev.txt166 kB
- stats.xml9 kB
- no_nynorsk-ud-test.conllu1 MB
- LICENSE.txt68 B
- no_nynorsk-ud-train.txt1 MB
- no_nynorsk-ud-train.conllu14 MB
- UD_Turkish-BOUN
- README.md3 kB
- tr_boun-ud-dev.txt81 kB
- tr_boun-ud-dev.conllu915 kB
- tr_boun-ud-train.txt660 kB
- tr_boun-ud-test.conllu918 kB
- tr_boun-ud-train.conllu7 MB
- stats.xml12 kB
- LICENSE.txt202 B
- tr_boun-ud-test.txt81 kB
- UD_Old_East_Slavic-Birchbark
- README.md4 kB
- orv_birchbark-ud-dev.txt89 kB
- orv_birchbark-ud-dev.conllu1 MB
- orv_birchbark-ud-train.txt66 kB
- orv_birchbark-ud-test.txt90 kB
- orv_birchbark-ud-test.conllu1 MB
- stats.xml14 kB
- LICENSE.txt202 B
- orv_birchbark-ud-train.conllu1 MB
- UD_Guajajara-TuDeT
- stats.xml12 kB
- README.md3 kB
- gub_tudet-ud-test.txt46 kB
- gub_tudet-ud-test.conllu683 kB
- LICENSE.txt202 B
- UD_Norwegian-NynorskLIA
- no_nynorsklia-ud-test.txt42 kB
- no_nynorsklia-ud-dev.conllu593 kB
- no_nynorsklia-ud-test.conllu594 kB
- stats.xml8 kB
- LICENSE.txt202 B
- README.txt1 kB
- no_nynorsklia-ud-dev.txt42 kB
- no_nynorsklia-ud-train.txt147 kB
- no_nynorsklia-ud-train.conllu2 MB
- UD_Ligurian-GLT
- stats.xml8 kB
- lij_glt-ud-train.txt918 B
- lij_glt-ud-test.conllu411 kB
- README.md1 kB
- lij_glt-ud-train.conllu14 kB
- LICENSE.txt3 kB
- lij_glt-ud-test.txt27 kB
- UD_Bulgarian-BTB
- bg_btb-ud-dev.txt155 kB
- bg_btb-ud-train.txt1 MB
- bg_btb-ud-test.conllu1 MB
- bg_btb-ud-train.conllu11 MB
- stats.xml12 kB
- bg_btb-ud-test.txt152 kB
- LICENSE.txt327 B
- README.txt7 kB
- bg_btb-ud-dev.conllu1 MB
- UD_Romanian-SiMoNERo
- ro_simonero-ud-test.conllu1 MB
- README.md2 kB
- ro_simonero-ud-dev.conllu1 MB
- ro_simonero-ud-test.txt93 kB
- ro_simonero-ud-train.txt719 kB
- ro_simonero-ud-dev.txt91 kB
- stats.xml11 kB
- ro_simonero-ud-train.conllu9 MB
- LICENSE.txt202 B
- UD_Spanish-PUD
- stats.xml10 kB
- es_pud-ud-test.conllu1 MB
- README.md5 kB
- LICENSE.txt19 kB
- es_pud-ud-test.txt123 kB
- UD_Cebuano-GJA
- ceb_gja-ud-test.conllu99 kB
- stats.xml7 kB
- README.md1 kB
- LICENSE.txt202 B
- ceb_gja-ud-test.txt5 kB
- UD_Tatar-NMCTT
- stats.xml11 kB
- README.md1 kB
- tt_nmctt-ud-test.txt17 kB
- LICENSE.txt202 B
- tt_nmctt-ud-test.conllu141 kB
- UD_Serbian-SET
- sr_set-ud-test.txt67 kB
- README.md1 kB
- sr_set-ud-train.conllu5 MB
- sr_set-ud-dev.txt68 kB
- stats.xml11 kB
- sr_set-ud-test.conllu847 kB
- LICENSE.txt230 B
- sr_set-ud-train.txt432 kB
- sr_set-ud-dev.conllu888 kB
- UD_Chinese-HK
- stats.xml3 kB
- README.md4 kB
- LICENSE.txt202 B
- zh_hk-ud-test.conllu482 kB
- zh_hk-ud-test.txt41 kB
- UD_Marathi-UFAL
- stats.xml14 kB
- UD_Arabic-PADT
- README.md6 kB
- ar_padt-ud-dev.conllu5 MB
- ar_padt-ud-train.conllu38 MB
- ar_padt-ud-train.txt1 MB
- ar_padt-ud-test.txt234 kB
- stats.xml11 kB
- ar_padt-ud-test.conllu4 MB
- ar_padt-ud-dev.txt241 kB
- LICENSE.txt19 kB
- UD_English-Pronouns
- stats.xml5 kB
- en_pronouns-ud-test.conllu138 kB
- README.md9 kB
- LICENSE.txt202 B
- en_pronouns-ud-test.txt7 kB
- UD_Upper_Sorbian-UFAL
- stats.xml11 kB
- README.md1 kB
- hsb_ufal-ud-test.conllu730 kB
- hsb_ufal-ud-train.conllu31 kB
- hsb_ufal-ud-test.txt64 kB
- LICENSE.txt202 B
- hsb_ufal-ud-train.txt2 kB
- UD_Ancient_Greek-PROIEL
- README.md2 kB
- grc_proiel-ud-train.conllu19 MB
- grc_proiel-ud-dev.txt159 kB
- grc_proiel-ud-test.conllu1 MB
- grc_proiel-ud-test.txt154 kB
- stats.xml13 kB
- LICENSE.txt279 B
- grc_proiel-ud-train.txt2 MB
- grc_proiel-ud-dev.conllu1 MB
- UD_Chinese-GSD
- README.md2 kB
- zh_gsd-ud-test.conllu647 kB
- zh_gsd-ud-train.conllu5 MB
- zh_gsd-ud-train.txt433 kB
- zh_gsd-ud-dev.txt55 kB
- zh_gsd-ud-dev.conllu680 kB
- stats.xml5 kB
- zh_gsd-ud-test.txt53 kB
- LICENSE.txt202 B
- UD_Old_Church_Slavonic-PROIEL
- cu_proiel-ud-train.txt369 kB
- README.md2 kB
- cu_proiel-ud-test.txt99 kB
- cu_proiel-ud-dev.conllu1 MB
- cu_proiel-ud-test.conllu1 MB
- cu_proiel-ud-train.conllu3 MB
- stats.xml12 kB
- LICENSE.txt279 B
- cu_proiel-ud-dev.txt97 kB
- UD_Russian-PUD
- stats.xml12 kB
- README.md5 kB
- LICENSE.txt19 kB
- ru_pud-ud-test.txt209 kB
- ru_pud-ud-test.conllu1 MB
- UD_Arabic-PUD
- stats.xml9 kB
- README.md5 kB
- ar_pud-ud-test.txt168 kB
- LICENSE.txt19 kB
- ar_pud-ud-test.conllu1 MB
- UD_Icelandic-PUD
- stats.xml9 kB
- is_pud-ud-test.txt119 kB
- README.md3 kB
- LICENSE.txt202 B
- is_pud-ud-test.conllu1 MB
- UD_Yupik-SLI
- stats.xml8 kB
- README.md2 kB
- ess_sli-ud-test.txt9 kB
- LICENSE.txt202 B
- ess_sli-ud-test.conllu302 kB
- UD_Mbya_Guarani-Dooley
- stats.xml7 kB
- gun_dooley-ud-test.conllu560 kB
- README.md3 kB
- LICENSE.txt202 B
- gun_dooley-ud-test.txt23 kB
- UD_French-GSD
- fr_gsd-ud-train.conllu21 MB
- README.md7 kB
- fr_gsd-ud-dev.conllu2 MB
- fr_gsd-ud-dev.txt184 kB
- stats.xml10 kB
- fr_gsd-ud-test.conllu626 kB
- LICENSE.txt202 B
- fr_gsd-ud-test.txt49 kB
- fr_gsd-ud-train.txt1 MB
- UD_Assyrian-AS
- stats.xml7 kB
- aii_as-ud-test.conllu31 kB
- aii_as-ud-test.txt4 kB
- README.md1 kB
- LICENSE.txt202 B
- UD_Chukchi-HSE
- stats.xml3 kB
- README.md4 kB
- ckt_hse-ud-test.txt72 kB
- LICENSE.txt202 B
- ckt_hse-ud-test.conllu793 kB
- UD_Albanian-TSA
- stats.xml8 kB
- sq_tsa-ud-test.conllu61 kB
- README.md1 kB
- sq_tsa-ud-test.txt5 kB
- LICENSE.txt202 B
- UD_Bhojpuri-BHTB
- bho_bhtb-ud-test.txt73 kB
- stats.xml11 kB
- README.md3 kB
- bho_bhtb-ud-test.conllu599 kB
- LICENSE.txt202 B
- UD_Hindi-PUD
- stats.xml9 kB
- hi_pud-ud-test.conllu2 MB
- README.md5 kB
- LICENSE.txt19 kB
- hi_pud-ud-test.txt281 kB
- UD_Greek-GDT
- README.md3 kB
- el_gdt-ud-train.txt440 kB
- el_gdt-ud-train.conllu3 MB
- el_gdt-ud-dev.txt107 kB
- el_gdt-ud-test.conllu951 kB
- el_gdt-ud-dev.conllu933 kB
- el_gdt-ud-test.txt110 kB
- stats.xml12 kB
- LICENSE.txt398 B
- UD_Latin-LLCT
- la_llct-ud-dev.conllu2 MB
- README.md6 kB
- la_llct-ud-test.conllu2 MB
- la_llct-ud-train.conllu16 MB
- stats.xml12 kB
- la_llct-ud-dev.txt136 kB
- LICENSE.txt202 B
- la_llct-ud-test.txt136 kB
- la_llct-ud-train.txt1 MB
- UD_Japanese-BCCWJ
- ja_bccwj-ud-train.txt902 kB
- ja_bccwj-ud-train.conllu67 MB
- ja_bccwj-ud-dev.txt177 kB
- ja_bccwj-ud-test.conllu12 MB
- merge
- dev_pos.pkl2 MB
- test_pos.pkl2 MB
- script
- lib.py5 kB
- restore_word_unit_bccwj.py7 kB
- convert_core_bccwj_pkl.py746 B
- misc_mapping.pkl23 MB
- merge.sh1 kB
- train_pos.pkl13 MB
- stats.xml2 kB
- LICENSE.txt18 kB
- README.txt3 kB
- ja_bccwj-ud-test.txt165 kB
- ja_bccwj-ud-dev.conllu13 MB
- UD_Latin-ITTB
- la_ittb-ud-train.txt2 MB
- README.md9 kB
- la_ittb-ud-dev.txt168 kB
- la_ittb-ud-test.conllu2 MB
- la_ittb-ud-dev.conllu2 MB
- stats.xml17 kB
- LICENSE.txt19 kB
- la_ittb-ud-test.txt169 kB
- la_ittb-ud-train.conllu35 MB
- UD_Armenian-ArmTDP
- README.md4 kB
- hy_armtdp-ud-train.conllu5 MB
- hy_armtdp-ud-dev.conllu694 kB
- hy_armtdp-ud-test.txt51 kB
- hy_armtdp-ud-dev.txt57 kB
- hy_armtdp-ud-train.txt434 kB
- stats.xml24 kB
- hy_armtdp-ud-test.conllu656 kB
- LICENSE.txt202 B
- UD_Vietnamese-VTB
- vi_vtb-ud-test.txt72 kB
- README.md1 kB
- vi_vtb-ud-train.txt127 kB
- vi_vtb-ud-train.conllu939 kB
- vi_vtb-ud-dev.txt69 kB
- stats.xml3 kB
- LICENSE.txt19 kB
- vi_vtb-ud-test.conllu545 kB
- vi_vtb-ud-dev.conllu522 kB
- UD_Akkadian-RIAO
- stats.xml9 kB
- README.md2 kB
- akk_riao-ud-test.txt148 kB
- akk_riao-ud-test.conllu1 MB
- LICENSE.txt21 kB
- UD_French-ParisStories
- stats.xml8 kB
- fr_parisstories-ud-train.txt81 kB
- README.md5 kB
- fr_parisstories-ud-train.conllu1 MB
- LICENSE.txt202 B
- fr_parisstories-ud-test.conllu664 kB
- fr_parisstories-ud-test.txt40 kB
- UD_Russian-Taiga
- ru_taiga-ud-train.conllu16 MB
- README.md5 kB
- ru_taiga-ud-test.conllu845 kB
- ru_taiga-ud-test.txt92 kB
- ru_taiga-ud-dev.txt99 kB
- ru_taiga-ud-dev.conllu888 kB
- ru_taiga-ud-train.txt1 MB
- stats.xml17 kB
- LICENSE.txt202 B
- UD_Icelandic-IcePaHC
- is_icepahc-ud-dev.conllu11 MB
- is_icepahc-ud-test.txt738 kB
- README.md6 kB
- is_icepahc-ud-dev.txt735 kB
- is_icepahc-ud-train.conllu58 MB
- stats.xml11 kB
- LICENSE.txt202 B
- is_icepahc-ud-train.txt3 MB
- is_icepahc-ud-test.conllu11 MB
- UD_English-PUD
- ... too many files ...0 B
- Name
- ud-documentation-v2.10.tgz
- Size
- 94.58 MB
- Format
- application/x-gzip
- Description
- Documentation
- MD5
- de1c43803b76598d84d6aad6a974304a
- ... too many files ...0 B
- ud-documentation-v2.10
- markdown-source
- _xnr
- index.md3 kB
- ext-feat-index.md122 kB
- _qtd
- _ti
- template-index.md1 kB
- _ha
- template-index.md1 kB
- _ne
- template-index.md1 kB
- _u-pos
- PRON.md2 kB
- ADV.md1 kB
- VERB.md1 kB
- NUM.md1 kB
- CCONJ.md719 B
- ADJ.md2 kB
- SCONJ.md1 kB
- SYM.md1 kB
- DET.md4 kB
- NOUN.md829 B
- PROPN.md1 kB
- INTJ.md1 kB
- PUNCT.md1013 B
- ADP.md2 kB
- AUX_.md1 kB
- X.md775 B
- PART.md1 kB
- obsolete_introductions.md1 kB
- how_to_start.md9 kB
- _kfm
- index.md2 kB
- resources
- jquery-1.11.3.min.js93 kB
- js-treex-view.min.js177 kB
- bootstrap-theme.min.css19 kB
- filesaver.min.js2 kB
- bootstrap.min.css114 kB
- blob.min.js2 kB
- conllu_viewer.css386 B
- bootstrap.min.js35 kB
- _mt
- index.md12 kB
- dep
- cop-expl.md304 B
- case-det.md460 B
- aux-neg.md1 kB
- aux-part.md318 B
- advmod-neg.md1 kB
- _hyw
- index.md17 kB
- feat
- AdpType.md1 kB
- Aspect.md4 kB
- NumForm.md1 kB
- Connegative.md2 kB
- LangId.md775 B
- Deixis-psor.md1 kB
- tokenization.md6 kB
- dep
- nmod-npmod.md3 kB
- case-loc.md2 kB
- aux-caus.md1 kB
- aux-ex.md1 kB
- iobj-agent.md2 kB
- flat-frac.md1 kB
- flat-dist.md1 kB
- nsubj-caus.md1 kB
- flat-range.md2 kB
- advcl-relcl.md1 kB
- introduction.md1 kB
- template-index.md1 kB
- pos
- PUNCT.md1 kB
- _urb
- index.md4 kB
- feat
- Person.md1013 B
- Number.md1003 B
- Aspect.md1 kB
- Case.md1 kB
- Intense.md733 B
- Tense.md1 kB
- Voice.md813 B
- Mood.md701 B
- Nomzr.md724 B
- Animacy.md979 B
- Rel.md1 kB
- _sw
- template-index.md2 kB
- _gl
- index.md4 kB
- feat
- Clitic.md995 B
- tokenization.md121 B
- introduction.md1 kB
- _koi
- index.md4 kB
- feat-index.md136 B
- feat
- NounType.md531 B
- NumType.md1 kB
- Reflex.md894 B
- Connegative.md670 B
- Person-psor.md1 kB
- Valency.md835 B
- Case.md7 kB
- Derivation.md2 kB
- dep-index.md142 B
- dep
- advcl-lcl.md710 B
- nmod-poss.md472 B
- xcomp-ds.md1 kB
- aux-neg.md1 kB
- advcl-mcl.md602 B
- advmod-tmod.md369 B
- nsubj-cop.md481 B
- advcl-tcl.md684 B
- advmod-deg.md345 B
- advmod-mmod.md492 B
- nmod-lmod.md606 B
- obl-lmod.md410 B
- aux-cnd.md457 B
- _pgl
- template-index.md1 kB
- conv-eng
- conv.py3 kB
- pick-tikz.py1 kB
- _pl
- dep
- xcomp-subj.md2 kB
- aux-imp.md889 B
- obl-orphan.md1 kB
- aux-cnd.md1 kB
- xcomp-obj.md1 kB
- advcl-relcl.md3 kB
- parataxis-obj.md1 kB
- nmod-flat.md1 kB
- det-numgov.md2 kB
- parataxis-insert.md2 kB
- ccomp-cleft.md2 kB
- nmod-pred.md1 kB
- flat-foreign.md1 kB
- cop-locat.md830 B
- obl-cmpr.md2 kB
- amod-flat.md1 kB
- discourse-intj.md1 kB
- advcl-cmpr.md1 kB
- discourse-emo.md1 kB
- xcomp-pred.md2 kB
- dep
- morphology.md94 B
- contributing.md13 kB
- _yo
- index.md7 kB
- introduction.md27 kB
- _ga
- index.md29 kB
- feat-index.md2 kB
- tokenization.md256 B
- feat
- Definite.md2 kB
- Aspect.md1 kB
- Number.md2 kB
- Abbr.md709 B
- Reflex.md598 B
- Foreign.md766 B
- Degree.md1 kB
- Tense.md1 kB
- Dialect.md1 kB
- Gender.md692 B
- VerbForm.md3 kB
- NounType.md1 kB
- Polarity.md1 kB
- Mood.md2 kB
- Poss.md2 kB
- Person.md3 kB
- Form.md5 kB
- PartType.md3 kB
- NumType.md1 kB
- PronType.md3 kB
- PrepForm.md4 kB
- Case.md2 kB
- introduction.md2 kB
- pos
- PRON.md2 kB
- ADV.md534 B
- VERB.md2 kB
- NUM.md988 B
- CCONJ.md796 B
- ADJ.md389 B
- SCONJ.md1 kB
- SYM.md310 B
- DET.md1012 B
- NOUN.md1 kB
- PROPN.md1 kB
- INTJ.md334 B
- PUNCT.md410 B
- ADP.md1 kB
- AUX_.md2 kB
- X.md637 B
- PART.md1 kB
- dep
- advcl.md2 kB
- obj.md2 kB
- nsubj.md744 B
- vocative.md1 kB
- mark-prt.md3 kB
- discourse-emo.md405 B
- mark.md3 kB
- compound-prt.md955 B
- xcomp.md2 kB
- flat.md4 kB
- compound.md2 kB
- flat-foreign.md1 kB
- csubj.md613 B
- parataxis-sentence.md568 B
- amod.md1 kB
- flat-name.md1 kB
- nmod.md4 kB
- nummod.md818 B
- parataxis-hashtag.md889 B
- acl-relcl.md5 kB
- parataxis-url.md726 B
- acl.md769 B
- case.md2 kB
- xcomp-pred.md3 kB
- nmod-poss.md535 B
- punct.md2 kB
- advmod.md3 kB
- ccomp.md3 kB
- parataxis.md1 kB
- parataxis-rt.md429 B
- nmod-prep.md1 kB
- appos.md2 kB
- case-voc.md854 B
- cc.md3 kB
- fixed.md2 kB
- det.md2 kB
- obl-tmod.md1 kB
- discourse.md1 kB
- list.md2 kB
- csubj-cleft.md4 kB
- cop.md2 kB
- csubj-cop.md1 kB
- orphan.md902 B
- obl.md2 kB
- root.md5 kB
- obl-prep.md1 kB
- vocative-mention.md747 B
- dislocated.md1 kB
- conj.md1 kB
- dep-index.md7 kB
- pos-index.md3 kB
- _si
- index.md498 B
- workgroups
- 2015-08-23-uppsala
- coordination.md3 kB
- index.md4 kB
- ellipsis.md11 kB
- future.md1 kB
- mwe.md2 kB
- tokenization.md6 kB
- copula.md5 kB
- clitics.md1 kB
- determiners.md37 kB
- particles.md1 kB
- conversion.md3 kB
- issues.md7 kB
- v3.md2 kB
- index.md1 kB
- core.md96 kB
- enhanced.md19 kB
- v1_to_v2.md1 kB
- mwe.md38 kB
- comparatives.md44 kB
- newdoc
- ditransitive_clauses.md30 kB
- index.md2 kB
- simple_noun_phrases.md11 kB
- two_nominals.md5 kB
- simple_verbal_clauses.md55 kB
- comparatives.md44 kB
- word_segmentation.md17 kB
- valency_changing_operations.md82 kB
- relative_clauses.md51 kB
- expletives.md54 kB
- existentials.md247 B
- 2015-08-23-uppsala
- _hsb
- index.md13 kB
- dep
- dep-alt.md784 B
- _lzz
- template-index.md1 kB
- _sd
- template-index.md1 kB
- _naq
- template-index.md1 kB
- _tagset-conversion
- hr-multext-uposf.md205 kB
- sv-mamba-uposf.md6 kB
- sv-parole-uposf.md23 kB
- la-conll-uposf.md94 kB
- nl-cgn-uposf.md59 kB
- pt-cintil-uposf.md24 kB
- ca-conll2009-uposf.md51 kB
- el-conll-uposf.md86 kB
- hu-conll-uposf.md120 kB
- sl-conll-uposf.md190 kB
- de-conll2009-uposf.md137 kB
- lt-multext-uposf.md122 kB
- es-conll2009-uposf.md51 kB
- te-conll-uposf.md101 kB
- fi-turku-uposf.md1013 kB
- nl-conll-uposf.md34 kB
- cs-conll-uposf.md989 kB
- en-penn-uposf.md6 kB
- ta-tamiltb-uposf.md58 kB
- it-isdt-uposf.md48 kB
- fa-conll-uposf.md56 kB
- la-itconll-uposf.md325 kB
- cs-pdt-uposf.md757 kB
- sk-snk-uposf.md256 kB
- de-smor-uposf.md159 kB
- pt-conll-uposf.md89 kB
- ro-multext-uposf.md45 kB
- ja-conll-uposf.md13 kB
- mt-mlss-uposf.md5 kB
- et-puudepank-uposf.md88 kB
- cs-multext-uposf.md224 kB
- hi-conll-uposf.md688 kB
- cs-ajka-uposf.md343 kB
- ar-padt-uposf.md48 kB
- pt-freeling-uposf.md57 kB
- ja-ipadic-uposf.md10 kB
- bn-conll-uposf.md74 kB
- de-stts-uposf.md7 kB
- ar-conll2007-uposf.md65 kB
- tr-conll-uposf.md215 kB
- ar-conll-uposf.md55 kB
- he-conll-uposf.md64 kB
- ro-rdt-uposf.md2 kB
- sl-multext-uposf.md171 kB
- ru-syntagrus-uposf.md82 kB
- index.md4 kB
- da-conll-uposf.md31 kB
- eu-conll-uposf.md952 kB
- pl-ipipan-uposf.md234 kB
- grc-conll-uposf.md250 kB
- zh-conll-uposf.md35 kB
- sv-suc-uposf.md24 kB
- bg-conll-uposf.md117 kB
- it-conll-uposf.md27 kB
- lt-jablonskis-uposf.md136 kB
- _pa
- index.md1 kB
- dep-index.md184 B
- dep
- compound-redup.md673 B
- nsubj-pass.md598 B
- acl-relcl.md1 kB
- nsubj.md2 kB
- xcomp.md1 kB
- compound-lvc.md1002 B
- acl.md1 kB
- obl-agent.md1 kB
- aux-pass.md548 B
- compound-svc.md597 B
- ccomp.md1 kB
- _u-dep-v1
- auxpass.md355 B
- remnant.md4 kB
- name.md2 kB
- csubjpass.md402 B
- foreign.md653 B
- mwe.md1 kB
- dobj.md1 kB
- neg.md482 B
- nsubjpass.md352 B
- contribute.md1 kB
- LICENSE.txt11 kB
- _fo
- index.md4 kB
- dep-index.md140 B
- dep
- cop.md1 kB
- conj.md784 B
- slavic.md744 B
- _or
- index.md1 kB
- release_checklist_add_language.md7 kB
- _ckb
- specific-syntax.md657 B
- _nyq
- index.md2 kB
- _template
- template-index-sv-example.md5 kB
- template-index-cs-example.md17 kB
- template-index.md1 kB
- _abq
- template-index.md1 kB
- _u-feat
- NounClass.md12 kB
- PronType.md6 kB
- Polite-dat.md2 kB
- Polarity.md2 kB
- Gender-obj.md2 kB
- NameType.md2 kB
- NounType.md665 B
- NumType.md5 kB
- Style.md4 kB
- Foreign.md1 kB
- Mood.md6 kB
- Person-obj.md2 kB
- Number-abs.md2 kB
- Clusivity.md1 kB
- PartType.md1 kB
- Gender.md3 kB
- Poss.md1 kB
- Case.md25 kB
- VerbType.md3 kB
- Gender-erg.md1 kB
- Person-psor.md1 kB
- Clusivity-psor.md1 kB
- Clusivity-obj.md1 kB
- AdpType.md1 kB
- Echo.md1 kB
- Person-erg.md2 kB
- Number.md5 kB
- Number-dat.md2 kB
- Person.md3 kB
- Reflex.md2 kB
- Polite-erg.md2 kB
- Animacy.md5 kB
- Definite.md4 kB
- Deixis.md4 kB
- Number-psed.md2 kB
- Number-psor.md989 B
- Voice.md5 kB
- Person-subj.md2 kB
- Typo.md2 kB
- Tense.md6 kB
- NumForm.md1 kB
- Clusivity-subj.md1 kB
- PrepCase.md1 kB
- Gender-psor.md1 kB
- Aspect.md4 kB
- Person-abs.md2 kB
- Hyph.md850 B
- Number-obj.md3 kB
- DeixisRef.md1 kB
- Evident.md1 kB
- Gender-dat.md1 kB
- Abbr.md693 B
- Polite-abs.md2 kB
- VerbForm.md6 kB
- Degree.md2 kB
- PunctType.md2 kB
- PunctSide.md769 B
- AdvType.md1 kB
- Number-subj.md3 kB
- Person-dat.md2 kB
- Subcat.md1 kB
- Number-erg.md2 kB
- Polite.md4 kB
- ConjType.md970 B
- Gender-subj.md2 kB
- NumValue.md1 kB
- logos
- by.svg9 kB
- by-nc-sa.svg22 kB
- by-sa.svg16 kB
- logo-ud.png10 kB
- by-nc-nd.svg18 kB
- F.svg3 kB
- LGPLLR.svg1 kB
- gpl.svg3 kB
- D.svg3 kB
- L.svg3 kB
- cc-zero.svg8 kB
- _myu
- index.md6 kB
- feat
- Person.md1 kB
- Red.md675 B
- Class.md1 kB
- Aspect.md2 kB
- Poss.md1 kB
- Incorp.md764 B
- PronType.md887 B
- Case.md414 B
- Trans.md603 B
- Contv.md627 B
- Voice.md1 kB
- Nomzr.md835 B
- Rel.md1 kB
- makedata.sh2 kB
- misc.md62 kB
- static
- fonts
- PT_Sans-Caption-Web-Regular.ttf378 kB
- Liberation_Sans-Regular.ttf156 kB
- fonts
- uralic.md688 B
- _akk
- _gun
- _ug
- css
- images
- ui-bg_flat_0_aaaaaa_40x100.png180 B
- ui-icons_217bc0_256x240.png4 kB
- ui-icons_cd0a0a_256x240.png4 kB
- ui-bg_inset-hard_100_fcfdfd_1x100.png88 B
- ui-icons_6da8d5_256x240.png4 kB
- ui-icons_f9bd01_256x240.png4 kB
- ui-bg_glass_95_fef1ec_1x400.png119 B
- ui-bg_inset-hard_100_f5f8f9_1x100.png104 B
- ui-icons_d8e7f3_256x240.png4 kB
- ui-bg_flat_55_fbec88_40x100.png182 B
- ui-bg_gloss-wave_55_5c9ccc_500x100.png3 kB
- ui-bg_glass_75_d0e5f5_1x400.png124 B
- ui-icons_2e83ff_256x240.png4 kB
- ui-bg_glass_85_dfeffc_1x400.png123 B
- ui-icons_469bdd_256x240.png4 kB
- style-vis.css10 kB
- style.css10 kB
- jquery-ui-redmond.css33 kB
- hint.css7 kB
- images
- events.md1 kB
- _et
- index.md6 kB
- pos-index.md132 B
- feat-index.md134 B
- feat
- Degree.md1 kB
- Mood.md3 kB
- Connegative.md751 B
- Polarity.md565 B
- Case.md6 kB
- dep-index.md140 B
- dep
- ccomp.md487 B
- nsubj.md367 B
- flat.md514 B
- cc.md1 kB
- csubj-cop.md553 B
- compound.md571 B
- obj.md761 B
- case.md595 B
- acl.md938 B
- neg.md323 B
- csubj.md576 B
- nmod.md553 B
- advcl.md995 B
- nsubj-cop.md472 B
- advmod.md518 B
- cop.md975 B
- aux_.md1 kB
- conj.md614 B
- amod.md424 B
- appos.md953 B
- pos
- PRON.md1 kB
- ADV.md720 B
- VERB.md1 kB
- NUM.md501 B
- CCONJ.md750 B
- ADJ.md797 B
- SCONJ.md515 B
- SYM.md375 B
- DET.md180 B
- NOUN.md386 B
- PROPN.md401 B
- INTJ.md341 B
- PUNCT.md263 B
- ADP.md483 B
- AUX_.md892 B
- X.md653 B
- PART.md201 B
- introduction.md2 kB
- _es
- index.md10 kB
- pos-index.md132 B
- dep-index.md140 B
- morphology.md911 B
- dep
- ccomp.md431 B
- iobj.md320 B
- nsubj.md508 B
- punct.md293 B
- det.md302 B
- cc.md670 B
- obj.md312 B
- acl.md632 B
- parataxis.md389 B
- nummod.md397 B
- xcomp.md333 B
- csubj.md491 B
- advcl.md716 B
- advmod.md409 B
- cop.md364 B
- vocative.md483 B
- aux_.md649 B
- conj.md501 B
- nsubj-pass.md403 B
- csubj-pass.md432 B
- aux-pass.md345 B
- amod.md333 B
- root.md510 B
- mark.md542 B
- pos
- NOUN.md569 B
- INTJ.md1 kB
- ADV.md1 kB
- PUNCT.md480 B
- ADJ.md1 kB
- introduction.md884 B
- _hu
- template-index.md1 kB
- syntax.md2 kB
- feat-index.md134 B
- tokenization.md494 B
- specific-syntax.md674 B
- morphology.md1 kB
- feat
- VerbForm.md2 kB
- Number-psor.md920 B
- Person.md1003 B
- Number.md712 B
- Aspect.md311 B
- Definite.md1 kB
- PronType.md1 kB
- NumType.md1019 B
- Number-psed.md2 kB
- Case.md7 kB
- Degree.md1013 B
- Person-psor.md1 kB
- Tense.md634 B
- Voice.md847 B
- Mood.md1 kB
- pos
- PRON.md344 B
- ADV.md246 B
- VERB.md447 B
- NUM.md255 B
- ADJ.md473 B
- DET.md425 B
- NOUN.md216 B
- PROPN.md231 B
- ADP.md172 B
- AUX_.md383 B
- PART.md328 B
- dep
- amod-attlvc.md2 kB
- nmod-attlvc.md599 B
- nsubj-lvc.md2 kB
- nmod-obl.md722 B
- advmod-locy.md1 kB
- compound.md407 B
- advmod-mode.md1 kB
- ccomp-obj.md830 B
- amod-att.md480 B
- advmod-tfrom.md1 kB
- advmod-tlocy.md1 kB
- advmod-que.md807 B
- ccomp-obl.md1 kB
- compound-preverb.md560 B
- nmod-att.md503 B
- ccomp-pred.md1 kB
- obl-lvc.md2 kB
- obj-lvc.md2 kB
- advmod-tto.md1 kB
- advmod-to.md1 kB
- dep-index.md140 B
- pos-index.md132 B
- _grc
- pos-index.md134 B
- feat-index.md136 B
- feat
- Degree.md4 kB
- Gender.md1 kB
- Case.md2 kB
- tokenization.md1 kB
- pos
- PRON.md1 kB
- ADV.md1 kB
- VERB.md1 kB
- CCONJ.md421 B
- NUM.md1 kB
- ADJ.md2 kB
- SCONJ.md967 B
- SYM.md270 B
- DET.md1 kB
- NOUN.md1004 B
- PROPN.md331 B
- INTJ.md300 B
- PUNCT.md1 kB
- ADP.md2 kB
- AUX_.md1 kB
- X.md137 B
- PART.md1 kB
- introduction.md1 kB
- template-index.md1 kB
- _cgg
- template-index.md1 kB
- _hr
- index.md8 kB
- _tpn
- index.md10 kB
- feat
- ConjType.md633 B
- Aspect.md1 kB
- Number.md738 B
- Priv.md611 B
- AdvType.md1 kB
- Voice.md1 kB
- Corf.md440 B
- Nomzr.md2 kB
- Int.md749 B
- Emph.md431 B
- Recip.md416 B
- Mood.md1 kB
- Person.md2 kB
- Poss.md794 B
- Hum.md688 B
- Red.md868 B
- Foc.md650 B
- Speech.md830 B
- Incorp.md640 B
- Rel.md2 kB
- Intens.md700 B
- Augm.md720 B
- Case.md1 kB
- NonFoc.md869 B
- Delib.md663 B
- Dev.md914 B
- dep
- obl-subj.md663 B
- advcl.md831 B
- obl-obj.md670 B
- pos
- ADP.md787 B
- _bm
- template-index.md1 kB
- feat-index.md145 B
- tokenization.md161 B
- morphology.md4 kB
- feat
- Person.md800 B
- Valency.md836 B
- VerbForm.md1014 B
- Number.md1 kB
- Aspect.md1 kB
- Polarity.md728 B
- PronType.md1 kB
- NumType.md755 B
- Tense.md1015 B
- Mood.md1 kB
- pos
- PRON.md389 B
- VERB.md466 B
- ADV.md342 B
- NUM.md346 B
- CCONJ.md497 B
- ADJ.md467 B
- SCONJ.md448 B
- DET.md854 B
- NOUN.md243 B
- PROPN.md301 B
- INTJ.md429 B
- AUX_.md537 B
- ADP.md495 B
- PART.md472 B
- dep
- ccomp.md1 kB
- nsubj.md512 B
- nmod-poss.md1 kB
- flat.md939 B
- det.md713 B
- cc.md823 B
- obj.md630 B
- det-rel.md932 B
- compound-redup.md800 B
- case.md2 kB
- parataxis-obj.md738 B
- dislocated.md844 B
- acl.md1 kB
- nummod.md721 B
- parataxis.md1 kB
- orphan.md882 B
- xcomp.md1 kB
- fixed.md808 B
- csubj.md702 B
- advcl.md707 B
- obl.md2 kB
- vocative.md707 B
- aux_.md1 kB
- conj.md768 B
- discourse.md1 kB
- amod.md630 B
- root.md454 B
- reparandum.md855 B
- mark.md1 kB
- appos.md673 B
- dep-index.md229 B
- pos-index.md216 B
- _no
- index.md2 kB
- syntax.md1 kB
- tokenization.md363 B
- specific-syntax.md4 kB
- morphology.md358 B
- introduction.md2 kB
- pos
- PRON.md1 kB
- VERB.md1 kB
- ADV.md435 B
- CCONJ.md431 B
- NUM.md478 B
- ADJ.md469 B
- SCONJ.md549 B
- SYM.md446 B
- DET.md1 kB
- NOUN.md507 B
- PROPN.md495 B
- INTJ.md375 B
- PUNCT.md361 B
- AUX_.md1 kB
- ADP.md456 B
- X.md302 B
- PART.md523 B
- dep
- obj.md340 B
- advcl.md863 B
- nsubj.md922 B
- mark.md538 B
- compound-prt.md1 kB
- xcomp.md1 kB
- compound.md841 B
- flat-foreign.md400 B
- csubj.md620 B
- flat-name.md708 B
- amod.md599 B
- nmod.md576 B
- nummod.md501 B
- iobj.md688 B
- acl-relcl.md1 kB
- nsubj-pass.md652 B
- acl.md667 B
- case.md698 B
- punct.md1 kB
- advmod.md421 B
- aux-pass.md385 B
- ccomp.md579 B
- parataxis.md861 B
- parataxis-deletion.md653 B
- goeswith.md520 B
- appos.md740 B
- cc.md760 B
- csubj-pass.md546 B
- det.md778 B
- discourse.md481 B
- cop.md463 B
- orphan.md768 B
- aux_.md856 B
- obl.md817 B
- root.md296 B
- expl.md2 kB
- discourse-filler.md629 B
- acl-cleft.md393 B
- conj.md740 B
- dep-index.md140 B
- pos-index.md132 B
- _bg
- index.md8 kB
- feat-index.md145 B
- specific-syntax.md432 B
- morphology.md665 B
- feat
- Person.md1 kB
- VerbForm.md2 kB
- Number.md1 kB
- Aspect.md1 kB
- Polarity.md1 kB
- Poss.md925 B
- Definite.md1 kB
- Gender.md1 kB
- PronType.md3 kB
- Reflex.md1 kB
- NumType.md2 kB
- Case.md1 kB
- Degree.md1 kB
- Tense.md2 kB
- Mood.md2 kB
- Voice.md1 kB
- Animacy.md2 kB
- pos
- PRON.md2 kB
- ADV.md2 kB
- VERB.md1 kB
- CCONJ.md825 B
- NUM.md1 kB
- ADJ.md1 kB
- SCONJ.md859 B
- DET.md2 kB
- NOUN.md765 B
- PROPN.md1 kB
- INTJ.md1009 B
- PUNCT.md747 B
- ADP.md991 B
- AUX_.md1 kB
- PART.md1 kB
- dep
- iobj.md869 B
- ccomp.md1 kB
- nsubj.md1 kB
- flat.md1 kB
- det.md1013 B
- cc.md415 B
- obj.md626 B
- case.md641 B
- acl.md1 kB
- parataxis.md875 B
- nummod.md649 B
- xcomp.md1 kB
- fixed.md887 B
- csubj.md976 B
- obl.md767 B
- nmod.md789 B
- advcl.md745 B
- advmod.md768 B
- cop.md518 B
- vocative.md756 B
- aux_.md846 B
- conj.md598 B
- nsubj-pass.md743 B
- csubj-pass.md894 B
- expl.md2 kB
- discourse.md642 B
- amod.md465 B
- mark.md607 B
- appos.md767 B
- dep-index.md151 B
- pos-index.md143 B
- _v2
- segmentation.md4 kB
- language-specific.md7 kB
- coordination.md3 kB
- enhanced.md9 kB
- features.md49 kB
- index.md2 kB
- summary.md8 kB
- ellipsis.md8 kB
- mwe.md4 kB
- core-dependents.md10 kB
- copula.md16 kB
- sentence-mood.md80 B
- minimaldoc.md5 kB
- postags.md17 kB
- function.md5 kB
- conll-u.md3 kB
- semantic-categories.md2 kB
- _xnr
- markdown-source
- Name
- ud-tools-v2.10.tgz
- Size
- 782.79 KB
- Format
- application/x-gzip
- Description
- Tools
- MD5
- 4528404492cafe1371fc5692ff0c35bb
- ud-tools-v2.10
- check_text_wosp_match.sh814 B
- conll_convert_tags_to_uposf.pl1 kB
- check_sentence_ids.pl1 kB
- conllu-sort-sentences-by-ids.pl1 kB
- conllu-stats.py6 kB
- package_st_data.sh10 kB
- runtests.sh1 kB
- conllu-w2t.py2 kB
- file_util.pyc2 kB
- validate_repo_metadata.py4 kB
- example-data
- long-token-to-text-wrong.txt333 B
- long-token-to-text-correct.txt332 B
- long-token-to-text.conllu2 kB
- tanl.conll471 B
- conllu-copy-basic-to-enhanced.pl1 kB
- evaluate_treebank.pl18 kB
- enhanced_classify_relations.pl26 kB
- package_ud_release.sh7 kB
- conllu-stats.pl107 kB
- conllu-dependency-stats.pl944 B
- check-space-after-paragraph.pl2 kB
- file_util.py2 kB
- conllu-quick-fix-id-sequence.pl2 kB
- conllu_copy_tokenization.pl10 kB
- check_release.pl31 kB
- conllu-formconvert.py3 kB
- find_duplicate_sentences.pl1 kB
- survey_misc.pl6 kB
- remove_duplicate_sentences.pl2 kB
- validate_all.sh943 B
- fix_format_of_deps.pl1 kB
- conllu_to_conllx.pl2 kB
- LICENSE.txt17 kB
- restore_conllu_lines.pl1 kB
- mwtoken-stats.pl1 kB
- Node.pm18 kB
- overlap.py2 kB
- collect_propn_sequences.pl3 kB
- fix-space-after-paragraph.pl4 kB
- __pycache__
- file_util.cpython-37.pyc2 kB
- survey_features.pl11 kB
- udlib.pm57 kB
- survey_deprel_subtypes.pl8 kB
- compat
- argparse.pyc65 kB
- argparse.py85 kB
- __init__.pyc140 B
- __init__.py0 B
- validate-python2-obsolete.py36 kB
- v2-conversion
- convert.py3 kB
- README.md2 kB
- processors_en.py1 kB
- processors_universal.py5 kB
- depgraph_utils.py6 kB
- nmod_obl_adjudication.py3 kB
- text_without_spaces.pl2 kB
- conllu_copy_sentence_segmentation.pl7 kB
- remove_sense_suffixes_from_lemmas.pl1 kB
- generate_comparison_of_treebanks.pl2 kB
- csort.pm7 kB
- enhanced_graph_properties.pl21 kB
- create_iso_639_3_symlinks.py175 kB
- conllu-quick-fix.pl20 kB
- validate.py177 kB
- eval.py36 kB
- test-cases
- nonvalid
- lowercase-postag.conllu141 B
- lowercase-feature-value-in-empty.conllu251 B
- empty-head.conllu114 B
- invalid-deps-id.conllu173 B
- invalid-deps-syntax.conllu194 B
- misordered-feature.conllu243 B
- missing-final-line.conllu155 B
- empty-field.conllu100 B
- head-not-0-deprel-root.conllu172 B
- ambiguous-feature.conllu175 B
- empty-sentence.conllu163 B
- trailing-tab.conllu127 B
- lowercase-postag-in-empty.conllu239 B
- head-0-deprel-not-root.conllu133 B
- malformed_deps.conllu683 B
- multiple-sent_id.conllu736 B
- head-not-empty-in-empty.conllu224 B
- lowercase-feature.conllu238 B
- duplicate-value.conllu137 B
- tanl-broken.conllu690 B
- misordered-layered-feature.conllu239 B
- whitespace_nonv.conllu274 B
- misplaced-comment-end.conllu429 B
- nonsequential-empty-node-id.conllu238 B
- dos-newlines.conllu698 B
- duplicate-layered-feature.conllu182 B
- cyclic-deps.conllu227 B
- invalid-head.conllu164 B
- id-with-extra-0.conllu140 B
- duplicate-feature.conllu142 B
- overlapping-multiword.conllu387 B
- token_with_cols_filled.conllu385 B
- self-cycle-deps.conllu164 B
- nonsequential-id.conllu176 B
- space-in-field.conllu127 B
- extra-empty-line.conllu287 B
- lowercase-feature-in-empty.conllu244 B
- non-proj.conllu109 B
- no-sent_id.conllu686 B
- id-starting-from-2.conllu247 B
- misindexed-empty-node.conllu235 B
- self-cycle-head.conllu190 B
- invalid-range.conllu375 B
- uppercase-deps-deprel.conllu206 B
- empty-node-without-dependent.conllu251 B
- multiword-with-pos.conllu407 B
- uppercase-deprel.conllu184 B
- missing-space-after.conllu176 B
- invalid-deps-order.conllu409 B
- extra-field.conllu130 B
- duplicate-id.conllu171 B
- invalid-range-format.conllu380 B
- deprel-not-empty-in-empty.conllu233 B
- misplaced-comment-mid.conllu401 B
- misordered-multiword.conllu392 B
- lowercase-value.conllu237 B
- valid
- maximal-empty-node.conllu273 B
- whitespace.conllu294 B
- multiple-features.conllu295 B
- id_test_part2.conllu375 B
- empty-nodes.conllu324 B
- id_test_part1.conllu375 B
- tanl.conllu673 B
- empty-file.conllu0 B
- minimal-empty-node.conllu239 B
- layered-features.conllu272 B
- nonvalid
- README.md12 kB
- conllu-tenfold.pl2 kB
- conllu-remove-enhanced-deps.pl443 B
- save_evaluation_logs.sh962 B
- mergept.pl2 kB
- Graph.pm12 kB
- normalize_unicode.pl511 B
- data
- deprel.shopen311 B
- edeprel.ta2 kB
- tokens_w_space.ud27 B
- edeprel.ar27 kB
- tokens_w_space.br457 B
- tokens_w_space.koi86 B
- docdeps.json223 kB
- tokens_w_space.kk1 kB
- tokens_w_space.nl158 B
- cpos.ud79 B
- edeprels.json788 kB
- tokens_w_space.hit72 B
- edeprel.lt2 kB
- tokens_w_space.am82 B
- edeprel.ru14 kB
- deprels.json670 kB
- tokens_w_space.sv131 B
- tokens_w_space.myv82 B
- tokens_w_space.mdf82 B
- tokens_w_space.pl366 B
- edeprel.uk5 kB
- feats.json963 kB
- tokens_w_space.akk246 B
- tokens_w_space.ja844 B
- tokens_w_space.vi3 B
- deprel.ud237 B
- tokens_w_space.kpv86 B
- data.json348 kB
- tokens_w_space.fro10 B
- tokens_w_space.shopen9 B
- feat_val.shopen2 kB
- tokens_w_space.kmr277 B
- docfeats.json994 kB
- tokens_w_space.fr10 B
- tokens_w_space.lv112 B
- tokens_w_space.sms151 B
- tokens_w_space.sjo2 kB
- tokens_w_space.lt1 kB
- README.md808 B
- edeprel.be6 kB
- tokens_w_space.apu123 B
- tokens_w_space.fi78 B
- generate_treebank_hub.pl1 kB
- conllu_to_text.pl9 kB
- check_overlaps.pl1 kB
- survey_enhancements.pl7 kB
- conllu_align_tokens.pl6 kB
- check_files.pl3 kB
- enhanced_collapse_empty_nodes.pl8 kB
- klcpos3.pl1 kB