Files in this item
Download all files in item (501.12 MB)- Name
- ud-treebanks-v2.8.tgz
- Size
- 410.63 MB
- Format
- application/x-gzip
- Description
- Treebank data
- MD5
- c5e5e30518fb98c3846f3f11af77e612
- ud-treebanks-v2.8
- UD_Italian-PUD
- it_pud-ud-test.txt123 kB
- stats.xml8 kB
- README.md5 kB
- it_pud-ud-test.conllu1 MB
- LICENSE.txt19 kB
- UD_Telugu-MTG
- te_mtg-ud-test.txt10 kB
- te_mtg-ud-train.conllu494 kB
- te_mtg-ud-dev.conllu64 kB
- stats.xml3 kB
- LICENSE.txt202 B
- te_mtg-ud-test.conllu70 kB
- README.txt1 kB
- te_mtg-ud-train.txt72 kB
- te_mtg-ud-dev.txt9 kB
- UD_Swedish-Talbanken
- sv_talbanken-ud-test.txt122 kB
- README.md7 kB
- sv_talbanken-ud-train.txt402 kB
- stats.xml9 kB
- LICENSE.txt20 kB
- sv_talbanken-ud-train.conllu5 MB
- sv_talbanken-ud-dev.conllu834 kB
- sv_talbanken-ud-dev.txt58 kB
- sv_talbanken-ud-test.conllu1 MB
- UD_Makurap-TuDeT
- stats.xml4 kB
- README.md1 kB
- mpu_tudet-ud-test.txt798 B
- LICENSE.txt202 B
- mpu_tudet-ud-test.conllu10 kB
- UD_Finnish-OOD
- fi_ood-ud-test.txt134 kB
- stats.xml18 kB
- README.md1 kB
- fi_ood-ud-test.conllu1 MB
- LICENSE.txt202 B
- UD_Czech-CLTT
- cs_cltt-ud-dev.conllu483 kB
- cs_cltt-ud-test.txt29 kB
- README.md2 kB
- cs_cltt-ud-train.txt195 kB
- cs_cltt-ud-dev.txt33 kB
- cs_cltt-ud-train.conllu2 MB
- stats.xml13 kB
- LICENSE.txt265 B
- cs_cltt-ud-test.conllu416 kB
- UD_Gothic-PROIEL
- README.md2 kB
- got_proiel-ud-train.conllu3 MB
- got_proiel-ud-test.txt64 kB
- got_proiel-ud-train.txt221 kB
- got_proiel-ud-dev.conllu930 kB
- stats.xml9 kB
- LICENSE.txt279 B
- got_proiel-ud-test.conllu946 kB
- got_proiel-ud-dev.txt62 kB
- UD_Czech-PUD
- stats.xml16 kB
- README.md3 kB
- LICENSE.txt202 B
- cs_pud-ud-test.txt114 kB
- cs_pud-ud-test.conllu2 MB
- UD_French-Sequoia
- fr_sequoia-ud-test.txt53 kB
- fr_sequoia-ud-dev.conllu612 kB
- README.md4 kB
- fr_sequoia-ud-test.conllu612 kB
- fr_sequoia-ud-train.txt267 kB
- fr_sequoia-ud-dev.txt52 kB
- stats.xml8 kB
- LICENSE.txt14 kB
- fr_sequoia-ud-train.conllu3 MB
- UD_Swedish-LinES
- sv_lines-ud-train.conllu4 MB
- sv_lines-ud-dev.conllu1 MB
- sv_lines-ud-train.txt302 kB
- sv_lines-ud-dev.txt101 kB
- sv_lines-ud-test.conllu1 MB
- stats.xml9 kB
- sv_lines-ud-test.txt92 kB
- LICENSE.txt18 kB
- README.txt7 kB
- UD_German-GSD
- README.md7 kB
- de_gsd-ud-dev.conllu876 kB
- de_gsd-ud-dev.txt72 kB
- de_gsd-ud-train.txt1 MB
- de_gsd-ud-test.conllu1 MB
- stats.xml10 kB
- de_gsd-ud-train.conllu18 MB
- LICENSE.txt202 B
- de_gsd-ud-test.txt97 kB
- UD_Faroese-FarPaHC
- fo_farpahc-ud-dev.conllu464 kB
- README.md4 kB
- fo_farpahc-ud-dev.txt42 kB
- fo_farpahc-ud-test.conllu458 kB
- fo_farpahc-ud-train.txt105 kB
- fo_farpahc-ud-train.conllu1 MB
- stats.xml5 kB
- fo_farpahc-ud-test.txt42 kB
- LICENSE.txt202 B
- UD_Japanese-PUD
- ja_pud-ud-test.txt138 kB
- stats.xml3 kB
- README.md5 kB
- ja_pud-ud-test.conllu4 MB
- LICENSE.txt19 kB
- UD_Italian-Valico
- stats.xml8 kB
- README.md3 kB
- it_valico-ud-test.conllu520 kB
- LICENSE.txt202 B
- it_valico-ud-test.txt31 kB
- UD_Turkish_German-SAGT
- qtd_sagt-ud-train.conllu720 kB
- qtd_sagt-ud-test.txt77 kB
- README.md3 kB
- qtd_sagt-ud-train.txt55 kB
- qtd_sagt-ud-dev.conllu922 kB
- qtd_sagt-ud-test.conllu1013 kB
- qtd_sagt-ud-dev.txt71 kB
- stats.xml15 kB
- LICENSE.txt202 B
- UD_Chinese-PUD
- stats.xml4 kB
- zh_pud-ud-test.conllu1 MB
- README.md5 kB
- zh_pud-ud-test.txt101 kB
- LICENSE.txt19 kB
- UD_English-LinES
- en_lines-ud-test.conllu1013 kB
- en_lines-ud-train.conllu3 MB
- en_lines-ud-test.txt83 kB
- en_lines-ud-dev.conllu1 MB
- stats.xml8 kB
- en_lines-ud-train.txt272 kB
- LICENSE.txt18 kB
- README.txt7 kB
- en_lines-ud-dev.txt91 kB
- UD_Buryat-BDT
- stats.xml12 kB
- README.txt1 kB
- bxr_bdt-ud-train.conllu10 kB
- bxr_bdt-ud-train.txt1 kB
- LICENSE.txt202 B
- bxr_bdt-ud-test.conllu699 kB
- bxr_bdt-ud-test.txt114 kB
- UD_Latin-PROIEL
- la_proiel-ud-dev.txt87 kB
- README.md2 kB
- la_proiel-ud-dev.conllu1 MB
- la_proiel-ud-test.txt88 kB
- stats.xml10 kB
- la_proiel-ud-train.conllu15 MB
- LICENSE.txt279 B
- la_proiel-ud-train.txt1 MB
- la_proiel-ud-test.conllu1 MB
- UD_English-GUMReddit
- README.md13 kB
- en_gumreddit-ud-train.txt23 kB
- en_gumreddit-ud-train.conllu1 MB
- en_gumreddit-ud-dev.conllu149 kB
- get_text.py26 kB
- en_gumreddit-ud-dev.txt3 kB
- stats.xml6 kB
- en_gumreddit-ud-test.txt3 kB
- LICENSE.txt313 B
- en_gumreddit-ud-test.conllu151 kB
- UD_Sanskrit-Vedic
- stats.xml8 kB
- README.md2 kB
- sa_vedic-ud-train.conllu1 MB
- sa_vedic-ud-test.conllu710 kB
- LICENSE.txt202 B
- sa_vedic-ud-test.txt74 kB
- sa_vedic-ud-train.txt135 kB
- UD_Norwegian-Bokmaal
- README.md6 kB
- no_bokmaal-ud-dev.txt195 kB
- no_bokmaal-ud-train.txt1 MB
- no_bokmaal-ud-test.txt161 kB
- stats.xml9 kB
- no_bokmaal-ud-train.conllu14 MB
- no_bokmaal-ud-test.conllu1 MB
- no_bokmaal-ud-dev.conllu2 MB
- LICENSE.txt68 B
- UD_Turkish-IMST
- tr_imst-ud-test.txt65 kB
- README.md2 kB
- tr_imst-ud-train.conllu2 MB
- tr_imst-ud-test.conllu801 kB
- tr_imst-ud-dev.conllu797 kB
- tr_imst-ud-dev.txt64 kB
- stats.xml13 kB
- LICENSE.txt20 kB
- tr_imst-ud-train.txt246 kB
- UD_French-FQB
- stats.xml7 kB
- fr_fqb-ud-test.conllu1 MB
- README.md3 kB
- fr_fqb-ud-test.txt117 kB
- LICENSE.txt14 kB
- UD_South_Levantine_Arabic-MADAR
- stats.xml4 kB
- README.md2 kB
- ajp_madar-ud-test.conllu42 kB
- LICENSE.txt202 B
- ajp_madar-ud-test.txt5 kB
- UD_Old_East_Slavic-TOROT
- README.md3 kB
- orv_torot-ud-test.txt150 kB
- orv_torot-ud-train.txt1 MB
- orv_torot-ud-train.conllu11 MB
- orv_torot-ud-dev.conllu1 MB
- orv_torot-ud-dev.txt151 kB
- orv_torot-ud-test.conllu1 MB
- stats.xml12 kB
- LICENSE.txt197 B
- UD_French-PUD
- stats.xml8 kB
- fr_pud-ud-test.txt130 kB
- fr_pud-ud-test.conllu1 MB
- README.md5 kB
- LICENSE.txt19 kB
- UD_Manx-Cadhan
- stats.xml7 kB
- README.md2 kB
- LICENSE.txt656 B
- gv_cadhan-ud-test.txt82 kB
- gv_cadhan-ud-test.conllu1 MB
- UD_Moksha-JR
- stats.xml23 kB
- README.md5 kB
- LICENSE.txt202 B
- mdf_jr-ud-test.conllu295 kB
- mdf_jr-ud-test.txt29 kB
- UD_Munduruku-TuDeT
- stats.xml7 kB
- README.md2 kB
- myu_tudet-ud-test.conllu39 kB
- LICENSE.txt202 B
- myu_tudet-ud-test.txt2 kB
- UD_Tagalog-TRG
- stats.xml7 kB
- tl_trg-ud-test.txt3 kB
- tl_trg-ud-test.conllu59 kB
- README.md1 kB
- LICENSE.txt202 B
- UD_French-ParTUT
- README.md5 kB
- fr_partut-ud-dev.conllu116 kB
- fr_partut-ud-train.conllu1 MB
- fr_partut-ud-test.txt14 kB
- fr_partut-ud-train.txt128 kB
- stats.xml8 kB
- LICENSE.txt18 kB
- fr_partut-ud-test.conllu164 kB
- fr_partut-ud-dev.txt9 kB
- UD_Turkish-PUD
- stats.xml12 kB
- README.md6 kB
- tr_pud-ud-test.conllu1 MB
- tr_pud-ud-test.txt119 kB
- LICENSE.txt19 kB
- UD_Spanish-GSD
- README.md4 kB
- es_gsd-ud-test.conllu714 kB
- es_gsd-ud-train.conllu22 MB
- es_gsd-ud-test.txt61 kB
- es_gsd-ud-train.txt1 MB
- es_gsd-ud-dev.conllu2 MB
- es_gsd-ud-dev.txt191 kB
- stats.xml10 kB
- LICENSE.txt202 B
- UD_Persian-PerDT
- fa_perdt-ud-train.conllu28 MB
- README.md4 kB
- fa_perdt-ud-dev.conllu1 MB
- fa_perdt-ud-dev.txt206 kB
- fa_perdt-ud-test.txt198 kB
- fa_perdt-ud-train.txt3 MB
- stats.xml7 kB
- LICENSE.txt19 kB
- fa_perdt-ud-test.conllu1 MB
- UD_Korean-GSD
- ko_gsd-ud-dev.txt103 kB
- README.md3 kB
- ko_gsd-ud-dev.conllu709 kB
- ko_gsd-ud-train.conllu3 MB
- ko_gsd-ud-test.txt100 kB
- ko_gsd-ud-test.conllu691 kB
- ko_gsd-ud-train.txt485 kB
- stats.xml4 kB
- LICENSE.txt202 B
- UD_Ancient_Greek-Perseus
- README.md3 kB
- grc_perseus-ud-dev.txt250 kB
- grc_perseus-ud-test.conllu1 MB
- grc_perseus-ud-test.txt231 kB
- grc_perseus-ud-train.txt1 MB
- stats.xml10 kB
- grc_perseus-ud-train.conllu14 MB
- LICENSE.txt279 B
- grc_perseus-ud-dev.conllu1 MB
- UD_Italian-TWITTIRO
- README.md3 kB
- it_twittiro-ud-test.conllu184 kB
- it_twittiro-ud-test.txt15 kB
- it_twittiro-ud-train.txt120 kB
- it_twittiro-ud-train.conllu1 MB
- stats.xml9 kB
- it_twittiro-ud-dev.conllu188 kB
- it_twittiro-ud-dev.txt15 kB
- LICENSE.txt202 B
- UD_Hindi-HDTB
- README.md2 kB
- hi_hdtb-ud-dev.conllu4 MB
- hi_hdtb-ud-train.conllu39 MB
- hi_hdtb-ud-dev.txt428 kB
- hi_hdtb-ud-test.txt425 kB
- hi_hdtb-ud-test.conllu4 MB
- hi_hdtb-ud-train.txt3 MB
- stats.xml13 kB
- LICENSE.txt249 B
- UD_Polish-LFG
- pl_lfg-ud-dev.txt74 kB
- pl_lfg-ud-train.txt596 kB
- README.md6 kB
- pl_lfg-ud-test.txt74 kB
- pl_lfg-ud-dev.conllu1 MB
- pl_lfg-ud-test.conllu1 MB
- stats.xml14 kB
- LICENSE.txt34 kB
- pl_lfg-ud-train.conllu11 MB
- UD_Romanian-ArT
- ro_art-ud-test.conllu44 kB
- stats.xml8 kB
- README.md1 kB
- ro_art-ud-test.txt2 kB
- LICENSE.txt202 B
- UD_German-HDT
- README.md6 kB
- de_hdt-ud-dev.conllu22 MB
- de_hdt-ud-test.txt2 MB
- de_hdt-ud-test.conllu22 MB
- stats.xml10 kB
- de_hdt-ud-train.conllu192 MB
- de_hdt-ud-dev.txt2 MB
- LICENSE.txt266 B
- de_hdt-ud-train.txt17 MB
- UD_Komi_Zyrian-Lattice
- stats.xml25 kB
- README.md7 kB
- kpv_lattice-ud-test.txt78 kB
- LICENSE.txt202 B
- kpv_lattice-ud-test.conllu735 kB
- UD_Estonian-EWT
- et_ewt-ud-train.txt260 kB
- README.md3 kB
- et_ewt-ud-dev.txt49 kB
- et_ewt-ud-dev.conllu622 kB
- et_ewt-ud-test.conllu920 kB
- et_ewt-ud-test.txt76 kB
- et_ewt-ud-train.conllu3 MB
- stats.xml12 kB
- LICENSE.txt202 B
- UD_Italian-ParTUT
- README.md4 kB
- it_partut-ud-dev.txt15 kB
- it_partut-ud-test.txt19 kB
- it_partut-ud-train.txt259 kB
- stats.xml9 kB
- it_partut-ud-test.conllu234 kB
- it_partut-ud-dev.conllu189 kB
- LICENSE.txt18 kB
- it_partut-ud-train.conllu3 MB
- UD_Romanian-Nonstandard
- ro_nonstandard-ud-test.txt104 kB
- README.md9 kB
- ro_nonstandard-ud-dev.txt91 kB
- ro_nonstandard-ud-dev.conllu1 MB
- ro_nonstandard-ud-test.conllu1 MB
- stats.xml12 kB
- ro_nonstandard-ud-train.txt2 MB
- ro_nonstandard-ud-train.conllu44 MB
- LICENSE.txt202 B
- UD_Livvi-KKPP
- stats.xml10 kB
- olo_kkpp-ud-train.txt808 B
- README.md4 kB
- olo_kkpp-ud-test.conllu103 kB
- olo_kkpp-ud-test.txt9 kB
- LICENSE.txt202 B
- olo_kkpp-ud-train.conllu15 kB
- UD_German-PUD
- stats.xml9 kB
- README.md5 kB
- LICENSE.txt19 kB
- de_pud-ud-test.conllu1 MB
- de_pud-ud-test.txt126 kB
- UD_Turkish-Kenet
- tr_kenet-ud-dev.txt122 kB
- README.md1 kB
- tr_kenet-ud-train.conllu9 MB
- tr_kenet-ud-test.txt123 kB
- tr_kenet-ud-dev.conllu1 MB
- stats.xml11 kB
- LICENSE.txt202 B
- tr_kenet-ud-train.txt989 kB
- tr_kenet-ud-test.conllu1 MB
- UD_Urdu-UDTB
- README.md2 kB
- ur_udtb-ud-train.txt853 kB
- ur_udtb-ud-test.txt117 kB
- ur_udtb-ud-train.conllu11 MB
- ur_udtb-ud-test.conllu1 MB
- stats.xml10 kB
- ur_udtb-ud-dev.txt115 kB
- LICENSE.txt247 B
- ur_udtb-ud-dev.conllu1 MB
- UD_Kaapor-TuDeT
- stats.xml4 kB
- README.md2 kB
- LICENSE.txt202 B
- urb_tudet-ud-test.txt1 kB
- urb_tudet-ud-test.conllu18 kB
- UD_Estonian-EDT
- et_edt-ud-test.txt312 kB
- et_edt-ud-train.txt2 MB
- README.md4 kB
- et_edt-ud-test.conllu3 MB
- et_edt-ud-dev.conllu3 MB
- et_edt-ud-train.conllu24 MB
- stats.xml13 kB
- LICENSE.txt279 B
- et_edt-ud-dev.txt284 kB
- UD_Akkadian-PISANDUB
- stats.xml3 kB
- README.md871 B
- akk_pisandub-ud-test.txt15 kB
- LICENSE.txt202 B
- akk_pisandub-ud-test.conllu99 kB
- UD_Finnish-FTB
- fi_ftb-ud-train.conllu10 MB
- README.md3 kB
- fi_ftb-ud-test.txt116 kB
- fi_ftb-ud-test.conllu1 MB
- stats.xml17 kB
- LICENSE.txt43 kB
- fi_ftb-ud-dev.txt111 kB
- fi_ftb-ud-dev.conllu1 MB
- fi_ftb-ud-train.txt904 kB
- UD_Galician-TreeGal
- stats.xml9 kB
- README.md5 kB
- gl_treegal-ud-test.txt50 kB
- gl_treegal-ud-train.conllu1 MB
- LICENSE.txt14 kB
- gl_treegal-ud-train.txt76 kB
- gl_treegal-ud-test.conllu670 kB
- UD_Portuguese-GSD
- pt_gsd-ud-test.conllu1 MB
- README.md3 kB
- pt_gsd-ud-train.conllu11 MB
- pt_gsd-ud-train.txt1 MB
- pt_gsd-ud-dev.conllu1 MB
- stats.xml5 kB
- pt_gsd-ud-test.txt153 kB
- LICENSE.txt202 B
- pt_gsd-ud-dev.txt156 kB
- UD_Latin-Perseus
- stats.xml8 kB
- la_perseus-ud-train.conllu1 MB
- README.md3 kB
- la_perseus-ud-test.txt61 kB
- la_perseus-ud-test.conllu961 kB
- LICENSE.txt279 B
- la_perseus-ud-train.txt104 kB
- UD_Old_Turkish-Tonqq
- stats.xml2 kB
- otk_tonqq-ud-test.txt2 kB
- README.md1 kB
- otk_tonqq-ud-test.conllu14 kB
- LICENSE.txt6 kB
- UD_Hindi_English-HIENCS
- README.md3 kB
- qhe_hiencs-ud-train.conllu681 kB
- qhe_hiencs-ud-test.conllu104 kB
- qhe_hiencs-ud-test.txt6 kB
- qhe_hiencs-ud-train.txt39 kB
- qhe_hiencs-ud-dev.conllu107 kB
- stats.xml2 kB
- merge
- train-annot.json1 MB
- tweet_ids_dev.txt4 kB
- EDITS6 kB
- EMOTICONS3 kB
- test-annot.json229 kB
- NONBREAKING_PREFIXES812 B
- tweet_ids_test.txt4 kB
- DOMAINS293 B
- tweet_ids_train.txt26 kB
- dev-annot.json236 kB
- LICENSE.txt202 B
- crawl_tweets.py18 kB
- qhe_hiencs-ud-dev.txt6 kB
- UD_Italian-PoSTWITA
- it_postwita-ud-test.conllu759 kB
- it_postwita-ud-train.txt526 kB
- README.md3 kB
- it_postwita-ud-dev.conllu734 kB
- it_postwita-ud-train.conllu5 MB
- stats.xml9 kB
- LICENSE.txt18 kB
- it_postwita-ud-dev.txt64 kB
- it_postwita-ud-test.txt67 kB
- UD_Karelian-KKPP
- stats.xml10 kB
- krl_kkpp-ud-test.conllu220 kB
- README.md2 kB
- LICENSE.txt202 B
- krl_kkpp-ud-test.txt21 kB
- UD_Finnish-TDT
- fi_tdt-ud-train.txt1 MB
- fi_tdt-ud-train.conllu12 MB
- fi_tdt-ud-test.conllu1 MB
- stats.xml20 kB
- fi_tdt-ud-test.txt154 kB
- LICENSE.txt24 kB
- README.txt3 kB
- fi_tdt-ud-dev.conllu1 MB
- fi_tdt-ud-dev.txt136 kB
- UD_Tamil-MWTT
- stats.xml16 kB
- ta_mwtt-ud-test.conllu408 kB
- README.md1 kB
- ta_mwtt-ud-test.txt44 kB
- LICENSE.txt202 B
- UD_Swedish-PUD
- stats.xml8 kB
- README.md3 kB
- LICENSE.txt202 B
- sv_pud-ud-test.txt115 kB
- sv_pud-ud-test.conllu1 MB
- UD_Polish-PDB
- README.md5 kB
- pl_pdb-ud-train.txt1 MB
- pl_pdb-ud-dev.conllu3 MB
- pl_pdb-ud-test.txt203 kB
- pl_pdb-ud-train.conllu27 MB
- pl_pdb-ud-dev.txt210 kB
- stats.xml17 kB
- LICENSE.txt384 B
- pl_pdb-ud-test.conllu3 MB
- UD_Amharic-ATT
- stats.xml7 kB
- am_att-ud-test.txt53 kB
- README.md1 kB
- am_att-ud-test.conllu995 kB
- LICENSE.txt202 B
- UD_North_Sami-Giella
- stats.xml10 kB
- README.md2 kB
- sme_giella-ud-train.conllu1 MB
- sme_giella-ud-train.txt107 kB
- LICENSE.txt202 B
- sme_giella-ud-test.conllu668 kB
- sme_giella-ud-test.txt70 kB
- UD_Khunsari-AHA
- stats.xml4 kB
- README.md1 kB
- kfm_aha-ud-test.conllu6 kB
- LICENSE.txt202 B
- kfm_aha-ud-test.txt542 B
- UD_Korean-Kaist
- ko_kaist-ud-test.conllu1 MB
- README.md1 kB
- ko_kaist-ud-train.txt2 MB
- ko_kaist-ud-dev.txt233 kB
- ko_kaist-ud-test.txt255 kB
- ko_kaist-ud-dev.conllu1 MB
- stats.xml4 kB
- LICENSE.txt202 B
- ko_kaist-ud-train.conllu17 MB
- UD_Bambara-CRB
- stats.xml6 kB
- README.md2 kB
- LICENSE.txt202 B
- bm_crb-ud-test.txt51 kB
- bm_crb-ud-test.conllu873 kB
- UD_Ukrainian-IU
- README.md9 kB
- uk_iu-ud-train.txt895 kB
- uk_iu-ud-test.txt176 kB
- uk_iu-ud-dev.conllu1 MB
- uk_iu-ud-test.conllu2 MB
- uk_iu-ud-dev.txt128 kB
- stats.xml17 kB
- LICENSE.txt172 B
- uk_iu-ud-train.conllu12 MB
- UD_English-ESL
- en_esl-ud-dev.conllu319 kB
- README.md4 kB
- en_esl-ud-train.txt153 kB
- en_esl-ud-train.conllu2 MB
- merge.py905 B
- en_esl-ud-test.txt18 kB
- stats.xml3 kB
- en_esl-ud-dev.txt18 kB
- LICENSE.txt19 kB
- en_esl-ud-test.conllu321 kB
- UD_Persian-Seraji
- fa_seraji-ud-train.txt995 kB
- README.md5 kB
- LICENSE.txt110 B
- fa_seraji-ud-dev.conllu989 kB
- UD_Naija-NSC
- pcm_nsc-ud-train.conllu11 MB
- README.md7 kB
- pcm_nsc-ud-test.conllu1 MB
- pcm_nsc-ud-dev.conllu1 MB
- pcm_nsc-ud-test.txt54 kB
- pcm_nsc-ud-train.txt433 kB
- stats.xml9 kB
- LICENSE.txt202 B
- pcm_nsc-ud-dev.txt54 kB
- UD_Norwegian-Nynorsk
- README.md4 kB
- no_nynorsk-ud-dev.conllu1 MB
- no_nynorsk-ud-test.txt135 kB
- no_nynorsk-ud-dev.txt166 kB
- stats.xml9 kB
- no_nynorsk-ud-test.conllu1 MB
- LICENSE.txt68 B
- no_nynorsk-ud-train.txt1 MB
- no_nynorsk-ud-train.conllu14 MB
- UD_Norwegian-NynorskLIA
- no_nynorsklia-ud-test.txt42 kB
- no_nynorsklia-ud-dev.conllu593 kB
- no_nynorsklia-ud-test.conllu594 kB
- stats.xml8 kB
- LICENSE.txt202 B
- README.txt1 kB
- no_nynorsklia-ud-dev.txt42 kB
- no_nynorsklia-ud-train.txt147 kB
- no_nynorsklia-ud-train.conllu2 MB
- UD_Italian-VIT
- it_vit-ud-test.conllu1 MB
- README.md4 kB
- it_vit-ud-dev.conllu1 MB
- it_vit-ud-train.conllu13 MB
- it_vit-ud-dev.txt150 kB
- it_vit-ud-test.txt130 kB
- stats.xml10 kB
- LICENSE.txt202 B
- it_vit-ud-train.txt1 MB
- UD_Bulgarian-BTB
- bg_btb-ud-dev.txt155 kB
- bg_btb-ud-train.txt1 MB
- bg_btb-ud-test.conllu1 MB
- bg_btb-ud-train.conllu11 MB
- stats.xml12 kB
- bg_btb-ud-test.txt152 kB
- LICENSE.txt327 B
- README.txt7 kB
- bg_btb-ud-dev.conllu1 MB
- UD_Romanian-SiMoNERo
- ro_simonero-ud-test.conllu1 MB
- README.md2 kB
- ro_simonero-ud-dev.conllu1 MB
- ro_simonero-ud-test.txt93 kB
- ro_simonero-ud-train.txt719 kB
- ro_simonero-ud-dev.txt91 kB
- stats.xml11 kB
- ro_simonero-ud-train.conllu9 MB
- LICENSE.txt202 B
- UD_Spanish-PUD
- stats.xml8 kB
- es_pud-ud-test.conllu1 MB
- README.md5 kB
- LICENSE.txt19 kB
- es_pud-ud-test.txt123 kB
- UD_Scottish_Gaelic-ARCOSG
- gd_arcosg-ud-train.txt255 kB
- README.md7 kB
- gd_arcosg-ud-test.conllu584 kB
- gd_arcosg-ud-dev.txt51 kB
- gd_arcosg-ud-test.txt51 kB
- gd_arcosg-ud-train.conllu2 MB
- stats.xml8 kB
- LICENSE.txt202 B
- gd_arcosg-ud-dev.conllu585 kB
- UD_Korean-PUD
- ko_pud-ud-test.txt129 kB
- stats.xml6 kB
- README.md5 kB
- LICENSE.txt19 kB
- ko_pud-ud-test.conllu1 MB
- UD_Chinese-HK
- stats.xml3 kB
- README.md4 kB
- LICENSE.txt202 B
- zh_hk-ud-test.conllu482 kB
- zh_hk-ud-test.txt41 kB
- UD_Japanese-GSD
- ja_gsd-ud-dev.txt58 kB
- README.md8 kB
- ja_gsd-ud-dev.conllu1 MB
- ja_gsd-ud-train.conllu25 MB
- stats.xml4 kB
- LICENSE.txt202 B
- ja_gsd-ud-test.conllu1 MB
- ja_gsd-ud-train.txt804 kB
- ja_gsd-ud-test.txt62 kB
- UD_English-ParTUT
- README.md4 kB
- en_partut-ud-train.txt229 kB
- en_partut-ud-test.conllu183 kB
- en_partut-ud-test.txt18 kB
- en_partut-ud-train.conllu2 MB
- stats.xml8 kB
- LICENSE.txt18 kB
- en_partut-ud-dev.conllu148 kB
- en_partut-ud-dev.txt13 kB
- UD_Kangri-KDTB
- stats.xml2 kB
- xnr_kdtb-ud-test.conllu132 kB
- README.md1 kB
- LICENSE.txt202 B
- xnr_kdtb-ud-test.txt29 kB
- UD_Czech-CAC
- cs_cac-ud-test.conllu1 MB
- cs_cac-ud-test.txt71 kB
- README.md5 kB
- cs_cac-ud-train.conllu51 MB
- cs_cac-ud-dev.txt72 kB
- cs_cac-ud-train.txt2 MB
- stats.xml19 kB
- LICENSE.txt265 B
- cs_cac-ud-dev.conllu1 MB
- UD_Faroese-OFT
- stats.xml7 kB
- README.md1 kB
- fo_oft-ud-test.txt58 kB
- fo_oft-ud-test.conllu783 kB
- LICENSE.txt822 B
- UD_Ancient_Greek-PROIEL
- README.md2 kB
- grc_proiel-ud-dev.txt159 kB
- grc_proiel-ud-train.conllu19 MB
- grc_proiel-ud-test.conllu1 MB
- stats.xml13 kB
- grc_proiel-ud-test.txt154 kB
- LICENSE.txt279 B
- grc_proiel-ud-train.txt2 MB
- grc_proiel-ud-dev.conllu1 MB
- UD_English-Pronouns
- stats.xml5 kB
- README.md9 kB
- en_pronouns-ud-test.conllu138 kB
- LICENSE.txt202 B
- en_pronouns-ud-test.txt7 kB
- UD_Czech-PDT
- cs_pdt-ud-train.conllu127 MB
- README.md8 kB
- cs_pdt-ud-test.conllu18 MB
- cs_pdt-ud-test.txt1 MB
- cs_pdt-ud-dev.txt989 kB
- cs_pdt-ud-dev.conllu17 MB
- stats.xml20 kB
- LICENSE.txt19 kB
- cs_pdt-ud-train.txt7 MB
- UD_Swedish_Sign_Language-SSLC
- swl_sslc-ud-dev.txt6 kB
- README.md1 kB
- swl_sslc-ud-train.txt6 kB
- swl_sslc-ud-test.conllu13 kB
- swl_sslc-ud-train.conllu32 kB
- swl_sslc-ud-test.txt2 kB
- stats.xml2 kB
- LICENSE.txt19 kB
- swl_sslc-ud-dev.conllu33 kB
- UD_Chinese-GSD
- README.md2 kB
- zh_gsd-ud-test.conllu647 kB
- zh_gsd-ud-train.conllu5 MB
- zh_gsd-ud-train.txt433 kB
- zh_gsd-ud-dev.txt55 kB
- zh_gsd-ud-dev.conllu680 kB
- stats.xml5 kB
- zh_gsd-ud-test.txt53 kB
- LICENSE.txt202 B
- UD_Catalan-AnCora
- README.md2 kB
- ca_ancora-ud-test.txt297 kB
- ca_ancora-ud-dev.conllu3 MB
- ca_ancora-ud-test.conllu3 MB
- ca_ancora-ud-train.conllu26 MB
- ca_ancora-ud-train.txt2 MB
- stats.xml11 kB
- ca_ancora-ud-dev.txt289 kB
- LICENSE.txt68 B
- UD_Arabic-PUD
- stats.xml9 kB
- README.md5 kB
- ar_pud-ud-test.txt168 kB
- LICENSE.txt19 kB
- ar_pud-ud-test.conllu1 MB
- UD_Tupinamba-TuDeT
- stats.xml11 kB
- README.md1 kB
- LICENSE.txt202 B
- tpn_tudet-ud-test.txt11 kB
- tpn_tudet-ud-test.conllu111 kB
- UD_Icelandic-PUD
- stats.xml9 kB
- is_pud-ud-test.txt119 kB
- README.md3 kB
- LICENSE.txt202 B
- is_pud-ud-test.conllu1 MB
- UD_Erzya-JR
- stats.xml30 kB
- myv_jr-ud-test.txt175 kB
- README.txt5 kB
- LICENSE.txt202 B
- myv_jr-ud-test.conllu1 MB
- UD_Spanish-AnCora
- README.md2 kB
- es_ancora-ud-train.txt2 MB
- es_ancora-ud-test.conllu3 MB
- es_ancora-ud-dev.conllu3 MB
- es_ancora-ud-test.txt277 kB
- stats.xml11 kB
- es_ancora-ud-train.conllu27 MB
- LICENSE.txt68 B
- es_ancora-ud-dev.txt275 kB
- UD_Mbya_Guarani-Dooley
- stats.xml7 kB
- README.md3 kB
- gun_dooley-ud-test.conllu560 kB
- LICENSE.txt202 B
- gun_dooley-ud-test.txt23 kB
- UD_French-GSD
- fr_gsd-ud-train.conllu21 MB
- README.md7 kB
- fr_gsd-ud-dev.conllu2 MB
- fr_gsd-ud-dev.txt184 kB
- stats.xml9 kB
- fr_gsd-ud-test.conllu624 kB
- LICENSE.txt202 B
- fr_gsd-ud-test.txt49 kB
- fr_gsd-ud-train.txt1 MB
- UD_Irish-IDT
- ga_idt-ud-test.conllu676 kB
- ga_idt-ud-dev.conllu671 kB
- ga_idt-ud-dev.txt51 kB
- ga_idt-ud-train.txt538 kB
- ga_idt-ud-train.conllu6 MB
- ga_idt-ud-test.txt52 kB
- stats.xml14 kB
- LICENSE.txt13 B
- README.txt14 kB
- UD_Frisian_Dutch-Fame
- stats.xml3 kB
- README.md3 kB
- qfn_fame-ud-test.conllu215 kB
- LICENSE.txt202 B
- qfn_fame-ud-test.txt19 kB
- UD_Sanskrit-UFAL
- stats.xml16 kB
- README.md1 kB
- sa_ufal-ud-test.conllu414 kB
- LICENSE.txt202 B
- sa_ufal-ud-test.txt27 kB
- UD_Kurmanji-MG
- stats.xml9 kB
- kmr_mg-ud-train.conllu17 kB
- README.txt1 kB
- kmr_mg-ud-test.txt49 kB
- LICENSE.txt202 B
- kmr_mg-ud-train.txt1 kB
- kmr_mg-ud-test.conllu729 kB
- UD_Albanian-TSA
- stats.xml8 kB
- sq_tsa-ud-test.conllu67 kB
- README.md1 kB
- sq_tsa-ud-test.txt5 kB
- LICENSE.txt202 B
- UD_Portuguese-PUD
- stats.xml7 kB
- README.md5 kB
- LICENSE.txt19 kB
- pt_pud-ud-test.txt119 kB
- pt_pud-ud-test.conllu1 MB
- UD_Arabic-NYUAD
- README.md2 kB
- ar_nyuad-ud-test.conllu5 MB
- stats.xml6 kB
- LICENSE.txt202 B
- ar_nyuad-ud-dev.txt123 kB
- ar_nyuad-ud-train.conllu44 MB
- ar_nyuad-ud-train.txt982 kB
- ar_nyuad-ud-test.txt123 kB
- ar_nyuad-ud-dev.conllu5 MB
- merge.jar91 kB
- UD_Bhojpuri-BHTB
- stats.xml11 kB
- bho_bhtb-ud-test.txt73 kB
- README.md3 kB
- bho_bhtb-ud-test.conllu599 kB
- LICENSE.txt202 B
- UD_Chinese-CFL
- stats.xml4 kB
- zh_cfl-ud-test.conllu375 kB
- zh_cfl-ud-test.conllux395 kB
- README.txt7 kB
- zh_cfl-ud-test.txt30 kB
- LICENSE.txt202 B
- UD_English-EWT
- en_ewt-ud-dev.conllu1 MB
- en_ewt-ud-test.txt123 kB
- en_ewt-ud-train.conllu12 MB
- README.md8 kB
- en_ewt-ud-train.txt989 kB
- en_ewt-ud-dev.txt123 kB
- stats.xml9 kB
- LICENSE.txt19 kB
- en_ewt-ud-test.conllu1 MB
- UD_Latin-LLCT
- la_llct-ud-dev.conllu2 MB
- README.md6 kB
- la_llct-ud-test.conllu2 MB
- la_llct-ud-train.conllu16 MB
- stats.xml12 kB
- la_llct-ud-dev.txt136 kB
- LICENSE.txt202 B
- la_llct-ud-test.txt136 kB
- la_llct-ud-train.txt1 MB
- UD_Latin-ITTB
- la_ittb-ud-train.txt2 MB
- README.md9 kB
- la_ittb-ud-dev.txt168 kB
- la_ittb-ud-test.conllu2 MB
- la_ittb-ud-dev.conllu2 MB
- stats.xml13 kB
- LICENSE.txt19 kB
- la_ittb-ud-test.txt169 kB
- la_ittb-ud-train.conllu32 MB
- UD_Cantonese-HK
- stats.xml4 kB
- yue_hk-ud-test.txt53 kB
- README.md4 kB
- LICENSE.txt202 B
- yue_hk-ud-test.conllu693 kB
- UD_Akkadian-RIAO
- stats.xml9 kB
- README.md2 kB
- akk_riao-ud-test.txt151 kB
- akk_riao-ud-test.conllu2 MB
- LICENSE.txt21 kB
- UD_Japanese-Modern
- stats.xml3 kB
- ja_modern-ud-test.conllu2 MB
- README.txt3 kB
- LICENSE.txt17 kB
- ja_modern-ud-test.txt62 kB
- UD_Italian-ISDT
- README.md10 kB
- it_isdt-ud-train.txt1 MB
- it_isdt-ud-train.conllu18 MB
- it_isdt-ud-dev.txt59 kB
- it_isdt-ud-test.txt52 kB
- it_isdt-ud-test.conllu717 kB
- stats.xml10 kB
- LICENSE.txt22 kB
- it_isdt-ud-dev.conllu814 kB
- UD_Icelandic-IcePaHC
- is_icepahc-ud-dev.conllu11 MB
- is_icepahc-ud-test.txt738 kB
- README.md6 kB
- is_icepahc-ud-dev.txt735 kB
- is_icepahc-ud-train.conllu58 MB
- stats.xml11 kB
- LICENSE.txt202 B
- is_icepahc-ud-train.txt3 MB
- is_icepahc-ud-test.conllu11 MB
- UD_Russian-Taiga
- ru_taiga-ud-train.conllu16 MB
- README.md5 kB
- ru_taiga-ud-test.conllu845 kB
- ru_taiga-ud-test.txt92 kB
- ru_taiga-ud-dev.conllu888 kB
- ru_taiga-ud-dev.txt99 kB
- ru_taiga-ud-train.txt1 MB
- stats.xml17 kB
- LICENSE.txt202 B
- UD_Italian-PUD
- ... too many files ...0 B
- Name
- ud-documentation-v2.8.tgz
- Size
- 89.97 MB
- Format
- application/x-gzip
- Description
- Documentation
- MD5
- 953bce3e033374da99456b2531f0810d
- ud-documentation-v2.8
- markdown-source
- _th
- dep
- obl-poss.md1 kB
- template-index.md1 kB
- dep
- _te
- dep
- obl-cau.md694 B
- nsubj-nc.md488 B
- advcl-cond.md1 kB
- obl-cmp.md1 kB
- template-index.md1 kB
- dep
- _urj
- syntax.md2 kB
- feat-index.md146 B
- tokenization.md1 kB
- morphology.md4 kB
- feat
- VerbForm.md2 kB
- Person.md537 B
- Number.md589 B
- Aspect.md703 B
- Polarity.md513 B
- Poss.md450 B
- Definite.md426 B
- PronType.md543 B
- Reflex.md342 B
- NumType.md265 B
- Case.md1 kB
- Degree.md258 B
- Tense.md616 B
- Voice.md579 B
- Mood.md504 B
- introduction.md1 kB
- dep-index.md152 B
- dep
- amod.md1 kB
- acl-relcl.md1 kB
- cop.md401 B
- vocative.md912 B
- acl.md429 B
- appos.md1 kB
- case.md395 B
- punct.md2 kB
- compound.md569 B
- ccomp.md306 B
- advcl.md437 B
- aux_.md698 B
- pos
- PRON.md651 B
- ADV.md3 kB
- VERB.md1 kB
- CCONJ.md908 B
- NUM.md589 B
- ADJ.md683 B
- SCONJ.md413 B
- SYM.md523 B
- DET.md560 B
- NOUN.md480 B
- PROPN.md413 B
- INTJ.md291 B
- ADP.md770 B
- PUNCT.md253 B
- AUX_.md761 B
- X.md633 B
- PART.md527 B
- pos-index.md144 B
- _otk
- index.md2 kB
- lib
- local
- config.js1 kB
- collections.js796 B
- ext
- head.load.min.js3 kB
- jquery.timeago.js7 kB
- jquery.svg.min.js18 kB
- jquery.svgdom.min.js4 kB
- jquery.address.min.js10 kB
- waypoints.min.js7 kB
- webfont.js16 kB
- jquery-ui.min.js205 kB
- jquery.min.js91 kB
- annodoc
- annodoc.js56 kB
- brat
- url_monitor.js6 kB
- visualizer.js131 kB
- util.js23 kB
- dispatcher.js3 kB
- annotation_log.js1 kB
- configuration.js868 B
- local
- resources
- jquery-1.11.3.min.js93 kB
- js-treex-view.min.js177 kB
- bootstrap-theme.min.css19 kB
- filesaver.min.js2 kB
- blob.min.js2 kB
- bootstrap.min.css114 kB
- conllu_viewer.css386 B
- bootstrap.min.js35 kB
- _mr
- _pt
- index.md4 kB
- syntax.md210 B
- feat-index.md134 B
- feat
- Degree.md1 kB
- Person.md1 kB
- Number.md817 B
- Gender.md827 B
- Case.md1 kB
- Definite.md627 B
- introduction.md2 kB
- pos
- PRON.md677 B
- VERB.md2 kB
- ADV.md876 B
- NUM.md1 kB
- CCONJ.md462 B
- ADJ.md1 kB
- SCONJ.md1 kB
- SYM.md1 kB
- DET.md1014 B
- NOUN.md517 B
- PROPN.md1 kB
- INTJ.md1 kB
- AUX_.md525 B
- PUNCT.md584 B
- ADP.md1 kB
- PART.md1 kB
- dep
- advcl.md1 kB
- obj.md1 kB
- nsubj.md1 kB
- vocative.md687 B
- mark.md1 kB
- xcomp.md3 kB
- flat.md2 kB
- compound.md794 B
- csubj.md775 B
- reparandum.md465 B
- amod.md1 kB
- nmod.md374 B
- nummod.md779 B
- acl-relcl.md470 B
- iobj.md1 kB
- nsubj-pass.md449 B
- acl.md1 kB
- case.md1 kB
- punct.md1 kB
- advmod.md1 kB
- aux-pass.md453 B
- ccomp.md1 kB
- parataxis.md5 kB
- goeswith.md376 B
- appos.md1 kB
- cc.md1 kB
- csubj-pass.md483 B
- fixed.md1 kB
- det.md635 B
- discourse.md723 B
- list.md1 kB
- expl-pass.md741 B
- cop.md3 kB
- orphan.md2 kB
- aux_.md1 kB
- root.md813 B
- acl-inf.md420 B
- expl.md1 kB
- dislocated.md1 kB
- conj.md1 kB
- dep.md661 B
- dep-index.md140 B
- pos-index.md132 B
- _sv
- index.md4 kB
- syntax.md1 kB
- feat-index.md134 B
- specific-syntax.md1 kB
- tokenization.md978 B
- morphology.md1 kB
- feat
- VerbForm.md2 kB
- Number.md648 B
- Polarity.md390 B
- Poss.md531 B
- Definite.md757 B
- Gender.md1 kB
- Foreign.md316 B
- PronType.md2 kB
- Case.md1 kB
- Degree.md1 kB
- Voice.md773 B
- Mood.md1 kB
- Tense.md1 kB
- Abbr.md277 B
- introduction.md4 kB
- dep
- obj.md807 B
- nsubj.md582 B
- advcl.md758 B
- vocative.md522 B
- xcomp.md1 kB
- compound-prt.md432 B
- mark.md615 B
- compound.md577 B
- csubj.md495 B
- reparandum.md549 B
- amod.md569 B
- flat-name.md714 B
- nmod.md683 B
- nummod.md576 B
- acl-relcl.md855 B
- iobj.md649 B
- nsubj-pass.md377 B
- acl.md1 kB
- case.md867 B
- nmod-poss.md481 B
- punct.md686 B
- advmod.md677 B
- aux-pass.md646 B
- ccomp.md718 B
- parataxis.md931 B
- goeswith.md412 B
- appos.md710 B
- cc.md1 kB
- csubj-pass.md518 B
- fixed.md698 B
- det.md416 B
- discourse.md424 B
- list.md860 B
- obl-agent.md442 B
- cop.md1 kB
- orphan.md573 B
- aux_.md715 B
- obl.md769 B
- root.md537 B
- expl.md539 B
- dislocated.md999 B
- acl-cleft.md1 kB
- conj.md644 B
- pos
- PRON.md1 kB
- VERB.md683 B
- PUNCT.md377 B
- PART.md663 B
- DET.md1 kB
- SCONJ.md413 B
- CONJ.md399 B
- AUX_.md1 kB
- ADV.md616 B
- X.md536 B
- ADP.md544 B
- PROPN.md470 B
- ADJ.md677 B
- CCONJ.md411 B
- NUM.md843 B
- SYM.md391 B
- INTJ.md311 B
- NOUN.md327 B
- dep-index.md140 B
- index_template.md5 kB
- pos-index.md132 B
- release_checklist.md31 kB
- ext-format.md11 kB
- _sq
- _mk
- template-index.md1 kB
- _config.yml4 kB
- _ja
- pos-index.md143 B
- tokenization.md3 kB
- morphology.md2 kB
- dep
- nummod.md276 B
- discourse.md365 B
- csubj.md657 B
- obl.md434 B
- nsubj.md371 B
- fixed.md638 B
- cop.md1 kB
- det.md567 B
- mark.md425 B
- compound.md383 B
- dislocated.md566 B
- aux_.md534 B
- introduction.md28 kB
- pos
- PRON.md1 kB
- ADV.md1 kB
- VERB.md1 kB
- CCONJ.md856 B
- NUM.md1 kB
- ADJ.md2 kB
- SCONJ.md614 B
- SYM.md1 kB
- DET.md1 kB
- NOUN.md1 kB
- PROPN.md981 B
- INTJ.md1 kB
- ADP.md942 B
- AUX_.md1 kB
- PUNCT.md972 B
- X.md263 B
- PART.md899 B
- _vi
- dep-index.md140 B
- dep
- amod.md376 B
- csubj.md497 B
- discourse.md556 B
- cop.md370 B
- cc.md578 B
- conj.md644 B
- det.md782 B
- advmod.md407 B
- iobj.md516 B
- obj.md390 B
- appos.md538 B
- aux-pass.md421 B
- mark.md576 B
- dislocated.md539 B
- ccomp.md576 B
- aux_.md519 B
- template-index.md1 kB
- _ckt
- index.md2 kB
- dep
- acl-relat.md1 kB
- acl-attr.md672 B
- nmod-attr.md754 B
- aux-neg.md1 kB
- parataxis-rep.md659 B
- nmod-relat.md910 B
- workgroups
- 2015-08-23-uppsala
- coordination.md3 kB
- index.md4 kB
- ellipsis.md11 kB
- future.md1 kB
- tokenization.md6 kB
- mwe.md2 kB
- copula.md5 kB
- clitics.md1 kB
- particles.md1 kB
- determiners.md37 kB
- conversion.md3 kB
- v3.md2 kB
- index.md1 kB
- enhanced.md19 kB
- core.md96 kB
- v1_to_v2.md1 kB
- mwe.md38 kB
- comparatives.md44 kB
- newdoc
- simple_verbal_clauses.md55 kB
- index.md2 kB
- word_segmentation.md17 kB
- comparatives.md44 kB
- valency_changing_operations.md82 kB
- simple_noun_phrases.md11 kB
- ditransitive_clauses.md30 kB
- two_nominals.md5 kB
- expletives.md54 kB
- existentials.md247 B
- 2015-08-23-uppsala
- _tagset-conversion
- hr-multext-uposf.md205 kB
- sv-mamba-uposf.md6 kB
- sv-parole-uposf.md23 kB
- la-conll-uposf.md94 kB
- nl-cgn-uposf.md59 kB
- pt-cintil-uposf.md24 kB
- ca-conll2009-uposf.md51 kB
- el-conll-uposf.md86 kB
- hu-conll-uposf.md120 kB
- sl-conll-uposf.md190 kB
- de-conll2009-uposf.md137 kB
- lt-multext-uposf.md122 kB
- es-conll2009-uposf.md51 kB
- te-conll-uposf.md101 kB
- nl-conll-uposf.md34 kB
- fi-turku-uposf.md1013 kB
- cs-conll-uposf.md989 kB
- en-penn-uposf.md6 kB
- ta-tamiltb-uposf.md58 kB
- it-isdt-uposf.md48 kB
- fa-conll-uposf.md56 kB
- la-itconll-uposf.md325 kB
- cs-pdt-uposf.md757 kB
- sk-snk-uposf.md256 kB
- pt-conll-uposf.md89 kB
- ro-multext-uposf.md45 kB
- de-smor-uposf.md159 kB
- ja-conll-uposf.md13 kB
- mt-mlss-uposf.md5 kB
- et-puudepank-uposf.md88 kB
- cs-multext-uposf.md224 kB
- hi-conll-uposf.md688 kB
- cs-ajka-uposf.md343 kB
- pt-freeling-uposf.md57 kB
- ar-padt-uposf.md48 kB
- bn-conll-uposf.md74 kB
- ja-ipadic-uposf.md10 kB
- de-stts-uposf.md7 kB
- ar-conll2007-uposf.md65 kB
- tr-conll-uposf.md215 kB
- ar-conll-uposf.md55 kB
- sl-multext-uposf.md171 kB
- he-conll-uposf.md64 kB
- ro-rdt-uposf.md2 kB
- da-conll-uposf.md31 kB
- ru-syntagrus-uposf.md82 kB
- index.md4 kB
- eu-conll-uposf.md952 kB
- pl-ipipan-uposf.md234 kB
- grc-conll-uposf.md250 kB
- zh-conll-uposf.md35 kB
- sv-suc-uposf.md24 kB
- bg-conll-uposf.md117 kB
- it-conll-uposf.md27 kB
- lt-jablonskis-uposf.md136 kB
- _u-dep-v1
- auxpass.md355 B
- remnant.md4 kB
- name.md2 kB
- csubjpass.md402 B
- foreign.md653 B
- mwe.md1 kB
- dobj.md1 kB
- neg.md482 B
- nsubjpass.md352 B
- _lv
- index.md12 kB
- slavic.md744 B
- _bho
- index.md3 kB
- _hil
- template-index.md1 kB
- _ru
- template-index.md1 kB
- index.md9 kB
- syntax.md341 B
- feat-index.md145 B
- specific-syntax.md12 kB
- tokenization.md5 kB
- morphology.md591 B
- feat
- VerbForm.md2 kB
- Person.md1 kB
- Number.md2 kB
- Aspect.md1 kB
- Poss.md1 kB
- Polarity.md1 kB
- Gender.md1 kB
- Variant.md1 kB
- Reflex.md1 kB
- Case.md6 kB
- Degree.md1 kB
- NameType.md3 kB
- Voice.md2 kB
- Tense.md3 kB
- Mood.md1 kB
- Animacy.md1 kB
- introduction.md6 kB
- pos
- PRON.md1 kB
- VERB.md3 kB
- ADV.md1 kB
- NUM.md4 kB
- CCONJ.md481 B
- ADJ.md2 kB
- SCONJ.md578 B
- SYM.md1 kB
- DET.md1 kB
- NOUN.md1 kB
- PROPN.md2 kB
- INTJ.md780 B
- AUX_.md1 kB
- PUNCT.md463 B
- ADP.md875 B
- X.md952 B
- PART.md1 kB
- dep
- nsubj.md1 kB
- advcl.md1 kB
- obj.md1 kB
- vocative.md646 B
- nummod-entity.md387 B
- xcomp.md5 kB
- mark.md1 kB
- flat.md2 kB
- compound.md2 kB
- csubj.md922 B
- flat-foreign.md757 B
- reparandum.md446 B
- amod.md1 kB
- flat-name.md811 B
- nmod.md2 kB
- nummod.md10 kB
- acl-relcl.md1 kB
- iobj.md3 kB
- nsubj-pass.md696 B
- acl.md2 kB
- case.md1 kB
- punct.md2 kB
- advmod.md1 kB
- aux-pass.md867 B
- ccomp.md1 kB
- parataxis.md3 kB
- goeswith.md587 B
- appos.md2 kB
- cc.md1 kB
- csubj-pass.md425 B
- fixed.md1 kB
- det.md664 B
- discourse.md1 kB
- list.md1 kB
- obl-agent.md398 B
- cop.md1 kB
- orphan.md1 kB
- aux_.md1 kB
- obl.md512 B
- root.md1 kB
- nummod-gov.md1021 B
- expl.md1 kB
- dislocated.md1 kB
- conj.md1 kB
- dep.md654 B
- dep-index.md151 B
- pos-index.md143 B
- _template
- template-index-sv-example.md5 kB
- template-index-cs-example.md17 kB
- template-index.md1 kB
- discussion.md1 kB
- _fi
- extra.md13 kB
- index.md3 kB
- syntax.md4 kB
- FTB-tokenization.md419 B
- feat-index.md134 B
- specific-syntax.md70 kB
- tokenization.md402 B
- FTB-introduction.md2 kB
- feat
- Typo.md415 B
- Number.md715 B
- Abbr.md638 B
- Voice.md623 B
- Degree.md1 kB
- Tense.md1 kB
- VerbForm.md1 kB
- Polarity.md345 B
- Mood.md2 kB
- Person.md1 kB
- Clitic.md2 kB
- Derivation.md2 kB
- NumType.md911 B
- PronType.md3 kB
- PartForm.md1 kB
- Person-psor.md743 B
- Connegative.md812 B
- InfForm.md1 kB
- Case.md6 kB
- Number-psor.md745 B
- Style.md585 B
- introduction.md2 kB
- FTB1tokenization.md365 B
- dep-index.md235 B
- pos
- PRON.md919 B
- ADV.md480 B
- VERB.md614 B
- NUM.md552 B
- CCONJ.md882 B
- ADJ.md745 B
- SCONJ.md631 B
- SYM.md376 B
- DET.md910 B
- NOUN.md471 B
- PROPN.md528 B
- INTJ.md384 B
- ADP.md419 B
- PUNCT.md336 B
- AUX_.md1 kB
- X.md455 B
- PART.md785 B
- dep
- advcl.md1 kB
- obj.md946 B
- nsubj.md504 B
- vocative.md567 B
- cc-preconj.md1 kB
- mark.md2 kB
- compound-prt.md3 kB
- xcomp.md2 kB
- flat.md1 kB
- compound.md1 kB
- csubj.md485 B
- xcomp-ds.md1 kB
- amod.md781 B
- nmod.md818 B
- nummod.md751 B
- acl-relcl.md1 kB
- nmod-gobj.md665 B
- case.md898 B
- acl.md2 kB
- punct.md1 kB
- nmod-poss.md1 kB
- advmod.md1 kB
- aux-pass.md1 kB
- ccomp.md2 kB
- parataxis.md2 kB
- goeswith.md683 B
- appos.md1 kB
- cc.md2 kB
- fixed.md4 kB
- det.md796 B
- discourse.md1016 B
- cop-own.md965 B
- list.md993 B
- nsubj-cop.md619 B
- compound-nn.md1 kB
- nmod-gsubj.md553 B
- cop.md860 B
- csubj-cop.md796 B
- orphan.md881 B
- aux_.md1 kB
- root.md315 B
- conj.md1 kB
- FTB1introduction.md1 kB
- pos-index.md132 B
- _ur
- index.md3 kB
- _got
- feat
- Strength.md1 kB
- introduction.md695 B
- template-index.md1 kB
- feat
- logos
- by.svg9 kB
- by-nc-sa.svg22 kB
- logo-ud.png10 kB
- by-sa.svg16 kB
- F.svg3 kB
- LGPLLR.svg1 kB
- gpl.svg3 kB
- D.svg3 kB
- L.svg3 kB
- _id
- index.md13 kB
- dep
- cc-preconj.md1 kB
- nsubj-pass.md746 B
- acl-relcl.md430 B
- clf.md722 B
- nmod-tmod.md599 B
- nmod-poss.md603 B
- fixed.md1 kB
- cop.md683 B
- csubj-pass.md760 B
- obl-tmod.md696 B
- compound-a.md948 B
- nmod-lmod.md1 kB
- obl-agent.md918 B
- advmod-emph.md1 kB
- aux_.md743 B
- case-adv.md1 kB
- _orv
- index.md7 kB
- feat
- Variant.md1 kB
- NumForm.md1 kB
- Number.md2 kB
- VerbForm.md4 kB
- Analyt.md829 B
- uralic.md688 B
- _u-dep
- advcl.md847 B
- obj.md1 kB
- nsubj.md2 kB
- vocative.md661 B
- det-numgov.md1 kB
- cc-preconj.md535 B
- compound-prt.md807 B
- mark.md1 kB
- xcomp.md4 kB
- flat.md9 kB
- compound.md1 kB
- flat-foreign.md750 B
- csubj.md1 kB
- expl-pv.md918 B
- reparandum.md448 B
- amod.md556 B
- flat-name.md1 kB
- nmod.md905 B
- nummod.md673 B
- iobj.md3 kB
- acl-relcl.md493 B
- nsubj-pass.md635 B
- nmod-tmod.md388 B
- case.md5 kB
- expl-impers.md1018 B
- acl.md1 kB
- punct.md2 kB
- nmod-poss.md524 B
- advmod.md1 kB
- aux-pass.md1 kB
- advmod-lmod.md406 B
- clf.md4 kB
- ccomp.md1 kB
- parataxis.md5 kB
- obl-arg.md2 kB
- goeswith.md1 kB
- appos.md4 kB
- compound-svc.md4 kB
- cc.md1 kB
- obl-lmod.md431 B
- csubj-pass.md751 B
- fixed.md1 kB
- det.md855 B
- obl-tmod.md433 B
- discourse.md908 B
- list.md2 kB
- compound-redup.md1 kB
- obl-agent.md1 kB
- expl-pass.md607 B
- cop.md5 kB
- advmod-emph.md1 kB
- det-nummod.md1 kB
- orphan.md1 kB
- aux_.md1 kB
- obl.md2 kB
- root.md1 kB
- nummod-gov.md1 kB
- expl.md5 kB
- dislocated.md1 kB
- det-poss.md643 B
- compound-lvc.md1020 B
- conj.md3 kB
- dep.md590 B
- _hy
- index.md16 kB
- syntax.md1 kB
- feat-index.md145 B
- specific-syntax.md15 kB
- tokenization.md5 kB
- morphology.md934 B
- feat
- Typo.md508 B
- Definite.md1 kB
- ConjType.md1 kB
- Aspect.md4 kB
- Number.md4 kB
- Abbr.md2 kB
- Reflex.md1 kB
- Foreign.md1 kB
- Voice.md5 kB
- Subcat.md868 B
- Hyph.md1 kB
- Degree.md3 kB
- NameType.md2 kB
- Tense.md5 kB
- VerbForm.md6 kB
- Polarity.md2 kB
- Mood.md4 kB
- Poss.md1 kB
- Person.md1 kB
- NumType.md2 kB
- PronType.md6 kB
- AdpType.md2 kB
- NumForm.md1 kB
- Person-psor.md3 kB
- Animacy.md1 kB
- Connegative.md1 kB
- Echo.md2 kB
- Polite.md1 kB
- Case.md5 kB
- Number-psor.md1 kB
- Style.md1 kB
- Deixis.md1 kB
- introduction.md2 kB
- pos
- PRON.md2 kB
- ADV.md1 kB
- VERB.md3 kB
- CCONJ.md496 B
- NUM.md3 kB
- ADJ.md1 kB
- SCONJ.md1 kB
- SYM.md1 kB
- DET.md3 kB
- NOUN.md1 kB
- PROPN.md4 kB
- INTJ.md1 kB
- PUNCT.md960 B
- ADP.md2 kB
- AUX_.md5 kB
- X.md1 kB
- PART.md1 kB
- dep-index.md151 B
- dep
- advcl.md1 kB
- obj.md1 kB
- nsubj.md1 kB
- vocative.md765 B
- nmod-npmod.md2 kB
- mark.md1 kB
- xcomp.md4 kB
- flat.md4 kB
- compound.md2 kB
- csubj.md1 kB
- reparandum.md433 B
- amod.md885 B
- nmod.md3 kB
- nummod.md3 kB
- iobj.md2 kB
- acl-relcl.md1 kB
- nsubj-pass.md577 B
- case.md2 kB
- acl.md1 kB
- punct.md2 kB
- nmod-poss.md566 B
- advmod.md1 kB
- case-loc.md2 kB
- ccomp.md1 kB
- parataxis.md4 kB
- goeswith.md818 B
- appos.md2 kB
- compound-svc.md1 kB
- cc.md1 kB
- csubj-pass.md1 kB
- fixed.md1 kB
- det.md1 kB
- discourse.md1 kB
- compound-redup.md1 kB
- aux-ex.md865 B
- list.md1 kB
- obl-agent.md472 B
- nsubj-caus.md899 B
- cop.md4 kB
- advmod-emph.md1 kB
- orphan.md1 kB
- aux_.md1 kB
- aux-caus.md1 kB
- obl.md4 kB
- root.md1 kB
- iobj-agent.md2 kB
- dislocated.md2 kB
- det-poss.md697 B
- compound-lvc.md746 B
- dep.md1 kB
- conj.md2 kB
- pos-index.md143 B
- index.md4 kB
- _pbv
- template-index.md1 kB
- _eu
- template-index.md1 kB
- syntax.md658 B
- feat-index.md134 B
- tokenization.md330 B
- morphology.md661 B
- feat
- Person.md1 kB
- Number.md936 B
- introduction.md1 kB
- dep-index.md140 B
- pos
- NOUN.md329 B
- PROPN.md355 B
- VERB.md833 B
- ADV.md539 B
- ADJ.md400 B
- dep
- iobj.md1 kB
- ccomp.md1 kB
- nsubj.md1 kB
- punct.md2 kB
- flat.md1 kB
- det.md3 kB
- cc.md1 kB
- compound.md1 kB
- obj.md841 B
- acl.md1 kB
- nummod.md1 kB
- xcomp.md1 kB
- fixed.md1 kB
- csubj.md1 kB
- advcl.md1 kB
- nmod.md1 kB
- advmod.md962 B
- cop.md999 B
- vocative.md720 B
- aux_.md1 kB
- conj.md1 kB
- discourse.md910 B
- amod.md1 kB
- mark.md2 kB
- appos.md2 kB
- pos-index.md132 B
- events.md998 B
- _br
- index.md2 kB
- dep
- nmod-gen.md464 B
- nsubj-cop.md619 B
- _el
- index.md4 kB
- pos-index.md132 B
- dep-index.md140 B
- dep
- nsubj.md841 B
- advcl.md2 kB
- obj.md1 kB
- vocative.md693 B
- mark.md2 kB
- xcomp.md2 kB
- flat.md2 kB
- compound.md1004 B
- csubj.md793 B
- reparandum.md478 B
- amod.md1 kB
- nmod.md2 kB
- nummod.md513 B
- acl-relcl.md1 kB
- iobj.md3 kB
- nsubj-pass.md1 kB
- acl.md1 kB
- case.md2 kB
- punct.md3 kB
- advmod.md1 kB
- ccomp.md811 B
- parataxis.md1 kB
- goeswith.md394 B
- appos.md1 kB
- cc.md1 kB
- csubj-pass.md727 B
- fixed.md612 B
- det.md1 kB
- discourse.md536 B
- list.md927 B
- cop.md1 kB
- orphan.md803 B
- aux_.md1 kB
- root.md534 B
- expl.md593 B
- dislocated.md715 B
- conj.md2 kB
- specific-syntax.md2 kB
- introduction.md1 kB
- pos
- CCONJ.md813 B
- ADJ.md1 kB
- _pnt
- template-index.md1 kB
- _ko
- feat
- Form.md1 kB
- tokenization.md417 B
- introduction.md1 kB
- template-index.md1 kB
- feat
- _kab
- template-index.md1 kB
- _apu
- _th
- markdown-source
- ... too many files ...0 B
- Name
- ud-tools-v2.8.tgz
- Size
- 533.49 KB
- Format
- application/x-gzip
- Description
- Tools
- MD5
- 0fee55d28bc2b0698f17332ba7cccbb6
- ud-tools-v2.8
- check_text_wosp_match.sh814 B
- conll_convert_tags_to_uposf.pl1 kB
- conllu-sort-sentences-by-ids.pl1 kB
- check_sentence_ids.pl1 kB
- conllu-stats.py6 kB
- package_st_data.sh10 kB
- runtests.sh1 kB
- conllu-w2t.py2 kB
- file_util.pyc2 kB
- validate_repo_metadata.py4 kB
- example-data
- long-token-to-text-wrong.txt333 B
- long-token-to-text-correct.txt332 B
- long-token-to-text.conllu2 kB
- tanl.conll471 B
- conllu-copy-basic-to-enhanced.pl1 kB
- enhanced_classify_relations.pl26 kB
- evaluate_treebank.pl18 kB
- iwpt20_xud_eval.py36 kB
- package_ud_release.sh6 kB
- conllu-stats.pl107 kB
- conllu-dependency-stats.pl944 B
- check-space-after-paragraph.pl2 kB
- file_util.py2 kB
- conllu-quick-fix-id-sequence.pl2 kB
- conllu-formconvert.py3 kB
- find_duplicate_sentences.pl1 kB
- survey_misc.pl6 kB
- remove_duplicate_sentences.pl2 kB
- validate_all.sh943 B
- fix_format_of_deps.pl1 kB
- conllu_to_conllx.pl2 kB
- restore_conllu_lines.pl1 kB
- LICENSE.txt17 kB
- mwtoken-stats.pl1 kB
- Node.pm18 kB
- overlap.py2 kB
- collect_propn_sequences.pl3 kB
- survey_features.pl11 kB
- __pycache__
- file_util.cpython-37.pyc2 kB
- fix-space-after-paragraph.pl4 kB
- survey_deprel_subtypes.pl8 kB
- udlib.pm20 kB
- compat
- argparse.pyc65 kB
- argparse.py85 kB
- __init__.pyc140 B
- __init__.py0 B
- validate-python2-obsolete.py36 kB
- v2-conversion
- convert.py3 kB
- README.md2 kB
- processors_en.py1 kB
- processors_universal.py5 kB
- nmod_obl_adjudication.py3 kB
- depgraph_utils.py6 kB
- text_without_spaces.pl2 kB
- remove_sense_suffixes_from_lemmas.pl1 kB
- generate_comparison_of_treebanks.pl2 kB
- csort.pm7 kB
- enhanced_graph_properties.pl21 kB
- package_ud_release.sh~6 kB
- validate.py119 kB
- create_iso_639_3_symlinks.py175 kB
- conllu-quick-fix.pl20 kB
- test-cases
- nonvalid
- lowercase-postag.conllu141 B
- lowercase-feature-value-in-empty.conllu251 B
- empty-head.conllu114 B
- invalid-deps-id.conllu173 B
- misordered-feature.conllu243 B
- invalid-deps-syntax.conllu194 B
- missing-final-line.conllu155 B
- empty-field.conllu100 B
- head-not-0-deprel-root.conllu172 B
- empty-sentence.conllu163 B
- ambiguous-feature.conllu175 B
- trailing-tab.conllu127 B
- lowercase-postag-in-empty.conllu239 B
- multiple-sent_id.conllu736 B
- malformed_deps.conllu683 B
- head-0-deprel-not-root.conllu133 B
- lowercase-feature.conllu238 B
- head-not-empty-in-empty.conllu224 B
- duplicate-value.conllu137 B
- tanl-broken.conllu690 B
- misordered-layered-feature.conllu239 B
- whitespace_nonv.conllu274 B
- misplaced-comment-end.conllu429 B
- nonsequential-empty-node-id.conllu238 B
- dos-newlines.conllu698 B
- invalid-head.conllu164 B
- duplicate-layered-feature.conllu182 B
- cyclic-deps.conllu227 B
- id-with-extra-0.conllu140 B
- overlapping-multiword.conllu387 B
- duplicate-feature.conllu142 B
- token_with_cols_filled.conllu385 B
- self-cycle-deps.conllu164 B
- nonsequential-id.conllu176 B
- space-in-field.conllu127 B
- extra-empty-line.conllu287 B
- lowercase-feature-in-empty.conllu244 B
- non-proj.conllu109 B
- no-sent_id.conllu686 B
- misindexed-empty-node.conllu235 B
- id-starting-from-2.conllu247 B
- invalid-range.conllu375 B
- self-cycle-head.conllu190 B
- empty-node-without-dependent.conllu251 B
- uppercase-deps-deprel.conllu206 B
- multiword-with-pos.conllu407 B
- uppercase-deprel.conllu184 B
- invalid-deps-order.conllu409 B
- missing-space-after.conllu176 B
- extra-field.conllu130 B
- duplicate-id.conllu171 B
- invalid-range-format.conllu380 B
- deprel-not-empty-in-empty.conllu233 B
- misplaced-comment-mid.conllu401 B
- misordered-multiword.conllu392 B
- lowercase-value.conllu237 B
- valid
- maximal-empty-node.conllu273 B
- multiple-features.conllu295 B
- whitespace.conllu294 B
- id_test_part2.conllu375 B
- empty-nodes.conllu324 B
- id_test_part1.conllu375 B
- tanl.conllu673 B
- empty-file.conllu0 B
- minimal-empty-node.conllu239 B
- layered-features.conllu272 B
- nonvalid
- README.md11 kB
- conllu-remove-enhanced-deps.pl443 B
- conllu-tenfold.pl2 kB
- save_evaluation_logs.sh962 B
- mergept.pl2 kB
- normalize_unicode.pl511 B
- Graph.pm12 kB
- data
- deprel.shopen311 B
- edeprel.ta2 kB
- tokens_w_space.ud27 B
- edeprel.ar27 kB
- edeprel.akk22 B
- tokens_w_space.br457 B
- edeprel.sv4 kB
- tokens_w_space.koi86 B
- docdeps.json196 kB
- edeprel.pl21 kB
- tokens_w_space.kk1 kB
- tokens_w_space.nl158 B
- edeprel.sk3 kB
- cpos.ud79 B
- edeprel.cs28 kB
- edeprel.fr430 B
- edeprel.it3 kB
- edeprel.lv998 B
- edeprel.lt2 kB
- tokens_w_space.am82 B
- edeprel.ru12 kB
- deprels.json591 kB
- tokens_w_space.sv131 B
- edeprel.fi8 kB
- tokens_w_space.myv82 B
- tokens_w_space.mdf82 B
- tokens_w_space.pl366 B
- feats.json808 kB
- edeprel.uk5 kB
- tokens_w_space.akk246 B
- tokens_w_space.gun0 B
- tokens_w_space.vi3 B
- edeprel.ud4 B
- deprel.ud237 B
- data.json286 kB
- tokens_w_space.fro10 B
- tokens_w_space.kpv86 B
- edeprel.ojp6 B
- tokens_w_space.shopen9 B
- feat_val.shopen2 kB
- tokens_w_space.kmr277 B
- edeprel.et10 kB
- docfeats.json860 kB
- edeprel.en5 kB
- tokens_w_space.sms151 B
- tokens_w_space.fr10 B
- tokens_w_space.lv112 B
- tokens_w_space.lt1 kB
- edeprel.bg2 kB
- edeprel.be6 kB
- edeprel.nl6 kB
- tokens_w_space.apu123 B
- tokens_w_space.fi78 B
- edeprel.lzh76 B
- generate_treebank_hub.pl1 kB
- conllu_to_text.pl9 kB
- check_overlaps.pl1 kB
- survey_enhancements.pl7 kB
- conllu_align_tokens.pl6 kB
- check_files.pl64 kB
- enhanced_collapse_empty_nodes.pl8 kB
- klcpos3.pl1 kB