Files in this item

This item is
Publicly Available
and licensed under:
Licence Universal Dependencies v2.2
GNU General Public License, version 3.0 Distributed under Creative Commons
Icon
Name
ud-2.2-conll18-baseline-models.tar.xz
Size
1.2 GB
Format
application/x-xz
Description
Baseline UDPipe models for CoNLL 2018 Shared Task in UD Parsing.
MD5
9db1c4e4eacb0ee5dcb259487c721a42
 Download file  Preview
 File Preview  
  • training
    • params_tagger33 kB
    • params_parser25 kB
    • README.txt1 kB
    • embeddings
      • ga_idt.skip.forms.50.vectors485 kB
      • sr_set.skip.forms.50.vectors2 MB
      • ru_taiga.skip.forms.50.vectors364 kB
      • nl_alpino.skip.forms.50.vectors4 MB
      • hsb_ufal.skip.forms.50.vectors17 kB
      • ar_padt.skip.forms.50.vectors5 MB
      • mix.skip.forms.50.vectors10 MB
      • gl_ctg.skip.forms.50.vectors2 MB
      • sv_talbanken.skip.forms.50.vectors2 MB
      • sme_giella.skip.forms.50.vectors703 kB
      • ja_gsd.skip.forms.50.vectors4 MB
      • grc_proiel.skip.forms.50.vectors5 MB
      • pl_sz.skip.forms.50.vectors2 MB
      • fi_tdt.skip.forms.50.vectors6 MB
      • no_nynorsklia.skip.forms.50.vectors122 kB
      • fi_ftb.skip.forms.50.vectors4 MB
      • nl_lassysmall.skip.forms.50.vectors2 MB
      • de_gsd.skip.forms.50.vectors7 MB
      • gen.sh346 B
      • sl_ssj.skip.forms.50.vectors4 MB
      • la_ittb.skip.forms.50.vectors3 MB
      • es_ancora.skip.forms.50.vectors8 MB
      • sl_sst.skip.forms.50.vectors603 kB
      • ca_ancora.skip.forms.50.vectors7 MB
      • fr_gsd.skip.forms.50.vectors7 MB
      • fa_seraji.skip.forms.50.vectors3 MB
      • grc_perseus.skip.forms.50.vectors5 MB
      • got_proiel.skip.forms.50.vectors1 MB
      • uk_iu.skip.forms.50.vectors3 MB
      • pl_lfg.skip.forms.50.vectors3 MB
      • la_proiel.skip.forms.50.vectors5 MB
      • gl_treegal.skip.forms.50.vectors566 kB
      • ur_udtb.skip.forms.50.vectors2 MB
      • sv_lines.skip.forms.50.vectors1 MB
      • eu_bdt.skip.forms.50.vectors3 MB
      • cs_cac.skip.forms.50.vectors13 MB
      • bg_btb.skip.forms.50.vectors4 MB
      • ko_kaist.skip.forms.50.vectors12 MB
      • la_perseus.skip.forms.50.vectors809 kB
      • fro_srcmf.skip.forms.50.vectors3 MB
      • ro_rrt.skip.forms.50.vectors5 MB
      • zh_gsd.skip.forms.50.vectors3 MB
      • hu_szeged.skip.forms.50.vectors897 kB
      • cs_fictree.skip.forms.50.vectors4 MB
      • af_afribooms.skip.forms.50.vectors1 MB
      • vi_vtb.skip.forms.50.vectors826 kB
      • pt_bosque.skip.forms.50.vectors5 MB
      • sk_snk.skip.forms.50.vectors3 MB
      • ko_gsd.skip.forms.50.vectors2 MB
      • tr_imst.skip.forms.50.vectors1 MB
      • hy_armtdp.skip.forms.50.vectors28 kB
      • en_lines.skip.forms.50.vectors1 MB
      • it_postwita.skip.forms.50.vectors2 MB
      • cs_pdt.skip.forms.50.vectors27 MB
      • id_gsd.skip.forms.50.vectors3 MB
      • no_bokmaal.skip.forms.50.vectors5 MB
      • he_htb.skip.forms.50.vectors3 MB
      • bxr_bdt.skip.forms.50.vectors7 kB
      • ug_udt.skip.forms.50.vectors1007 kB
      • en_ewt.skip.forms.50.vectors4 MB
      • el_gdt.skip.forms.50.vectors1 MB
      • cu_proiel.skip.forms.50.vectors1 MB
      • it_isdt.skip.forms.50.vectors6 MB
      • ru_syntagrus.skip.forms.50.vectors22 MB
      • lv_lvtb.skip.forms.50.vectors3 MB
      • en_gum.skip.forms.50.vectors1 MB
      • hr_set.skip.forms.50.vectors5 MB
      • kmr_mg.skip.forms.50.vectors14 kB
      • no_nynorsk.skip.forms.50.vectors5 MB
      • fr_sequoia.skip.forms.50.vectors1 MB
      • fr_spoken.skip.forms.50.vectors510 kB
      • hi_hdtb.skip.forms.50.vectors4 MB
      • et_edt.skip.forms.50.vectors10 MB
      • kk_ktb.skip.forms.50.vectors26 kB
      • da_ddt.skip.forms.50.vectors2 MB
    • params_tokenizer8 kB
    • training_data
      • nl_alpino
        • nl_alpino-ud-train.conllu13 MB
        • nl_alpino-ud-dev.txt62 kB
        • nl_alpino-ud-train.txt1017 kB
        • nl_alpino-ud-dev.conllu882 kB
      • fro_srcmf
        • fro_srcmf-ud-dev.conllu896 kB
        • fro_srcmf-ud-dev.txt87 kB
        • fro_srcmf-ud-train.txt681 kB
        • fro_srcmf-ud-train.conllu6 MB
      • fi_ftb
        • fi_ftb-ud-dev.txt111 kB
        • fi_ftb-ud-train.txt904 kB
        • fi_ftb-ud-train.conllu9 MB
        • fi_ftb-ud-dev.conllu1 MB
      • he_htb
        • he_htb-ud-dev.txt71 kB
        • he_htb-ud-train.conllu9 MB
        • he_htb-ud-train.txt833 kB
        • he_htb-ud-dev.conllu838 kB
      • vi_vtb
        • vi_vtb-ud-dev.conllu522 kB
        • vi_vtb-ud-train.conllu939 kB
        • vi_vtb-ud-train.txt127 kB
        • vi_vtb-ud-dev.txt69 kB
      • uk_iu
        • uk_iu-ud-train.txt739 kB
        • uk_iu-ud-dev.txt106 kB
        • uk_iu-ud-dev.conllu995 kB
        • uk_iu-ud-train.conllu6 MB
      • fi_tdt
        • fi_tdt-ud-train.conllu11 MB
        • fi_tdt-ud-dev.txt136 kB
        • fi_tdt-ud-train.txt1 MB
        • fi_tdt-ud-dev.conllu1 MB
      • pl_lfg
        • pl_lfg-ud-dev.txt74 kB
        • pl_lfg-ud-train.txt596 kB
        • pl_lfg-ud-train.conllu11 MB
        • pl_lfg-ud-dev.conllu1 MB
      • ga_idt
        • ga_idt-ud-train.conllu792 kB
        • ga_idt-ud-dev.conllu90 kB
        • ga_idt-ud-train.txt64 kB
        • ga_idt-ud-dev.txt7 kB
      • hi_hdtb
        • hi_hdtb-ud-dev.txt427 kB
        • hi_hdtb-ud-train.conllu39 MB
        • hi_hdtb-ud-train.txt3 MB
        • hi_hdtb-ud-dev.conllu4 MB
      • no_nynorsk
        • no_nynorsk-ud-train.conllu14 MB
        • no_nynorsk-ud-train.txt1 MB
        • no_nynorsk-ud-dev.txt166 kB
        • no_nynorsk-ud-dev.conllu1 MB
      • sl_sst
        • sl_sst-ud-dev.txt11 kB
        • sl_sst-ud-train.conllu1 MB
        • sl_sst-ud-train.txt91 kB
        • sl_sst-ud-dev.conllu191 kB
      • tr_imst
        • tr_imst-ud-dev.conllu787 kB
        • tr_imst-ud-train.txt246 kB
        • tr_imst-ud-train.conllu2 MB
        • tr_imst-ud-dev.txt63 kB
      • fa_seraji
        • fa_seraji-ud-train.txt995 kB
        • fa_seraji-ud-dev.conllu989 kB
        • fa_seraji-ud-dev.txt133 kB
        • fa_seraji-ud-train.conllu7 MB
      • sk_snk
        • sk_snk-ud-train.txt447 kB
        • sk_snk-ud-train.conllu6 MB
        • sk_snk-ud-dev.conllu1 MB
        • sk_snk-ud-dev.txt77 kB
      • sl_ssj
        • sl_ssj-ud-train.txt617 kB
        • sl_ssj-ud-dev.conllu1 MB
        • sl_ssj-ud-dev.txt79 kB
        • sl_ssj-ud-train.conllu9 MB
      • grc_perseus
        • grc_perseus-ud-train.conllu14 MB
        • grc_perseus-ud-dev.txt250 kB
        • grc_perseus-ud-train.txt1 MB
        • grc_perseus-ud-dev.conllu1 MB
      • sv_talbanken
        • sv_talbanken-ud-train.conllu5 MB
        • sv_talbanken-ud-train.txt402 kB
        • sv_talbanken-ud-dev.txt58 kB
        • sv_talbanken-ud-dev.conllu834 kB
      • got_proiel
        • got_proiel-ud-dev.txt62 kB
        • got_proiel-ud-train.conllu3 MB
        • got_proiel-ud-dev.conllu928 kB
        • got_proiel-ud-train.txt221 kB
      • eu_bdt
        • eu_bdt-ud-train.txt459 kB
        • eu_bdt-ud-dev.conllu1 MB
        • eu_bdt-ud-train.conllu4 MB
        • eu_bdt-ud-dev.txt151 kB
      • bxr_bdt
        • bxr_bdt-ud-dev.conllu1 kB
        • bxr_bdt-ud-train.conllu9 kB
        • bxr_bdt-ud-train.txt1 kB
        • bxr_bdt-ud-dev.txt192 B
      • ru_taiga
        • ru_taiga-ud-dev.txt13 kB
        • ru_taiga-ud-dev.conllu113 kB
        • ru_taiga-ud-train.txt82 kB
        • ru_taiga-ud-train.conllu712 kB
      • ca_ancora
        • ca_ancora-ud-train.conllu26 MB
        • ca_ancora-ud-dev.conllu3 MB
        • ca_ancora-ud-dev.txt289 kB
        • ca_ancora-ud-train.txt2 MB
      • hy_armtdp
        • hy_armtdp-ud-dev.txt1 kB
        • hy_armtdp-ud-dev.conllu10 kB
        • hy_armtdp-ud-train.txt7 kB
        • hy_armtdp-ud-train.conllu67 kB
      • en_lines
        • en_lines-ud-train.txt239 kB
        • en_lines-ud-dev.txt82 kB
        • en_lines-ud-dev.conllu954 kB
        • en_lines-ud-train.conllu2 MB
      • kk_ktb
        • kk_ktb-ud-dev.conllu6 kB
        • kk_ktb-ud-train.conllu33 kB
        • kk_ktb-ud-train.txt4 kB
        • kk_ktb-ud-dev.txt995 B
      • ja_gsd
        • ja_gsd-ud-dev.conllu612 kB
        • ja_gsd-ud-dev.txt57 kB
        • ja_gsd-ud-train.txt802 kB
        • ja_gsd-ud-train.conllu8 MB
      • conllu_to_text.pl8 kB
      • sr_set
        • sr_set-ud-dev.txt58 kB
        • sr_set-ud-train.txt384 kB
        • sr_set-ud-train.conllu4 MB
        • sr_set-ud-dev.conllu677 kB
      • et_edt
        • et_edt-ud-dev.conllu2 MB
        • et_edt-ud-dev.txt237 kB
        • et_edt-ud-train.txt1 MB
        • et_edt-ud-train.conllu18 MB
      • sv_lines
        • sv_lines-ud-dev.txt91 kB
        • sv_lines-ud-train.txt265 kB
        • sv_lines-ud-train.conllu3 MB
        • sv_lines-ud-dev.conllu1 MB
      • it_postwita
        • it_postwita-ud-train.conllu5 MB
        • it_postwita-ud-train.txt541 kB
        • it_postwita-ud-dev.conllu754 kB
        • it_postwita-ud-dev.txt66 kB
      • en_ewt
        • en_ewt-ud-train.txt985 kB
        • en_ewt-ud-dev.txt123 kB
        • en_ewt-ud-dev.conllu1 MB
        • en_ewt-ud-train.conllu12 MB
      • get.sh780 B
      • la_perseus
        • la_perseus-ud-train.conllu1 MB
        • la_perseus-ud-dev.txt10 kB
        • la_perseus-ud-dev.conllu157 kB
        • la_perseus-ud-train.txt94 kB
      • pl_sz
        • pl_sz-ud-train.conllu5 MB
        • pl_sz-ud-train.txt383 kB
        • pl_sz-ud-dev.conllu942 kB
        • pl_sz-ud-dev.txt62 kB
      • fr_spoken
        • fr_spoken-ud-dev.txt50 kB
        • fr_spoken-ud-dev.conllu413 kB
        • fr_spoken-ud-train.conllu615 kB
        • fr_spoken-ud-train.txt77 kB
      • af_afribooms
        • af_afribooms-ud-dev.conllu321 kB
        • af_afribooms-ud-train.txt195 kB
        • af_afribooms-ud-dev.txt30 kB
        • af_afribooms-ud-train.conllu2 MB
      • fr_gsd
        • fr_gsd-ud-train.txt1 MB
        • fr_gsd-ud-dev.conllu2 MB
        • fr_gsd-ud-dev.txt184 kB
        • fr_gsd-ud-train.conllu21 MB
      • zh_gsd
        • zh_gsd-ud-train.conllu5 MB
        • zh_gsd-ud-dev.txt53 kB
        • zh_gsd-ud-dev.conllu673 kB
        • zh_gsd-ud-train.txt411 kB
      • nl_lassysmall
        • nl_lassysmall-ud-dev.conllu837 kB
        • nl_lassysmall-ud-train.conllu5 MB
        • nl_lassysmall-ud-train.txt419 kB
        • nl_lassysmall-ud-dev.txt61 kB
      • gl_treegal
        • gl_treegal-ud-dev.txt7 kB
        • gl_treegal-ud-train.conllu931 kB
        • gl_treegal-ud-train.txt69 kB
        • gl_treegal-ud-dev.conllu98 kB
      • sme_giella
        • sme_giella-ud-dev.txt17 kB
        • sme_giella-ud-dev.conllu172 kB
        • sme_giella-ud-train.txt89 kB
        • sme_giella-ud-train.conllu978 kB
      • la_proiel
        • la_proiel-ud-dev.conllu1 MB
        • la_proiel-ud-train.conllu15 MB
        • la_proiel-ud-dev.txt87 kB
        • la_proiel-ud-train.txt1 MB
      • id_gsd
        • id_gsd-ud-dev.conllu956 kB
        • id_gsd-ud-dev.txt74 kB
        • id_gsd-ud-train.conllu7 MB
        • id_gsd-ud-train.txt575 kB
      • es_ancora
        • es_ancora-ud-dev.conllu3 MB
        • es_ancora-ud-dev.txt275 kB
        • es_ancora-ud-train.txt2 MB
        • es_ancora-ud-train.conllu28 MB
      • hr_set
        • hr_set-ud-dev.conllu1 MB
        • hr_set-ud-train.txt904 kB
        • hr_set-ud-dev.txt115 kB
        • hr_set-ud-train.conllu10 MB
      • de_gsd
        • de_gsd-ud-dev.txt72 kB
        • de_gsd-ud-train.conllu18 MB
        • de_gsd-ud-train.txt1 MB
        • de_gsd-ud-dev.conllu862 kB
      • ur_udtb
        • ur_udtb-ud-dev.conllu1 MB
        • ur_udtb-ud-train.conllu11 MB
        • ur_udtb-ud-train.txt853 kB
        • ur_udtb-ud-dev.txt115 kB
      • ar_padt
        • ar_padt-ud-dev.conllu5 MB
        • ar_padt-ud-train.txt1 MB
        • ar_padt-ud-dev.txt241 kB
        • ar_padt-ud-train.conllu38 MB
      • ro_rrt
        • ro_rrt-ud-train.txt1 MB
        • ro_rrt-ud-dev.txt98 kB
        • ro_rrt-ud-dev.conllu1 MB
        • ro_rrt-ud-train.conllu13 MB
      • cu_proiel
        • cu_proiel-ud-train.conllu3 MB
        • cu_proiel-ud-dev.conllu1 MB
        • cu_proiel-ud-train.txt369 kB
        • cu_proiel-ud-dev.txt97 kB
      • cs_fictree
        • cs_fictree-ud-dev.conllu1 MB
        • cs_fictree-ud-train.conllu13 MB
        • cs_fictree-ud-dev.txt86 kB
        • cs_fictree-ud-train.txt696 kB
      • mix.sh618 B
      • fr_sequoia
        • fr_sequoia-ud-train.txt267 kB
        • fr_sequoia-ud-train.conllu3 MB
        • fr_sequoia-ud-dev.txt52 kB
        • fr_sequoia-ud-dev.conllu614 kB
      • ko_kaist
        • ko_kaist-ud-dev.txt235 kB
        • ko_kaist-ud-dev.conllu1 MB
        • ko_kaist-ud-train.conllu17 MB
        • ko_kaist-ud-train.txt2 MB
      • en_gum
        • en_gum-ud-dev.txt65 kB
        • en_gum-ud-dev.conllu734 kB
        • en_gum-ud-train.txt267 kB
        • en_gum-ud-train.conllu2 MB
      • no_bokmaal
        • no_bokmaal-ud-train.conllu14 MB
        • no_bokmaal-ud-dev.txt195 kB
        • no_bokmaal-ud-dev.conllu2 MB
        • no_bokmaal-ud-train.txt1 MB
      • gl_ctg
        • gl_ctg-ud-dev.conllu1 MB
        • gl_ctg-ud-dev.txt155 kB
        • gl_ctg-ud-train.conllu4 MB
        • gl_ctg-ud-train.txt413 kB
      • la_ittb
        • la_ittb-ud-dev.conllu949 kB
        • la_ittb-ud-train.txt1 MB
        • la_ittb-ud-train.conllu23 MB
        • la_ittb-ud-dev.txt59 kB
      • ru_syntagrus
        • ru_syntagrus-ud-dev.conllu10 MB
        • ru_syntagrus-ud-train.txt9 MB
        • ru_syntagrus-ud-train.conllu77 MB
        • ru_syntagrus-ud-dev.txt1 MB
      • hu_szeged
        • hu_szeged-ud-dev.conllu983 kB
        • hu_szeged-ud-train.conllu1 MB
        • hu_szeged-ud-dev.txt83 kB
        • hu_szeged-ud-train.txt137 kB
      • it_isdt
        • it_isdt-ud-dev.conllu737 kB
        • it_isdt-ud-dev.txt59 kB
        • it_isdt-ud-train.conllu16 MB
        • it_isdt-ud-train.txt1 MB
      • el_gdt
        • el_gdt-ud-dev.conllu932 kB
        • el_gdt-ud-train.conllu3 MB
        • el_gdt-ud-train.txt440 kB
        • el_gdt-ud-dev.txt107 kB
      • grc_proiel
        • grc_proiel-ud-dev.conllu1 MB
        • grc_proiel-ud-train.conllu19 MB
        • grc_proiel-ud-train.txt2 MB
        • grc_proiel-ud-dev.txt159 kB
      • da_ddt
        • da_ddt-ud-train.conllu4 MB
        • da_ddt-ud-dev.conllu643 kB
        • da_ddt-ud-train.txt423 kB
        • da_ddt-ud-dev.txt54 kB
      • ug_udt
        • ug_udt-ud-train.conllu1 MB
        • ug_udt-ud-dev.txt119 kB
        • ug_udt-ud-train.txt219 kB
        • ug_udt-ud-dev.conllu886 kB
      • ko_gsd
        • ko_gsd-ud-train.txt485 kB
        • ko_gsd-ud-train.conllu3 MB
        • ko_gsd-ud-dev.conllu709 kB
        • ko_gsd-ud-dev.txt103 kB
      • cs_cac
        • cs_cac-ud-dev.txt72 kB
        • cs_cac-ud-dev.conllu1 MB
        • cs_cac-ud-train.conllu50 MB
        • cs_cac-ud-train.txt2 MB
      • cs_pdt
        • cs_pdt-ud-train.txt7 MB
        • cs_pdt-ud-dev.txt989 kB
        • cs_pdt-ud-train.conllu125 MB
        • cs_pdt-ud-dev.conllu17 MB
      • mix
        • mix-ud-train.conllu17 MB
        • mix-ud-dev.conllu2 MB
        • mix-ud-dev.txt181 kB
        • mix-ud-train.txt1 MB
      • conllu_split.pl993 B
      • kmr_mg
        • kmr_mg-ud-dev.conllu919 B
        • kmr_mg-ud-train.conllu16 kB
        • kmr_mg-ud-dev.txt52 B
        • kmr_mg-ud-train.txt1 kB
      • hsb_ufal
        • hsb_ufal-ud-dev.txt452 B
        • hsb_ufal-ud-train.conllu26 kB
        • hsb_ufal-ud-dev.conllu5 kB
        • hsb_ufal-ud-train.txt2 kB
      • bg_btb
        • bg_btb-ud-dev.txt155 kB
        • bg_btb-ud-dev.conllu1 MB
        • bg_btb-ud-train.txt1 MB
        • bg_btb-ud-train.conllu10 MB
      • iso_names.txt1 kB
      • lv_lvtb
        • lv_lvtb-ud-train.txt499 kB
        • lv_lvtb-ud-dev.txt86 kB
        • lv_lvtb-ud-train.conllu8 MB
        • lv_lvtb-ud-dev.conllu1 MB
      • no_nynorsklia
        • no_nynorsklia-ud-train.txt12 kB
        • no_nynorsklia-ud-dev.conllu34 kB
        • no_nynorsklia-ud-train.conllu166 kB
        • no_nynorsklia-ud-dev.txt2 kB
      • pt_bosque
        • pt_bosque-ud-train.conllu13 MB
        • pt_bosque-ud-train.txt1020 kB
        • pt_bosque-ud-dev.txt52 kB
        • pt_bosque-ud-dev.conllu717 kB
  • models
    • arabic-padt-ud-2.2-conll18-180430.udpipe18 MB
    • latin-perseus-ud-2.2-conll18-180430.udpipe4 MB
    • spanish-ancora-ud-2.2-conll18-180430.udpipe20 MB
    • czech-fictree-ud-2.2-conll18-180430.udpipe15 MB
    • old_church_slavonic-proiel-ud-2.2-conll18-180430.udpipe6 MB
    • kazakh-ktb-ud-2.2-conll18-180430.udpipe1 MB
    • italian-postwita-ud-2.2-conll18-180430.udpipe11 MB
    • greek-gdt-ud-2.2-conll18-180430.udpipe6 MB
    • hungarian-szeged-ud-2.2-conll18-180430.udpipe5 MB
    • swedish-talbanken-ud-2.2-conll18-180430.udpipe8 MB
    • polish-lfg-ud-2.2-conll18-180430.udpipe15 MB
    • czech-pdt-ud-2.2-conll18-180430.udpipe53 MB
    • kurmanji-mg-ud-2.2-conll18-180430.udpipe1 MB
    • swedish-lines-ud-2.2-conll18-180430.udpipe6 MB
    • norwegian-nynorsk-ud-2.2-conll18-180430.udpipe16 MB
    • ancient_greek-perseus-ud-2.2-conll18-180430.udpipe17 MB
    • latin-ittb-ud-2.2-conll18-180430.udpipe17 MB
    • upper_sorbian-ufal-ud-2.2-conll18-180430.udpipe1 MB
    • croatian-set-ud-2.2-conll18-180430.udpipe19 MB
    • english-gum-ud-2.2-conll18-180430.udpipe6 MB
    • polish-sz-ud-2.2-conll18-180430.udpipe11 MB
    • north_sami-giella-ud-2.2-conll18-180430.udpipe4 MB
    • estonian-edt-ud-2.2-conll18-180430.udpipe30 MB
    • indonesian-gsd-ud-2.2-conll18-180430.udpipe13 MB
    • vietnamese-vtb-ud-2.2-conll18-180430.udpipe4 MB
    • gothic-proiel-ud-2.2-conll18-180430.udpipe6 MB
    • english-ewt-ud-2.2-conll18-180430.udpipe16 MB
    • bulgarian-btb-ud-2.2-conll18-180430.udpipe14 MB
    • old_french-srcmf-ud-2.2-conll18-180430.udpipe10 MB
    • persian-seraji-ud-2.2-conll18-180430.udpipe10 MB
    • norwegian-nynorsklia-ud-2.2-conll18-180430.udpipe1 MB
    • japanese-gsd-ud-2.2-conll18-180430.udpipe11 MB
    • portuguese-bosque-ud-2.2-conll18-180430.udpipe16 MB
    • russian-taiga-ud-2.2-conll18-180430.udpipe3 MB
    • uyghur-udt-ud-2.2-conll18-180430.udpipe5 MB
    • urdu-udtb-ud-2.2-conll18-180430.udpipe15 MB
    • english-lines-ud-2.2-conll18-180430.udpipe6 MB
    • french-sequoia-ud-2.2-conll18-180430.udpipe5 MB
    • slovak-snk-ud-2.2-conll18-180430.udpipe13 MB
    • irish-idt-ud-2.2-conll18-180430.udpipe4 MB
    • norwegian-bokmaal-ud-2.2-conll18-180430.udpipe17 MB
    • turkish-imst-ud-2.2-conll18-180430.udpipe8 MB
    • galician-treegal-ud-2.2-conll18-180430.udpipe3 MB
    • czech-cac-ud-2.2-conll18-180430.udpipe27 MB
    • basque-bdt-ud-2.2-conll18-180430.udpipe12 MB
    • ukrainian-iu-ud-2.2-conll18-180430.udpipe14 MB
    • slovenian-sst-ud-2.2-conll18-180430.udpipe4 MB
    • latin-proiel-ud-2.2-conll18-180430.udpipe22 MB
    • latvian-lvtb-ud-2.2-conll18-180430.udpipe14 MB
    • hindi-hdtb-ud-2.2-conll18-180430.udpipe20 MB
    • finnish-tdt-ud-2.2-conll18-180430.udpipe21 MB
    • finnish-ftb-ud-2.2-conll18-180430.udpipe19 MB
    • italian-isdt-ud-2.2-conll18-180430.udpipe16 MB
    • danish-ddt-ud-2.2-conll18-180430.udpipe9 MB
    • romanian-rrt-ud-2.2-conll18-180430.udpipe14 MB
    • catalan-ancora-ud-2.2-conll18-180430.udpipe18 MB
    • mixed-ud-ud-2.2-conll18-180430.udpipe47 MB
    • serbian-set-ud-2.2-conll18-180430.udpipe8 MB
    • dutch-alpino-ud-2.2-conll18-180430.udpipe15 MB
    • afrikaans-afribooms-ud-2.2-conll18-180430.udpipe4 MB
    • armenian-armtdp-ud-2.2-conll18-180430.udpipe1 MB
    • chinese-gsd-ud-2.2-conll18-180430.udpipe13 MB
    • buryat-bdt-ud-2.2-conll18-180430.udpipe1 MB
    • hebrew-htb-ud-2.2-conll18-180430.udpipe14 MB
    • dutch-lassysmall-ud-2.2-conll18-180430.udpipe8 MB
    • galician-ctg-ud-2.2-conll18-180430.udpipe7 MB
    • korean-kaist-ud-2.2-conll18-180430.udpipe39 MB
    • korean-gsd-ud-2.2-conll18-180430.udpipe15 MB
    • french-gsd-ud-2.2-conll18-180430.udpipe20 MB
    • russian-syntagrus-ud-2.2-conll18-180430.udpipe42 MB
    • ancient_greek-proiel-ud-2.2-conll18-180430.udpipe21 MB
    • slovenian-ssj-ud-2.2-conll18-180430.udpipe16 MB
    • german-gsd-ud-2.2-conll18-180430.udpipe23 MB
    • french-spoken-ud-2.2-conll18-180430.udpipe2 MB
    • README.txt31 kB
    • conll18_ud_eval.py26 kB
Icon
Name
ud-2.2-conll18-crossfold-morphology.tar.xz
Size
95.25 MB
Format
application/x-xz
Description
UD 2.2 CoNLL 2018 training data with automatically predicted morphology by UDPipe.
MD5
2576d55fcaab880f9f03e2f5d8eea5c9
 Download file  Preview
 File Preview  
  • UD_English-PUD
    • README.md6 kB
    • LICENSE.txt19 kB
  • UD_Finnish-PUD
    • README.txt2 kB
    • LICENSE.txt202 B
  • UD_Swedish-Talbanken
    • sv_talbanken-ud-train.conllu5 MB
    • EVALUATION.txt1 kB
    • README.md7 kB
    • LICENSE.txt20 kB
    • sv_talbanken-ud-dev.conllu835 kB
  • UD_Romanian-RRT
    • EVALUATION.txt1 kB
    • README.md3 kB
    • LICENSE.txt66 B
    • ro_rrt-ud-dev.conllu1 MB
    • ro_rrt-ud-train.conllu13 MB
  • UD_Gothic-PROIEL
    • EVALUATION.txt1 kB
    • README.md2 kB
    • got_proiel-ud-train.conllu3 MB
    • LICENSE.txt279 B
    • got_proiel-ud-dev.conllu926 kB
  • UD_Czech-PUD
    • README.md2 kB
    • LICENSE.txt202 B
  • UD_French-Sequoia
    • EVALUATION.txt1 kB
    • README.md3 kB
    • fr_sequoia-ud-train.conllu3 MB
    • LICENSE.txt4 kB
    • fr_sequoia-ud-dev.conllu614 kB
  • UD_Swedish-LinES
    • EVALUATION.txt1 kB
    • README.txt6 kB
    • sv_lines-ud-train.conllu3 MB
    • sv_lines-ud-dev.conllu1 MB
    • LICENSE.txt18 kB
  • UD_German-GSD
    • EVALUATION.txt1 kB
    • README.md12 kB
    • LICENSE.txt17 kB
    • de_gsd-ud-train.conllu18 MB
    • de_gsd-ud-dev.conllu871 kB
  • UD_Old_French-SRCMF
    • EVALUATION.txt1 kB
    • README.md7 kB
    • fro_srcmf-ud-dev.conllu896 kB
    • LICENSE.txt202 B
    • fro_srcmf-ud-train.conllu6 MB
  • UD_English-LinES
    • EVALUATION.txt1 kB
    • README.txt6 kB
    • en_lines-ud-dev.conllu954 kB
    • en_lines-ud-train.conllu2 MB
    • LICENSE.txt18 kB
  • UD_Buryat-BDT
    • EVALUATION.txt880 B
    • README.txt1 kB
    • bxr_bdt-ud-train.conllu10 kB
    • LICENSE.txt202 B
  • UD_Slovenian-SST
    • EVALUATION.txt879 B
    • README.txt4 kB
    • sl_sst-ud-train.conllu1 MB
    • LICENSE.txt441 B
  • UD_Latin-PROIEL
    • EVALUATION.txt1 kB
    • README.md2 kB
    • la_proiel-ud-dev.conllu1 MB
    • la_proiel-ud-train.conllu15 MB
    • LICENSE.txt279 B
  • UD_Turkish-IMST
    • tr_imst-ud-dev.conllu785 kB
    • EVALUATION.txt1 kB
    • README.txt1 kB
    • tr_imst-ud-train.conllu2 MB
    • LICENSE.txt20 kB
  • UD_Norwegian-Bokmaal
    • no_bokmaal-ud-train.conllu14 MB
    • EVALUATION.txt1 kB
    • README.md6 kB
    • no_bokmaal-ud-dev.conllu2 MB
    • LICENSE.txt68 B
  • UD_Galician-CTG
    • EVALUATION.txt1 kB
    • README.txt2 kB
    • gl_ctg-ud-dev.conllu1 MB
    • LICENSE.txt173 B
    • gl_ctg-ud-train.conllu4 MB
  • UD_Slovenian-SSJ
    • EVALUATION.txt1 kB
    • sl_ssj-ud-dev.conllu1 MB
    • README.txt4 kB
    • LICENSE.txt543 B
    • sl_ssj-ud-train.conllu9 MB
  • UD_Russian-SynTagRus
    • ru_syntagrus-ud-dev.conllu10 MB
    • EVALUATION.txt1 kB
    • README.txt3 kB
    • ru_syntagrus-ud-train.conllu77 MB
    • LICENSE.txt188 B
  • UD_English-GUM
    • EVALUATION.txt1 kB
    • README.md3 kB
    • en_gum-ud-dev.conllu734 kB
    • LICENSE.txt1 kB
    • en_gum-ud-train.conllu2 MB
  • UD_Indonesian-GSD
    • id_gsd-ud-dev.conllu957 kB
    • EVALUATION.txt1 kB
    • README.md8 kB
    • id_gsd-ud-train.conllu7 MB
    • LICENSE.txt17 kB
  • UD_Korean-GSD
    • EVALUATION.txt1 kB
    • README.md1 kB
    • ko_gsd-ud-dev.conllu703 kB
    • ko_gsd-ud-train.conllu3 MB
    • LICENSE.txt15 kB
  • UD_Ancient_Greek-Perseus
    • grc_perseus-ud-train.conllu14 MB
    • EVALUATION.txt1 kB
    • README.md3 kB
    • grc_perseus-ud-dev.conllu1 MB
    • LICENSE.txt279 B
  • UD_Hindi-HDTB
    • EVALUATION.txt1 kB
    • README.md2 kB
    • hi_hdtb-ud-train.conllu39 MB
    • LICENSE.txt249 B
    • hi_hdtb-ud-dev.conllu4 MB
  • UD_Polish-LFG
    • EVALUATION.txt1 kB
    • pl_lfg-ud-train.conllu11 MB
    • README.md6 kB
    • pl_lfg-ud-dev.conllu1 MB
    • LICENSE.txt34 kB
  • UD_French-Spoken
    • EVALUATION.txt1 kB
    • README.txt469 B
    • LICENSE.txt202 B
    • fr_spoken-ud-dev.conllu410 kB
    • fr_spoken-ud-train.conllu614 kB
  • UD_Hungarian-Szeged
    • hu_szeged-ud-dev.conllu1 MB
    • EVALUATION.txt1 kB
    • README.txt3 kB
    • hu_szeged-ud-train.conllu1 MB
    • LICENSE.txt30 B
  • UD_Dutch-Alpino
    • nl_alpino-ud-train.conllu13 MB
    • EVALUATION.txt1 kB
    • README.txt5 kB
    • LICENSE.txt19 kB
    • nl_alpino-ud-dev.conllu880 kB
  • UD_Urdu-UDTB
    • ur_udtb-ud-dev.conllu1 MB
    • EVALUATION.txt1 kB
    • README.md2 kB
    • ur_udtb-ud-train.conllu11 MB
    • LICENSE.txt247 B
  • UD_Estonian-EDT
    • et_edt-ud-dev.conllu2 MB
    • EVALUATION.txt1 kB
    • README.md3 kB
    • LICENSE.txt279 B
    • et_edt-ud-train.conllu18 MB
  • UD_Polish-SZ
    • pl_sz-ud-train.conllu5 MB
    • EVALUATION.txt1 kB
    • README.md2 kB
    • pl_sz-ud-dev.conllu941 kB
    • LICENSE.txt68 B
  • UD_Finnish-FTB
    • EVALUATION.txt1 kB
    • fi_ftb-ud-train.conllu9 MB
    • README.txt2 kB
    • LICENSE.txt1 kB
    • fi_ftb-ud-dev.conllu1 MB
  • UD_Galician-TreeGal
    • EVALUATION.txt883 B
    • README.md5 kB
    • gl_treegal-ud-train.conllu1 MB
    • LICENSE.txt14 kB
  • UD_Thai-PUD
    • README.md5 kB
    • LICENSE.txt19 kB
  • UD_Latin-Perseus
    • EVALUATION.txt883 B
    • la_perseus-ud-train.conllu1 MB
    • README.md3 kB
    • LICENSE.txt279 B
  • UD_Czech-FicTree
    • cs_fictree-ud-dev.conllu1 MB
    • EVALUATION.txt1 kB
    • README.md2 kB
    • cs_fictree-ud-train.conllu13 MB
    • LICENSE.txt219 B
  • UD_Latvian-LVTB
    • EVALUATION.txt1 kB
    • README.md4 kB
    • lv_lvtb-ud-train.conllu8 MB
    • LICENSE.txt20 kB
    • lv_lvtb-ud-dev.conllu1 MB
  • UD_Italian-PoSTWITA
    • EVALUATION.txt1 kB
    • README.md3 kB
    • it_postwita-ud-train.conllu5 MB
    • LICENSE.txt18 kB
    • it_postwita-ud-dev.conllu755 kB
  • UD_Breton-KEB
    • README.md1 kB
    • LICENSE.txt202 B
  • UD_Finnish-TDT
    • EVALUATION.txt1 kB
    • README.txt3 kB
    • fi_tdt-ud-train.conllu11 MB
    • LICENSE.txt24 kB
    • fi_tdt-ud-dev.conllu1 MB
  • UD_Kazakh-KTB
    • EVALUATION.txt879 B
    • kk_ktb-ud-train.conllu39 kB
    • README.txt2 kB
    • LICENSE.txt206 B
  • UD_Swedish-PUD
    • README.md3 kB
    • LICENSE.txt202 B
  • UD_North_Sami-Giella
    • EVALUATION.txt883 B
    • README.md2 kB
    • sme_giella-ud-train.conllu1 MB
    • LICENSE.txt202 B
  • UD_Croatian-SET
    • EVALUATION.txt1 kB
    • README.md4 kB
    • hr_set-ud-dev.conllu1 MB
    • LICENSE.txt233 B
    • hr_set-ud-train.conllu10 MB
  • UD_Korean-Kaist
    • EVALUATION.txt1 kB
    • README.md1 kB
    • LICENSE.txt202 B
    • ko_kaist-ud-dev.conllu1 MB
    • ko_kaist-ud-train.conllu17 MB
  • UD_Ukrainian-IU
    • EVALUATION.txt1 kB
    • README.md3 kB
    • uk_iu-ud-dev.conllu992 kB
    • uk_iu-ud-train.conllu6 MB
    • LICENSE.txt172 B
  • UD_Persian-Seraji
    • EVALUATION.txt1 kB
    • README.md5 kB
    • fa_seraji-ud-dev.conllu1000 kB
    • LICENSE.txt110 B
    • fa_seraji-ud-train.conllu7 MB
  • UD_Norwegian-Nynorsk
    • no_nynorsk-ud-train.conllu14 MB
    • EVALUATION.txt1 kB
    • README.md4 kB
    • LICENSE.txt68 B
    • no_nynorsk-ud-dev.conllu1 MB
  • UD_Naija-NSC
    • README.md3 kB
    • LICENSE.txt202 B
  • UD_Norwegian-NynorskLIA
    • EVALUATION.txt886 B
    • no_nynorsklia-ud-train.conllu200 kB
    • README.txt1 kB
    • LICENSE.txt202 B
  • UD_Bulgarian-BTB
    • bg_btb-ud-dev.conllu1 MB
    • EVALUATION.txt1 kB
    • README.txt5 kB
    • LICENSE.txt327 B
    • bg_btb-ud-train.conllu10 MB
  • UD_Serbian-SET
    • EVALUATION.txt1 kB
    • README.md1 kB
    • LICENSE.txt230 B
    • sr_set-ud-train.conllu4 MB
    • sr_set-ud-dev.conllu675 kB
  • UD_Basque-BDT
    • EVALUATION.txt1 kB
    • README.txt3 kB
    • eu_bdt-ud-dev.conllu1 MB
    • eu_bdt-ud-train.conllu4 MB
    • LICENSE.txt171 B
  • UD_Slovak-SNK
    • EVALUATION.txt1 kB
    • README.md3 kB
    • LICENSE.txt202 B
    • sk_snk-ud-train.conllu6 MB
    • sk_snk-ud-dev.conllu1 MB
  • UD_Afrikaans-AfriBooms
    • af_afribooms-ud-dev.conllu322 kB
    • EVALUATION.txt1 kB
    • README.txt1 kB
    • af_afribooms-ud-train.conllu2 MB
    • LICENSE.txt202 B
  • UD_Japanese-GSD
    • EVALUATION.txt1 kB
    • README.txt2 kB
    • ja_gsd-ud-dev.conllu612 kB
    • LICENSE.txt17 kB
    • ja_gsd-ud-train.conllu8 MB
  • UD_Czech-CAC
    • cs_cac-ud-dev.conllu1 MB
    • cs_cac-ud-train.conllu50 MB
    • EVALUATION.txt1 kB
    • README.md4 kB
    • LICENSE.txt265 B
  • UD_Arabic-PADT
    • EVALUATION.txt1 kB
    • ar_padt-ud-dev.conllu5 MB
    • README.md4 kB
    • LICENSE.txt19 kB
    • ar_padt-ud-train.conllu38 MB
  • UD_Faroese-OFT
    • README.md1 kB
    • LICENSE.txt822 B
  • UD_Upper_Sorbian-UFAL
    • EVALUATION.txt881 B
    • README.md919 B
    • hsb_ufal-ud-train.conllu31 kB
    • LICENSE.txt202 B
  • UD_Ancient_Greek-PROIEL
    • grc_proiel-ud-dev.conllu1 MB
    • grc_proiel-ud-train.conllu19 MB
    • EVALUATION.txt1 kB
    • README.md2 kB
    • LICENSE.txt279 B
  • UD_Czech-PDT
    • EVALUATION.txt1 kB
    • README.md7 kB
    • LICENSE.txt19 kB
    • cs_pdt-ud-train.conllu125 MB
    • cs_pdt-ud-dev.conllu17 MB
  • UD_Chinese-GSD
    • zh_gsd-ud-train.conllu5 MB
    • EVALUATION.txt1 kB
    • README.md903 B
    • zh_gsd-ud-dev.conllu673 kB
    • LICENSE.txt282 B
  • UD_Catalan-AnCora
    • EVALUATION.txt1 kB
    • README.md743 B
    • ca_ancora-ud-train.conllu26 MB
    • ca_ancora-ud-dev.conllu3 MB
    • LICENSE.txt68 B
  • UD_Old_Church_Slavonic-PROIEL
    • EVALUATION.txt1 kB
    • README.md2 kB
    • cu_proiel-ud-train.conllu3 MB
    • cu_proiel-ud-dev.conllu1 MB
    • LICENSE.txt279 B
  • UD_Spanish-AnCora
    • es_ancora-ud-dev.conllu3 MB
    • EVALUATION.txt1 kB
    • README.md648 B
    • LICENSE.txt68 B
    • es_ancora-ud-train.conllu28 MB
  • UD_Dutch-LassySmall
    • nl_lassysmall-ud-dev.conllu836 kB
    • EVALUATION.txt1 kB
    • README.txt2 kB
    • LICENSE.txt392 B
    • nl_lassysmall-ud-train.conllu5 MB
  • UD_Danish-DDT
    • EVALUATION.txt1 kB
    • da_ddt-ud-train.conllu4 MB
    • da_ddt-ud-dev.conllu644 kB
    • README.md5 kB
    • LICENSE.txt19 kB
  • UD_French-GSD
    • EVALUATION.txt1 kB
    • README.md11 kB
    • fr_gsd-ud-dev.conllu2 MB
    • LICENSE.txt17 kB
    • fr_gsd-ud-train.conllu21 MB
  • UD_Portuguese-Bosque
    • EVALUATION.txt1 kB
    • pt_bosque-ud-train.conllu13 MB
    • README.md6 kB
    • LICENSE.txt269 B
    • pt_bosque-ud-dev.conllu718 kB
  • UD_Irish-IDT
    • ga_idt-ud-train.conllu882 kB
    • EVALUATION.txt879 B
    • README.txt5 kB
    • LICENSE.txt13 B
  • UD_Kurmanji-MG
    • EVALUATION.txt879 B
    • kmr_mg-ud-train.conllu17 kB
    • README.txt1 kB
    • LICENSE.txt202 B
  • UD_Uyghur-UDT
    • EVALUATION.txt1 kB
    • README.md1 kB
    • ug_udt-ud-train.conllu1 MB
    • LICENSE.txt202 B
    • ug_udt-ud-dev.conllu890 kB
  • UD_Greek-GDT
    • EVALUATION.txt1 kB
    • README.md3 kB
    • el_gdt-ud-dev.conllu933 kB
    • LICENSE.txt398 B
    • el_gdt-ud-train.conllu3 MB
  • UD_English-EWT
    • EVALUATION.txt1 kB
    • en_ewt-ud-dev.conllu1 MB
    • README.md7 kB
    • LICENSE.txt19 kB
    • en_ewt-ud-train.conllu12 MB
  • UD_Latin-ITTB
    • EVALUATION.txt1 kB
    • README.md3 kB
    • la_ittb-ud-dev.conllu948 kB
    • LICENSE.txt19 kB
    • la_ittb-ud-train.conllu23 MB
  • UD_Armenian-ArmTDP
    • EVALUATION.txt882 B
    • README.md3 kB
    • hy_armtdp-ud-train.conllu77 kB
    • LICENSE.txt202 B
  • UD_Vietnamese-VTB
    • vi_vtb-ud-dev.conllu522 kB
    • EVALUATION.txt1 kB
    • vi_vtb-ud-train.conllu939 kB
    • README.txt636 B
    • LICENSE.txt19 kB
  • UD_Japanese-Modern
    • README.txt3 kB
    • LICENSE.txt17 kB
  • UD_Italian-ISDT
    • EVALUATION.txt1 kB
    • it_isdt-ud-dev.conllu737 kB
    • README.md10 kB
    • it_isdt-ud-train.conllu16 MB
    • LICENSE.txt22 kB
  • UD_Hebrew-HTB
    • EVALUATION.txt1 kB
    • README.txt3 kB
    • he_htb-ud-train.conllu9 MB
    • LICENSE.txt249 B
    • he_htb-ud-dev.conllu836 kB
    • README.txt1 kB
    • conll18_ud_eval.py26 kB
  • UD_Russian-Taiga
    • EVALUATION.txt881 B
    • README.md3 kB
    • LICENSE.txt202 B
    • ru_taiga-ud-train.conllu824 kB