dc.contributor.author | Mareček, David |
dc.date.accessioned | 2016-10-20T12:38:53Z |
dc.date.available | 2016-10-20T12:38:53Z |
dc.date.issued | 2016-10-20 |
dc.identifier.uri | http://hdl.handle.net/11234/1-1804 |
dc.description | Corpus of manually aligned Czech-English parallel sentences. It comprises 2500 parallel sentences from 7 different sources. |
dc.language.iso | ces |
dc.language.iso | eng |
dc.publisher | Charles University, Faculty of Mathematics and Physics, Institute of Formal and Applied Linguistics (UFAL) |
dc.rights | Creative Commons - Attribution-ShareAlike 4.0 International (CC BY-SA 4.0) |
dc.rights.uri | http://creativecommons.org/licenses/by-sa/4.0/ |
dc.source.uri | http://ufal.mff.cuni.cz/czech-english-manual-word-alignment |
dc.subject | word alignment |
dc.subject | parallel corpus |
dc.title | Czech-English Manual Word Alignment |
dc.type | corpus |
metashare.ResourceInfo#ContentInfo.mediaType | text |
dc.rights.label | PUB |
has.files | yes |
branding | LINDAT / CLARIAH-CZ |
contact.person | David Mareček (marecek@ufal.mff.cuni.cz), Charles University in Prague, UFAL |
size.info | 112765 tokens |
size.info | 2500 sentences |
files.size | 3253515 |
files.count | 1 |
Soubory tohoto záznamu
Licenční kategorie:
Licence: Creative Commons - Attribution-ShareAlike 4.0 International (CC BY-SA 4.0)
Publicly Available
Licence: Creative Commons - Attribution-ShareAlike 4.0 International (CC BY-SA 4.0)
- Název
- CzEnAli_1.0.tar.gz
- Velikost
- 3.1 MB
- Formát
- application/x-gzip
- Popis
- CzEnAli_1.0
- MD5
- dd9cffd89e74ddd8f0c29d8e022506f1
- merged_data
- project_syndicate
- project_syndicate_balibar1.wa (23 kB)
- project_syndicate_bertram19.wa (25 kB)
- project_syndicate_ban1.wa (26 kB)
- project_syndicate_balcerowicz1.wa (26 kB)
- project_syndicate_ber17.wa (25 kB)
- project_syndicate_bck2.wa (25 kB)
- project_syndicate_balkenende1.wa (20 kB)
- project_syndicate_bacchetta1.wa (21 kB)
- project_syndicate_blanchard8.wa (22 kB)
- project_syndicate_blo3.wa (23 kB)
- named_entities
- project_syndicate_ne06.wa (26 kB)
- project_syndicate_ne02.wa (27 kB)
- project_syndicate_ne09.wa (26 kB)
- project_syndicate_ne05.wa (26 kB)
- project_syndicate_ne01.wa (28 kB)
- project_syndicate_ne08.wa (27 kB)
- project_syndicate_ne10.wa (23 kB)
- project_syndicate_ne04.wa (27 kB)
- project_syndicate_ne07.wa (25 kB)
- project_syndicate_ne03.wa (26 kB)
- rd_books_kacenka
- pcedt_rd_00293.wa (20 kB)
- pcedt_rd_01493.wa (15 kB)
- pcedt_rd_01193.wa (17 kB)
- books_three_men_in_boat.wa (18 kB)
- pcedt_rd_00693.wa (21 kB)
- pcedt_rd_00393.wa (21 kB)
- kacenka_tess_durbervilles.wa (28 kB)
- pcedt_rd_00793.wa (25 kB)
- kacenka_oliver_twist.wa (30 kB)
- pcedt_rd_00893.wa (17 kB)
- celex
- celex_31975L0033.wa (24 kB)
- celex_31985L0203.wa (27 kB)
- celex_31995L0070.wa (31 kB)
- celex_21990A0714.wa (23 kB)
- celex_31980L0799.wa (33 kB)
- celex_31970L0220.wa (23 kB)
- celex_31962L2645.wa (27 kB)
- celex_22000A0411.wa (32 kB)
- celex_31958L0003.wa (24 kB)
- celex_31965L0079.wa (25 kB)
- pcedt
- wsj_2222.wa (19 kB)
- wsj_2303.wa (17 kB)
- wsj_2248.wa (3 kB)
- wsj_2211.wa (25 kB)
- wsj_2249.wa (4 kB)
- wsj_2435.wa (4 kB)
- wsj_2212.wa (5 kB)
- wsj_2436.wa (5 kB)
- wsj_2399.wa (12 kB)
- wsj_2393.wa (5 kB)
- wsj_2201.wa (25 kB)
- wsj_2406.wa (24 kB)
- wsj_2338.wa (18 kB)
- wsj_2313.wa (7 kB)
- wsj_2214.wa (7 kB)
- wsj_2332.wa (4 kB)
- wsj_2202.wa (25 kB)
- wsj_2308.wa (24 kB)
- wsj_2246.wa (5 kB)
- wsj_2203.wa (9 kB)
- wsj_2309.wa (10 kB)
- wsj_2315.wa (7 kB)
- project_syndicate
- data
- project_syndicate
- project_syndicate_blanchard8.m.wa (22 kB)
- project_syndicate_ber17.m.wa (25 kB)
- project_syndicate_blo3.z.wa (24 kB)
- project_syndicate_bacchetta1.z.wa (22 kB)
- project_syndicate_blo3.m.wa (24 kB)
- project_syndicate_bacchetta1.m.wa (22 kB)
- project_syndicate_ban1.z.wa (27 kB)
- project_syndicate_balibar1.z.wa (23 kB)
- project_syndicate_ban1.m.wa (26 kB)
- project_syndicate_balibar1.m.wa (23 kB)
- project_syndicate_bertram19.z.wa (26 kB)
- project_syndicate_balkenende1.z.wa (21 kB)
- project_syndicate_balcerowicz1.z.wa (26 kB)
- project_syndicate_bertram19.m.wa (25 kB)
- project_syndicate_bck2.z.wa (25 kB)
- project_syndicate_balkenende1.m.wa (21 kB)
- project_syndicate_balcerowicz1.m.wa (26 kB)
- project_syndicate_bck2.m.wa (25 kB)
- project_syndicate_blanchard8.z.wa (23 kB)
- project_syndicate_ber17.z.wa (26 kB)
- named_entities
- project_syndicate_ne07.g.wa (26 kB)
- project_syndicate_ne04.j.wa (27 kB)
- project_syndicate_ne10.g.wa (23 kB)
- project_syndicate_ne08.g.wa (28 kB)
- project_syndicate_ne05.j.wa (26 kB)
- project_syndicate_ne01.g.wa (29 kB)
- project_syndicate_ne09.g.wa (27 kB)
- project_syndicate_ne06.j.wa (26 kB)
- project_syndicate_ne02.g.wa (28 kB)
- project_syndicate_ne07.j.wa (25 kB)
- project_syndicate_ne03.g.wa (27 kB)
- project_syndicate_ne10.j.wa (23 kB)
- project_syndicate_ne08.j.wa (28 kB)
- project_syndicate_ne04.g.wa (28 kB)
- project_syndicate_ne01.j.wa (28 kB)
- project_syndicate_ne09.j.wa (27 kB)
- project_syndicate_ne05.g.wa (27 kB)
- project_syndicate_ne02.j.wa (28 kB)
- project_syndicate_ne06.g.wa (26 kB)
- project_syndicate_ne03.j.wa (26 kB)
- rd_books_kacenka
- pcedt_rd_01193.z.wa (18 kB)
- pcedt_rd_01493.z.wa (16 kB)
- pcedt_rd_00393.z.wa (21 kB)
- pcedt_rd_00893.z.wa (18 kB)
- kacenka_tess_durbervilles.z.wa (28 kB)
- pcedt_rd_01193.m.wa (17 kB)
- pcedt_rd_01493.m.wa (15 kB)
- kacenka_oliver_twist.z.wa (30 kB)
- pcedt_rd_00893.m.wa (18 kB)
- pcedt_rd_00393.m.wa (21 kB)
- kacenka_tess_durbervilles.m.wa (27 kB)
- kacenka_oliver_twist.m.wa (30 kB)
- books_three_men_in_boat.z.wa (17 kB)
- books_three_men_in_boat.m.wa (17 kB)
- pcedt_rd_00693.z.wa (21 kB)
- pcedt_rd_00793.z.wa (25 kB)
- pcedt_rd_00293.z.wa (20 kB)
- pcedt_rd_00693.m.wa (21 kB)
- pcedt_rd_00793.m.wa (24 kB)
- pcedt_rd_00293.m.wa (20 kB)
- celex
- celex_31995L0070.m.wa (32 kB)
- celex_31985L0203.z.wa (28 kB)
- celex_31985L0203.m.wa (28 kB)
- celex_21990A0714.z.wa (24 kB)
- celex_22000A0411.z.wa (33 kB)
- celex_21990A0714.m.wa (23 kB)
- celex_22000A0411.m.wa (33 kB)
- celex_31970L0220.z.wa (24 kB)
- celex_31970L0220.m.wa (24 kB)
- celex_31965L0079.z.wa (25 kB)
- celex_31958L0003.z.wa (25 kB)
- celex_31965L0079.m.wa (25 kB)
- celex_31962L2645.z.wa (27 kB)
- celex_31958L0003.m.wa (25 kB)
- celex_31962L2645.m.wa (27 kB)
- celex_31975L0033.z.wa (25 kB)
- celex_31975L0033.m.wa (25 kB)
- celex_31980L0799.z.wa (34 kB)
- celex_31980L0799.m.wa (34 kB)
- celex_31995L0070.z.wa (32 kB)
- pcedt
- wsj_2399.o.wa (12 kB)
- wsj_2309.o.wa (10 kB)
- wsj_2435.o.wa (4 kB)
- wsj_2211.p.wa (25 kB)
- wsj_2201.p.wa (26 kB)
- wsj_2203.p.wa (9 kB)
- wsj_2212.o.wa (5 kB)
- wsj_2202.o.wa (25 kB)
- wsj_2313.p.wa (7 kB)
- wsj_2393.p.wa (5 kB)
- wsj_2303.p.wa (17 kB)
- wsj_2222.o.wa (19 kB)
- wsj_2214.o.wa (8 kB)
- wsj_2315.p.wa (7 kB)
- wsj_2249.p.wa (4 kB)
- wsj_2246.o.wa (5 kB)
- wsj_2332.o.wa (4 kB)
- wsj_2309.p.wa (10 kB)
- wsj_2399.p.wa (12 kB)
- wsj_2248.o.wa (3 kB)
- wsj_2435.p.wa (4 kB)
- wsj_2338.o.wa (19 kB)
- wsj_2308.o.wa (24 kB)
- wsj_2406.o.wa (24 kB)
- wsj_2436.o.wa (5 kB)
- wsj_2212.p.wa (5 kB)
- wsj_2202.p.wa (25 kB)
- wsj_2222.p.wa (18 kB)
- wsj_2214.p.wa (7 kB)
- wsj_2246.p.wa (5 kB)
- wsj_2211.o.wa (26 kB)
- wsj_2201.o.wa (26 kB)
- wsj_2332.p.wa (4 kB)
- wsj_2203.o.wa (9 kB)
- wsj_2248.p.wa (3 kB)
- wsj_2338.p.wa (18 kB)
- wsj_2313.o.wa (7 kB)
- wsj_2308.p.wa (24 kB)
- wsj_2393.o.wa (5 kB)
- wsj_2303.o.wa (17 kB)
- wsj_2406.p.wa (24 kB)
- wsj_2315.o.wa (7 kB)
- wsj_2249.o.wa (4 kB)
- wsj_2436.p.wa (5 kB)
- project_syndicate
- tools
- walign_to_tmt.pl (3 kB)
- alpaco.pl (85 kB)
- merge_two_alignments.pl (2 kB)
- marecek_diploma_thesis.pdf (2 MB)
- README (2 kB)
- logo.svg (13 kB)