wiki:en/Publications

Version 5 (modified by xrambous, 6 years ago) (diff)

--

Publications of NLP Centre

2024

2023

  • BLAHUŠ, Marek, Miloš JAKUBÍČEK, Michal CUKR, Vojtěch KOVÁŘ a Vít SUCHOMEL. Development of Evidence-Based Grammars for Terminology Extraction in OneClick Terms. In Marek Medveď, Michal Měchura, Carole Tiberius, Iztok Kosem, Jelena Kallas, Miloš Jakubíček, Simon Krek. Electronic lexicography in the 21st century (eLex 2023): Invisible Lexicography. Proceedings of the eLex 2023 conference. Brno, Czech Republic: Lexical Computing CZ s.r.o. s. 650-662. ISSN 2533-5626. 2023. Konferenční sborník info
    @inproceedings{2305342, author = {Blahuš, Marek and Jakubíček, Miloš and Cukr, Michal and Kovář, Vojtěch and Suchomel, Vít}, address = {Brno, Czech Republic}, booktitle = {Electronic lexicography in the 21st century (eLex 2023): Invisible Lexicography. Proceedings of the eLex 2023 conference}, editor = {Medveď, Marek and Měchura, Michal and Tiberius, Carole and Kosem, Iztok and Kallas, Jelena and Jakubíček, Miloš and Krek, Simon}, keywords = {Grammars; Terminology Extraction; OneClick Terms}, howpublished = {elektronická verze "online"}, language = {eng}, location = {Brno, Czech Republic}, pages = {650--662}, publisher = {Lexical Computing CZ s.r.o.}, title = {Development of Evidence-Based Grammars for Terminology Extraction in OneClick Terms}, url = {https://elex.link/elex2023/wp-content/uploads/117.pdf}, year = {2023} }
  • BLAHUŠ, Marek, Michal CUKR, Ondřej HERMAN, Miloš JAKUBÍČEK, Vojtěch KOVÁŘ, Jan KRAUS, Marek MEDVEĎ, Vlasta OHLÍDALOVÁ a Vít SUCHOMEL. Rapid Ukrainian-English Dictionary Creation Using Post-Edited Corpus Data. In Marek Medveď, Michal Měchura, Carole Tiberius, Iztok Kosem, Jelena Kallas, Miloš Jakubíček, Simon Krek. Electronic lexicography in the 21st century (eLex 2023): Invisible Lexicography. Proceedings of the eLex 2023 conference. Brno, Czech Republic: Lexical Computing CZ s.r.o. s. 613-637. ISSN 2533-5626. 2023. Konferenční sborník info
    @inproceedings{2303577, author = {Blahuš, Marek and Cukr, Michal and Herman, Ondřej and Jakubíček, Miloš and Kovář, Vojtěch and Kraus, Jan and Medveď, Marek and Ohlídalová, Vlasta and Suchomel, Vít}, address = {Brno, Czech Republic}, booktitle = {Electronic lexicography in the 21st century (eLex 2023): Invisible Lexicography. Proceedings of the eLex 2023 conference}, editor = {Medveď, Marek and Měchura, Michal and Tiberius, Carole and Kosem, Iztok and Kallas, Jelena and Jakubíček, Miloš and Krek, Simon}, keywords = {Ukrainian; post-editing; dictionary; lexicography}, howpublished = {elektronická verze "online"}, language = {eng}, location = {Brno, Czech Republic}, pages = {613--637}, publisher = {Lexical Computing CZ s.r.o.}, title = {Rapid Ukrainian-English Dictionary Creation Using Post-Edited Corpus Data}, url = {https://elex.link/elex2023/wp-content/uploads/114.pdf}, year = {2023} }

2022

  • HLAVÁČKOVÁ, Dana, Hana ŽIŽKOVÁ, Vojtěch KOVÁŘ, Jakub MACHURA, Ludmila ŠIKULOVÁ, Vojtěch MRKÝVKA, Markéta AUDY MASOPUSTOVÁ, Marek BLAHUŠ, Helena MEDKOVÁ, Zbyněk MICHÁLEK, Markéta PRAVDOVÁ, Sylva NZIMBA, Petr LOZAN, Klára DVOŘÁKOVÁ, Vladimír PETKEVIČ, Tomáš JELÍNEK a Hana SKOUMALOVÁ. Opravidlo. 2022. URL info
    @misc{1862974, author = {Hlaváčková, Dana and Žižková, Hana and Kovář, Vojtěch and Machura, Jakub and Šikulová, Ludmila and Mrkývka, Vojtěch and Audy Masopustová, Markéta and Blahuš, Marek and Medková, Helena and Michálek, Zbyněk and Pravdová, Markéta and Nzimba, Sylva and Lozan, Petr and Dvořáková, Klára and Petkevič, Vladimír and Jelínek, Tomáš and Skoumalová, Hana}, title = {Opravidlo}, year = {2022}, url = {http://www.opravidlo.cz}, institution = {Masarykova univerzita, Univerzita Karlova, Ústav pro jazyk český AV ČR, Seznam.cz}, organization = {Masarykova univerzita, Univerzita Karlova, Ústav pro jazyk český AV ČR, Seznam.cz}, language = {cze}, keywords = {spellchecker; Czech language; online proofreader} }
  • HERMAN, Ondřej. Blooming Onion: Efficient Deduplication through Approximate Membership Testing. In Aleš Horák, Pavel Rychlý, Adam Rambousek. Proceedings of the Sixteenth Workshop on Recent Advances in Slavonic Natural Languages Processing, RASLAN 2022. Brno: Tribun EU. s. 91-95. ISBN 978-80-263-1752-4. 2022. Domovská stránka workshopu Plný text info
    @inproceedings{2240155, author = {Herman, Ondřej}, address = {Brno}, booktitle = {Proceedings of the Sixteenth Workshop on Recent Advances in Slavonic Natural Languages Processing, RASLAN 2022}, editor = {Horák, Aleš and Rychlý, Pavel and Rambousek, Adam}, keywords = {deduplication; text corpora; Bloom filter}, howpublished = {tištěná verze "print"}, language = {eng}, location = {Brno}, isbn = {978-80-263-1752-4}, pages = {91--95}, publisher = {Tribun EU}, title = {Blooming Onion: Efficient Deduplication through Approximate Membership Testing}, url = {https://raslan2022.nlp-consulting.net/}, year = {2022} }
  • RYCHLÝ, Pavel a Ondřej HERMAN. MoMaT WebAPI. 2022. URL info
    @misc{2272323, author = {Rychlý, Pavel and Herman, Ondřej}, title = {MoMaT WebAPI}, year = {2022}, url = {https://nlp.fi.muni.cz/projekty/momat/}, institution = {Fakulta informatiky, Masarykova univerzita}, organization = {Fakulta informatiky, Masarykova univerzita}, language = {eng}, keywords = {web service; machine translation; language technology} }
  • MEDVEĎ, Marek, Aleš HORÁK a Radoslav SABOL. Comparing RNN and Transformer Context Representations in the Czech Answer Selection Task. In Ana Paula Rocha, Luc Steels, Jaap van den Herik. Proceedings of the 14th International Conference on Agents and Artificial Intelligence (ICAART). Portugal: SCITEPRESS. s. 388-394. ISBN 978-989-758-547-0. doi:10.5220/0000155600003116. 2022. info
    @inproceedings{1810359, author = {Medveď, Marek and Horák, Aleš and Sabol, Radoslav}, address = {Portugal}, booktitle = {Proceedings of the 14th International Conference on Agents and Artificial Intelligence (ICAART)}, doi = {10.5220/0000155600003116}, editor = {Rocha, Ana Paula and Steels, Luc and van den Herik, Jaap}, keywords = {Question Answering; Answer Context; Answer Selection; Czech; Sentence Embeddings; RNN; BERT}, howpublished = {elektronická verze "online"}, language = {eng}, location = {Portugal}, isbn = {978-989-758-547-0}, note = {accepted for publication}, pages = {388--394}, publisher = {SCITEPRESS}, title = {Comparing RNN and Transformer Context Representations in the Czech Answer Selection Task}, year = {2022} }
  • JAKUBÍČEK, Miloš, Vojtěch KOVÁŘ, Michal MĚCHURA a Adam RAMBOUSEK. Using NVH as a Backbone Format in the Lexonomy Dictionary Editor. In Aleš Horák, Pavel Rychlý, Adam Rambousek. Proceedings of the Sixteenth Workshop on Recent Advances in Slavonic Natural Languages Processing, RASLAN 2022. Brno: Tribun EU. s. 55-61. ISBN 978-80-263-1752-4. 2022. Domovská stránka workshopu Plný text info
    @inproceedings{2240339, author = {Jakubíček, Miloš and Kovář, Vojtěch and Měchura, Michal and Rambousek, Adam}, address = {Brno}, booktitle = {Proceedings of the Sixteenth Workshop on Recent Advances in Slavonic Natural Languages Processing, RASLAN 2022}, editor = {Horák, Aleš and Rychlý, Pavel and Rambousek, Adam}, keywords = {NVH; XML; Lexonomy; dictionary editor}, howpublished = {tištěná verze "print"}, language = {eng}, location = {Brno}, isbn = {978-80-263-1752-4}, pages = {55--61}, publisher = {Tribun EU}, title = {Using NVH as a Backbone Format in the Lexonomy Dictionary Editor}, url = {https://raslan2022.nlp-consulting.net/}, year = {2022} }
  • SUCHOMEL, Vít a Jan KRAUS. Semi-Manual Annotation of Topics and Genres in Web Corpora : The Cheap and Fast Way. In Aleš Horák, Pavel Rychlý, Adam Rambousek. Proceedings of the Sixteenth Workshop on Recent Advances in Slavonic Natural Languages Processing, RASLAN 2022. Brno: Tribun EU. s. 141-148. ISBN 978-80-263-1752-4. 2022. Domovská stránka workshopu Plný text info
    @inproceedings{2240321, author = {Suchomel, Vít and Kraus, Jan}, address = {Brno}, booktitle = {Proceedings of the Sixteenth Workshop on Recent Advances in Slavonic Natural Languages Processing, RASLAN 2022}, editor = {Horák, Aleš and Rychlý, Pavel and Rambousek, Adam}, keywords = {web corpus; text corpus; topic; genre; text annotation}, howpublished = {tištěná verze "print"}, language = {eng}, location = {Brno}, isbn = {978-80-263-1752-4}, pages = {141--148}, publisher = {Tribun EU}, title = {Semi-Manual Annotation of Topics and Genres in Web Corpora : The Cheap and Fast Way}, url = {https://raslan2022.nlp-consulting.net/}, year = {2022} }

2021

  • GREGOR, Miloš, Petra MLEJNKOVÁ, Miroslava PAVLÍKOVÁ, Barbora ŠENKÝŘOVÁ, Jakub DRMOLA, Miroslav MAREŠ, František KASL, Aleš HORÁK, Vít BAISA, Radim POLČÁK, Jan HANZELKA, Jonáš SYROVÁTKA a Ondřej HERMAN. Challenging Online Propaganda and Disinformation in the 21st Century. Cham: Palgrave Macmillan. 273 s. Political Campaigning and Communication. ISBN 978-3-030-58623-2. doi:10.1007/978-3-030-58624-9. 2021. web nakladatelství info
    @book{1752737, author = {Gregor, Miloš and Mlejnková, Petra and Pavlíková, Miroslava and Šenkýřová, Barbora and Drmola, Jakub and Mareš, Miroslav and Kasl, František and Horák, Aleš and Baisa, Vít and Polčák, Radim and Hanzelka, Jan and Syrovátka, Jonáš and Herman, Ondřej}, address = {Cham}, doi = {10.1007/978-3-030-58624-9}, keywords = {disinformation; online propaganda; information warfare; AI technologies; counter-measures against disinformation; post-truth era}, howpublished = {tištěná verze "print"}, language = {eng}, location = {Cham}, isbn = {978-3-030-58623-2}, publisher = {Palgrave Macmillan}, title = {Challenging Online Propaganda and Disinformation in the 21st Century}, url = {https://www.palgrave.com/gp/book/9783030586232}, year = {2021} }
  • JAKUBÍČEK, Miloš, Emma ROMANI, Pavel RYCHLÝ a Ondřej HERMAN. Development of HAMOD: a High Agreement Multi-lingual Outlier Detection dataset. In Horák, Rychlý, Rambousek. Recent Advances in Slavonic Natural Language Processing (RASLAN 2021). Brno: Tribun EU. s. 177-183. ISBN 978-80-263-1670-1. 2021. Domovská stránka workshopu Full text PDF info
    @inproceedings{1809767, author = {Jakubíček, Miloš and Romani, Emma and Rychlý, Pavel and Herman, Ondřej}, address = {Brno}, booktitle = {Recent Advances in Slavonic Natural Language Processing (RASLAN 2021)}, editor = {Horák, Aleš and Rychlý, Pavel and Rambousek, Adam}, keywords = {HAMOD; Distributional thesaurus; Outlier detection; Word embeddings; Sketch Engine}, howpublished = {tištěná verze "print"}, language = {eng}, location = {Brno}, isbn = {978-80-263-1670-1}, pages = {177--183}, publisher = {Tribun EU}, title = {Development of HAMOD: a High Agreement Multi-lingual Outlier Detection dataset}, url = {https://raslan2021.nlp-consulting.net/}, year = {2021} }
  • HERMAN, Ondřej. Precomputed Word Embeddings for 15+ Languages. In Horák, Rychlý, Rambousek. Recent Advances in Slavonic Natural Language Processing (RASLAN 2021). Brno: Tribun EU. s. 41-46. ISBN 978-80-263-1670-1. 2021. Domovská stránka workshopu Full text PDF info
    @inproceedings{1809740, author = {Herman, Ondřej}, address = {Brno}, booktitle = {Recent Advances in Slavonic Natural Language Processing (RASLAN 2021)}, editor = {Horák, Aleš and Rychlý, Pavel and Rambousek, Adam}, keywords = {Word embeddings; Sketch Engine; Corpora}, howpublished = {tištěná verze "print"}, language = {eng}, location = {Brno}, isbn = {978-80-263-1670-1}, pages = {41--46}, publisher = {Tribun EU}, title = {Precomputed Word Embeddings for 15+ Languages}, url = {https://raslan2021.nlp-consulting.net/}, year = {2021} }
  • MEDVEĎ, Marek, Radoslav SABOL a Aleš HORÁK. Evaluating Long Contexts in the Czech Answer Selection Task. In Horák, Rychlý, Rambousek. Recent Advances in Slavonic Natural Language Processing (RASLAN 2021). Brno: Tribun EU. s. 61-69. ISBN 978-80-263-1670-1. 2021. Domovská stránka workshopu Full text PDF info
    @inproceedings{1809741, author = {Medveď, Marek and Sabol, Radoslav and Horák, Aleš}, address = {Brno}, booktitle = {Recent Advances in Slavonic Natural Language Processing (RASLAN 2021)}, editor = {Horák, Aleš and Rychlý, Pavel and Rambousek, Adam}, keywords = {Question answering; Answer selection; Answer context; Evaluation}, howpublished = {tištěná verze "print"}, language = {eng}, location = {Brno}, isbn = {978-80-263-1670-1}, pages = {61--69}, publisher = {Tribun EU}, title = {Evaluating Long Contexts in the Czech Answer Selection Task}, url = {https://raslan2021.nlp-consulting.net/}, year = {2021} }
  • HORÁK, Aleš, Adam RAMBOUSEK, Marek MEDVEĎ, Zuzana NEVĚŘILOVÁ, Pavel RYCHLÝ a Marie STARÁ. Software Tezaurus: funkcionalita pro styk s externími systémy. 2021. info
    @misc{1819741, author = {Horák, Aleš and Rambousek, Adam and Medveď, Marek and Nevěřilová, Zuzana and Rychlý, Pavel and Stará, Marie}, title = {Software Tezaurus: funkcionalita pro styk s externími systémy}, year = {2021}, institution = {Technologická agentura České republiky}, organization = {Technologická agentura České republiky}, language = {eng}, keywords = {thesaurus; dictionary editing; centralized system; open data} }
  • HORÁK, Aleš, Adam RAMBOUSEK, Marek MEDVEĎ, Zuzana NEVĚŘILOVÁ, Pavel RYCHLÝ a Marie STARÁ. Software Tezaurus: nástroje pro centrální systém tvorby odborných tezaurů. 2021. info
    @misc{1819739, author = {Horák, Aleš and Rambousek, Adam and Medveď, Marek and Nevěřilová, Zuzana and Rychlý, Pavel and Stará, Marie}, title = {Software Tezaurus: nástroje pro centrální systém tvorby odborných tezaurů}, year = {2021}, institution = {Technologická agentura České republiky}, organization = {Technologická agentura České republiky}, language = {eng}, keywords = {thesaurus; dictionary editing; centralized system; open data} }
  • HORÁK, Aleš, Adam RAMBOUSEK, Marek MEDVEĎ, Zuzana NEVĚŘILOVÁ, Pavel RYCHLÝ a Marie STARÁ. Software Tezaurus: nástroje pro podporu systematické a koordinované tvorby odborných tezaurů. 2021. info
    @misc{1819737, author = {Horák, Aleš and Rambousek, Adam and Medveď, Marek and Nevěřilová, Zuzana and Rychlý, Pavel and Stará, Marie}, title = {Software Tezaurus: nástroje pro podporu systematické a koordinované tvorby odborných tezaurů}, year = {2021}, institution = {Technologická agentura České republiky}, organization = {Technologická agentura České republiky}, language = {eng}, keywords = {thesaurus; dictionary editing; centralized system; open data} }
  • RAMBOUSEK, Adam, Miloš JAKUBÍČEK a Iztok KOSEM. New developments in Lexonomy. In Kosem, I., Cukr, M., Jakubíček, M., Kallas, J., Krek, S. & Tiberius, C. Electronic lexicography in the 21st century. Proceedings of the eLex 2021 conference. Brno: Lexical Computing CZ, s.r.o. s. 455-462. ISSN 2533-5626. 2021. proceedings info
    @inproceedings{1791676, author = {Rambousek, Adam and Jakubíček, Miloš and Kosem, Iztok}, address = {Brno}, booktitle = {Electronic lexicography in the 21st century. Proceedings of the eLex 2021 conference}, editor = {Kosem, Iztok and Cukr, Michal and Jakubíček, Miloš and Kallas, Jelena and Krek, Simon and Tiberius, Carole}, keywords = {Dictionary editing; Dictionary writing system; Lexicographic tools; XML; Corpora connection}, howpublished = {elektronická verze "online"}, language = {eng}, location = {Brno}, pages = {455--462}, publisher = {Lexical Computing CZ, s.r.o.}, title = {New developments in Lexonomy}, url = {https://elex.link/elex2021/proceedings-download/}, year = {2021} }
  • KOVÁŘ, Vojtěch a Pavel RYCHLÝ. DMoG : A Data-Based Morphological Guesser. In Horák, Aleš; Rychlý, Pavel; Rambousek, Adam. Recent Advances in Slavonic Natural Language Processing (RASLAN 2021). Brno: Tribun EU. s. 135-138. ISBN 978-80-263-1670-1. 2021. Domovská stránka workshopu Full text PDF info
    @inproceedings{1809762, author = {Kovář, Vojtěch and Rychlý, Pavel}, address = {Brno}, booktitle = {Recent Advances in Slavonic Natural Language Processing (RASLAN 2021)}, editor = {Horák, Aleš and Rychlý, Pavel and Rambousek, Adam}, keywords = {Lemmatization; Morphological guesser; Morphological analysis; Morphological guessing}, howpublished = {tištěná verze "print"}, language = {eng}, location = {Brno}, isbn = {978-80-263-1670-1}, pages = {135--138}, publisher = {Tribun EU}, title = {DMoG : A Data-Based Morphological Guesser}, url = {https://raslan2021.nlp-consulting.net/}, year = {2021} }
  • SUCHOMEL, Vít a Jan KRAUS. Website Properties in Relation to the Quality of Text Extracted for Web Corpora. In Horák, Rychlý, Rambousek. Recent Advances in Slavonic Natural Language Processing (RASLAN 2021). Brno: Tribun EU. s. 167-175. ISBN 978-80-263-1670-1. 2021. Full text PDF Domovská stránka workshopu info
    @inproceedings{1809765, author = {Suchomel, Vít and Kraus, Jan}, address = {Brno}, booktitle = {Recent Advances in Slavonic Natural Language Processing (RASLAN 2021)}, editor = {Horák, Aleš and Rychlý, Pavel and Rambousek, Adam}, keywords = {Web crawling; Web spam; Text corpus; Text processing}, howpublished = {tištěná verze "print"}, language = {eng}, location = {Brno}, isbn = {978-80-263-1670-1}, pages = {167--175}, publisher = {Tribun EU}, title = {Website Properties in Relation to the Quality of Text Extracted for Web Corpora}, url = {https://nlp.fi.muni.cz/raslan/2021/paper19.pdf}, year = {2021} }
  • SUCHOMEL, Vít. Genre Annotation of Web Corpora: Scheme and Issues. In Kohei Arai, Supriya Kapoor, Rahul Bhatia. Proceedings of the Future Technologies Conference (FTC) 2020, Volume 1. Vancouver, Canada: Springer Nature Switzerland AG. s. 738-754. ISBN 978-3-030-63127-7. doi:10.1007/978-3-030-63128-4_55. 2021. Elektronická verze sborníku info
    @inproceedings{1663744, author = {Suchomel, Vít}, address = {Vancouver, Canada}, booktitle = {Proceedings of the Future Technologies Conference (FTC) 2020, Volume 1}, doi = {10.1007/978-3-030-63128-4_55}, editor = {Arai, Kohei and Kapoor, Supriya and Bhatia, Rahul}, keywords = {Corpus annotation; Inter-annotator agreement; Text genre; Web corpora}, howpublished = {tištěná verze "print"}, language = {eng}, location = {Vancouver, Canada}, isbn = {978-3-030-63127-7}, pages = {738--754}, publisher = {Springer Nature Switzerland AG}, title = {Genre Annotation of Web Corpora: Scheme and Issues}, url = {https://link.springer.com/book/10.1007/978-3-030-63128-4}, year = {2021} }

2020

  • MEDVEĎ, Marek, Radoslav SABOL a Aleš HORÁK. Efficient Management and Optimization of Very Large Machine Learning Dataset for Question Answering. In Aleš Horák. Proceedings of the Fourteenth Workshop on Recent Advances in Slavonic Natural Language Processing, RASLAN 2020. Brno: Tribun EU. s. 23-34. ISBN 978-80-263-1600-8. 2020. PDF ve sborníku Domovská stránka workshopu info
    @inproceedings{1729476, author = {Medveď, Marek and Sabol, Radoslav and Horák, Aleš}, address = {Brno}, booktitle = {Proceedings of the Fourteenth Workshop on Recent Advances in Slavonic Natural Language Processing, RASLAN 2020}, editor = {Horák, Aleš}, keywords = {question answering; dataset management; machine learning; optimization}, howpublished = {tištěná verze "print"}, language = {eng}, location = {Brno}, isbn = {978-80-263-1600-8}, pages = {23--34}, publisher = {Tribun EU}, title = {Efficient Management and Optimization of Very Large Machine Learning Dataset for Question Answering}, url = {https://nlp.fi.muni.cz/raslan/raslan20.pdf#page=21}, year = {2020} }
  • MEDVEĎ, Marek, Aleš HORÁK a Radoslav SABOL. Employing Sentence Context in Czech Answer Selection. In Sojka P., Kopeček I., Pala K., Horák A. Text, Speech, and Dialogue. TSD 2020. Switzerland: Springer, Cham. s. 112-121. ISBN 978-3-030-58322-4. doi:10.1007/978-3-030-58323-1_12. 2020. info
    @inproceedings{1709742, author = {Medveď, Marek and Horák, Aleš and Sabol, Radoslav}, address = {Switzerland}, booktitle = {Text, Speech, and Dialogue. TSD 2020}, doi = {10.1007/978-3-030-58323-1_12}, editor = {Sojka, P. and Kopeček, I. and Pala, K. and Horák, A.}, keywords = {question answering;answer selection;Czech;answer context;morphologically rich languages}, howpublished = {tištěná verze "print"}, language = {eng}, location = {Switzerland}, isbn = {978-3-030-58322-4}, pages = {112--121}, publisher = {Springer, Cham}, title = {Employing Sentence Context in Czech Answer Selection}, year = {2020} }
  • MEDVEĎ, Marek, Aleš HORÁK a Radoslav SABOL. Improving RNN-based Answer Selection for Morphologically Rich Languages. In Ana Rocha, Luc Steels, Jaap van den Herik. Proceedings of the 12th International Conference on Agents and Artificial Intelligence. Portugal: SCITEPRESS. s. 644-651. ISBN 978-989-758-395-7. doi:10.5220/0008979206440651. 2020. info
    @inproceedings{1643878, author = {Medveď, Marek and Horák, Aleš and Sabol, Radoslav}, address = {Portugal}, booktitle = {Proceedings of the 12th International Conference on Agents and Artificial Intelligence}, doi = {10.5220/0008979206440651}, editor = {Rocha, Ana and Steels, Luc and van den Herik, Jaap}, keywords = {Question Answering; Question Classification; Answer Classification; Czech; Simple Question Answering Database; SQAD}, howpublished = {elektronická verze "online"}, language = {eng}, location = {Portugal}, isbn = {978-989-758-395-7}, pages = {644--651}, publisher = {SCITEPRESS}, title = {Improving RNN-based Answer Selection for Morphologically Rich Languages}, year = {2020} }
  • JAKUBÍČEK, Miloš, Vojtěch KOVÁŘ, Pavel RYCHLÝ a Vít SUCHOMEL. Current Challenges in Web Corpus Building. In Adrien Barbaresi, Felix Bildhauer, Roland Schafer and Egon Stemle. Proceedings of the 12th Web as Corpus Workshop. Marseille, France: European Language Resources Association. s. 1-4. ISBN 979-10-95546-68-9. 2020. článek ve sborníku info
    @inproceedings{1658596, author = {Jakubíček, Miloš and Kovář, Vojtěch and Rychlý, Pavel and Suchomel, Vít}, address = {Marseille, France}, booktitle = {Proceedings of the 12th Web as Corpus Workshop}, editor = {Barbaresi, Adrien and Bildhauer, Felix and Schafer, Roland and Stemle, Egon}, keywords = {Web corpora; corpus building}, howpublished = {elektronická verze "online"}, language = {eng}, location = {Marseille, France}, isbn = {979-10-95546-68-9}, pages = {1--4}, publisher = {European Language Resources Association}, title = {Current Challenges in Web Corpus Building}, url = {https://www.aclweb.org/anthology/2020.wac-1.1}, year = {2020} }
  • SUCHOMEL, Vít. Removing Spam from Web Corpora Through Supervised Learning and Semi-manual Classification of Web Sites. In Aleš Horák. Proceedings of the Fourteenth Workshop on Recent Advances in Slavonic Natural Language Processing, RASLAN 2020. Brno: Tribun EU. s. 113-123. ISBN 978-80-263-1600-8. 2020. Domovská stránka workshopu PDF ve sborníku info
    @inproceedings{1729500, author = {Suchomel, Vít}, address = {Brno}, booktitle = {Proceedings of the Fourteenth Workshop on Recent Advances in Slavonic Natural Language Processing, RASLAN 2020}, editor = {Horák, Aleš}, keywords = {web corpora; web spam; supervised learning}, howpublished = {tištěná verze "print"}, language = {eng}, location = {Brno}, isbn = {978-80-263-1600-8}, pages = {113--123}, publisher = {Tribun EU}, title = {Removing Spam from Web Corpora Through Supervised Learning and Semi-manual Classification of Web Sites}, url = {https://raslan2020.nlp-consulting.net/}, year = {2020} }

2019

  • RAMBOUSEK, Adam, Aleš HORÁK, Vít BAISA a Vít SUCHOMEL. A New Approach for Semi-automatic Building and Extending a Multilingual Terminology Thesaurus. International Journal on Artificial Intelligence Tools. USA: World Scientific Publishing, roč. 28, č. 2, s. 1-21. ISSN 0218-2130. doi:10.1142/S0218213019500088. 2019. Journal page arXiv preprint info
    @article{1511276, author = {Rambousek, Adam and Horák, Aleš and Baisa, Vít and Suchomel, Vít}, article_location = {USA}, number = {2}, pages = {1--21}, doi = {10.1142/S0218213019500088}, keywords = {Thesaurus building; terminology dictionary; domain-corpus exploitation; knowledge extraction; term extraction; DEB platform; knowledge-rich contexts}, language = {eng}, issn = {0218-2130}, journal = {International Journal on Artificial Intelligence Tools}, title = {A New Approach for Semi-automatic Building and Extending a Multilingual Terminology Thesaurus}, url = {http://dx.doi.org/10.1142/S0218213019500088}, volume = {28}, year = {2019} }
  • BAISA, Vít, Marek BLAHUŠ, Michal CUKR, Ondřej HERMAN, Miloš JAKUBÍČEK, Vojtěch KOVÁŘ, Marek MEDVEĎ, Michal MĚCHURA, Pavel RYCHLÝ a Vít SUCHOMEL. Automating dictionary production: a Tagalog-English-Korean dictionary from scratch. In Proceedings of the 6th Biennial Conference on Electronic Lexicography. Brno, Czech Republic: Lexical Computing CZ s.r.o. s. 805-818. ISSN 2533-5626. 2019. Konferenční sborník info
    @inproceedings{1550657, author = {Baisa, Vít and Blahuš, Marek and Cukr, Michal and Herman, Ondřej and Jakubíček, Miloš and Kovář, Vojtěch and Medveď, Marek and Měchura, Michal and Rychlý, Pavel and Suchomel, Vít}, address = {Brno, Czech Republic}, booktitle = {Proceedings of the 6th Biennial Conference on Electronic Lexicography}, keywords = {Sketch Engine; Lexonomy; post-editing lexicography; dictionary; corpus; Tagalog; Filipino; English; Korean}, howpublished = {elektronická verze "online"}, language = {eng}, location = {Brno, Czech Republic}, pages = {805--818}, publisher = {Lexical Computing CZ s.r.o.}, title = {Automating dictionary production: a Tagalog-English-Korean dictionary from scratch}, url = {https://elex.link/elex2019/wp-content/uploads/2019/10/eLex-2019_Proceedings.pdf}, year = {2019} }
  • HORÁK, Aleš, Vít BAISA a Ondřej HERMAN. Benchmark Dataset for Propaganda Detection in Czech Newspaper Texts. In Proceedings of Recent Advances in Natural Language Processing, RANLP 2019. Varna, Bulgaria: INCOMA Ltd. s. 77-83. ISBN 978-954-452-055-7. doi:10.26615/978-954-452-056-4_010. 2019. URL info
    @inproceedings{1552518, author = {Horák, Aleš and Baisa, Vít and Herman, Ondřej}, address = {Varna, Bulgaria}, booktitle = {Proceedings of Recent Advances in Natural Language Processing, RANLP 2019}, doi = {10.26615/978-954-452-056-4_010}, keywords = {propaganda detection; manipulative techniques; benchmark dataset}, howpublished = {tištěná verze "print"}, language = {eng}, location = {Varna, Bulgaria}, isbn = {978-954-452-055-7}, pages = {77--83}, publisher = {INCOMA Ltd.}, title = {Benchmark Dataset for Propaganda Detection in Czech Newspaper Texts}, url = {https://www.aclweb.org/anthology/R19-1010.pdf}, year = {2019} }
  • KOPPEL, Kristina, Jelena KALLAS, Maria KHOKHLOVÁ, Vít SUCHOMEL, Vít BAISA a Jan MICHELFEIT. SkELL Corpora as a Part of the Language Portal Sonaveeb: Problems and Perspectives. In Proceedings of the 6th Biennial Conference on Electronic Lexicography. Brno, Czech Republic: Lexical Computing CZ s.r.o. s. 763-782. ISSN 2533-5626. 2019. Konferenční sborník info
    @inproceedings{1577318, author = {Koppel, Kristina and Kallas, Jelena and Khokhlová, Maria and Suchomel, Vít and Baisa, Vít and Michelfeit, Jan}, address = {Brno, Czech Republic}, booktitle = {Proceedings of the 6th Biennial Conference on Electronic Lexicography}, keywords = {GDEX; SkELL; learner corpus; Estonian; Russian}, howpublished = {elektronická verze "online"}, language = {eng}, location = {Brno, Czech Republic}, pages = {763--782}, publisher = {Lexical Computing CZ s.r.o.}, title = {SkELL Corpora as a Part of the Language Portal Sonaveeb: Problems and Perspectives}, url = {https://elex.link/elex2019/wp-content/uploads/2019/10/eLex-2019_Proceedings.pdf}, year = {2019} }
  • KOPECKÝ, Zdeněk, Michal KUBÍČEK, Filip MRAVEC, Tomáš URBANEC, Aleš JANČÁŘ, Zdeněk MATĚJ, Ondřej HERMAN, Jan KRÁL, Petr OKRUHLICA, Aleš POVALAČ, Jiří ČULEN, František CVACHOVEC a Václav PŘENOSIL. Laboratorní spektrometr nízkoenergetických neutronů. 2019. URL info
    @techreport{1645300, author = {Kopecký, Zdeněk and Kubíček, Michal and Mravec, Filip and Urbanec, Tomáš and Jančář, Aleš and Matěj, Zdeněk and Herman, Ondřej and Král, Jan and Okruhlica, Petr and Povalač, Aleš and Čulen, Jiří and Cvachovec, František and Přenosil, Václav}, title = {Laboratorní spektrometr nízkoenergetických neutronů}, institution = {VF, a.s.}, organization = {VF, a.s.}, year = {2019}, url = {http://www.urel.feec.vutbr.cz/web_documents/produkty/2019/laboratorni_spektrometr_CZ.pdf}, language = {eng}, keywords = {low-energy neutron spectrometer;mixed field;ionizing radiation;separation methods;proportional detector;preamplifier;digital card} }
  • KRÁL, Jan, Zdeněk MATĚJ, Ondřej HERMAN, Aleš JANČÁŘ, Filip MRAVEC, Martin PAVELEK, Michal KUBÍČEK, Jiří ČULEN, Zdeněk KOPECKÝ, Petr OKRUHLICA, František CVACHOVEC a Václav PŘENOSIL. Systém pro detekci neutronů ve směsných polích - Energeticky kompenzovaný monitor příkonu dávkového ekvivalentu neutronů. 2019. URL info
    @techreport{1645337, author = {Král, Jan and Matěj, Zdeněk and Herman, Ondřej and Jančář, Aleš and Mravec, Filip and Pavelek, Martin and Kubíček, Michal and Čulen, Jiří and Kopecký, Zdeněk and Okruhlica, Petr and Cvachovec, František and Přenosil, Václav}, title = {Systém pro detekci neutronů ve směsných polích - Energeticky kompenzovaný monitor příkonu dávkového ekvivalentu neutronů}, institution = {VF, a.s.}, organization = {VF, a.s.}, year = {2019}, url = {http://www.urel.feec.vutbr.cz/web_documents/produkty/2019/monitor_davkoveho_prikonu_CZ.pdf}, language = {eng}, keywords = {spectrometric system;mixed field;ionizing radiation;pulse shape discrimination;Integrated neutron radiation dose monitoring device;scintillator} }
  • HERMAN, Ondřej a Pavel RYCHLÝ. SiLi Index: Data Structure for Fast Vector Space Searching. In Horák, Aleš and Rychlý, Pavel and Rambousek, Adam. Proceedings of the Thirteenth Workshop on Recent Advances in Slavonic Natural Languages Processing, RASLAN 2019. Brno: Tribun EU. s. 111-116. ISBN 978-80-263-1530-8. 2019. URL info
    @inproceedings{1591220, author = {Herman, Ondřej and Rychlý, Pavel}, address = {Brno}, booktitle = {Proceedings of the Thirteenth Workshop on Recent Advances in Slavonic Natural Languages Processing, RASLAN 2019}, editor = {Horák, Aleš and Rychlý, Pavel and Rambousek, Adam}, keywords = {word embeddings; vector space; semantic similarity}, howpublished = {tištěná verze "print"}, language = {eng}, location = {Brno}, isbn = {978-80-263-1530-8}, pages = {111--116}, publisher = {Tribun EU}, title = {SiLi Index: Data Structure for Fast Vector Space Searching}, url = {https://nlp.fi.muni.cz/raslan/2019/paper07-herman.pdf}, year = {2019} }
  • HERMAN, Ondřej, Vojtěch KOVÁŘ, Miloš JAKUBÍČEK a Pavel RYCHLÝ. Word Sense Induction Using Word Sketches. In Martín-Vide C., Purver M., Pollak S. Proceedings of the 7th International Conference on Statistical Language and Speech Processing. Cham: Springer. s. 83-91. ISBN 978-3-030-31371-5. doi:10.1007/978-3-030-31372-2_7. 2019. info
    @inproceedings{1550577, author = {Herman, Ondřej and Kovář, Vojtěch and Jakubíček, Miloš and Rychlý, Pavel}, address = {Cham}, booktitle = {Proceedings of the 7th International Conference on Statistical Language and Speech Processing}, doi = {10.1007/978-3-030-31372-2_7}, editor = {Martín-Vide, C. and Purver, M. and Pollak, S.}, keywords = {Word sense induction;Word sketch;Collocations;Word embeddings}, howpublished = {tištěná verze "print"}, language = {eng}, location = {Cham}, isbn = {978-3-030-31371-5}, pages = {83--91}, publisher = {Springer}, title = {Word Sense Induction Using Word Sketches}, year = {2019} }
  • SABOL, Radoslav, Marek MEDVEĎ a Aleš HORÁK. Czech Question Answering with Extended SQAD v3.0 Benchmark Dataset. In Horák, Aleš and Rychlý, Pavel and Rambousek, Adam. Proceedings of the Thirteenth Workshop on Recent Advances in Slavonic Natural Languages Processing, RASLAN 2019. Brno: Tribun EU. s. 99-108. ISBN 978-80-263-1530-8. 2019. info
    @inproceedings{1591218, author = {Sabol, Radoslav and Medveď, Marek and Horák, Aleš}, address = {Brno}, booktitle = {Proceedings of the Thirteenth Workshop on Recent Advances in Slavonic Natural Languages Processing, RASLAN 2019}, editor = {Horák, Aleš and Rychlý, Pavel and Rambousek, Adam}, keywords = {question answering; QA benchmark dataset; SQAD; Czech}, howpublished = {tištěná verze "print"}, language = {eng}, location = {Brno}, isbn = {978-80-263-1530-8}, pages = {99--108}, publisher = {Tribun EU}, title = {Czech Question Answering with Extended SQAD v3.0 Benchmark Dataset}, year = {2019} }
  • MEDVEĎ, Marek, Aleš HORÁK a Daša KUŠNIRÁKOVÁ. Question and Answer Classification in Czech Question Answering Benchmark Dataset. In Ana Rocha, Luc Steels, Jaap van den Herik. Proceedings of the 11th International Conference on Agents and Artificial Intelligence, Volume 2. Prague, Czech Republic: SCITEPRESS. s. 701-706. ISBN 978-989-758-350-6. doi:10.5220/0007396907010706. 2019. info
    @inproceedings{1521838, author = {Medveď, Marek and Horák, Aleš and Kušniráková, Daša}, address = {Prague, Czech Republic}, booktitle = {Proceedings of the 11th International Conference on Agents and Artificial Intelligence, Volume 2}, doi = {10.5220/0007396907010706}, editor = {Rocha, Ana and Steels, Luc and van den Herik, Jaap}, keywords = {Question Answering; Question Classification; Answer Classification; Czech; Simple Question Answering Database; SQAD}, howpublished = {elektronická verze "online"}, language = {eng}, location = {Prague, Czech Republic}, isbn = {978-989-758-350-6}, pages = {701--706}, publisher = {SCITEPRESS}, title = {Question and Answer Classification in Czech Question Answering Benchmark Dataset}, year = {2019} }
  • JAKUBÍČEK, Miloš a Pavel RYCHLÝ. A Distributional Multi-word Thesaurus in Sketch Engine. In Horák, Aleš and Rychlý, Pavel and Rambousek, Adam. Proceedings of the Thirteenth Workshop on Recent Advances in Slavonic Natural Languages Processing, RASLAN 2019. Brno: Tribun EU. s. 143-147. ISBN 978-80-263-1530-8. 2019. URL info
    @inproceedings{1591225, author = {Jakubíček, Miloš and Rychlý, Pavel}, address = {Brno}, booktitle = {Proceedings of the Thirteenth Workshop on Recent Advances in Slavonic Natural Languages Processing, RASLAN 2019}, editor = {Horák, Aleš and Rychlý, Pavel and Rambousek, Adam}, keywords = {text corpus; Sketch Engine; MWE; multi-word expressions; thesaurus}, howpublished = {tištěná verze "print"}, language = {eng}, location = {Brno}, isbn = {978-80-263-1530-8}, pages = {143--147}, publisher = {Tribun EU}, title = {A Distributional Multi-word Thesaurus in Sketch Engine}, url = {https://nlp.fi.muni.cz/raslan/2019/paper17-jakubicek.pdf}, year = {2019} }
  • RAMBOUSEK, Adam, Miloš JAKUBÍČEK a Michal MĚCHURA. Lexonomy Clinic. In eLex 2019. 2019. URL info
    @inproceedings{1600074, author = {Rambousek, Adam and Jakubíček, Miloš and Měchura, Michal}, booktitle = {eLex 2019}, keywords = {dictionary-writing systems; dictionary editing; Lexonomy}, language = {eng}, title = {Lexonomy Clinic}, url = {https://elex.link/elex2019/wp-content/uploads/2019/10/eLex_2019-Book_of_abstracts.pdf}, year = {2019} }
  • SUCHOMEL, Vít. Discriminating Between Similar Languages Using Large Web Corpora. In Horák, Aleš and Rychlý, Pavel and Rambousek, Adam. Proceedings of the Thirteenth Workshop on Recent Advances in Slavonic Natural Languages Processing, RASLAN 2019. Brno: Tribun EU. s. 129-135. ISBN 978-80-263-1530-8. 2019. URL info
    @inproceedings{1591222, author = {Suchomel, Vít}, address = {Brno}, booktitle = {Proceedings of the Thirteenth Workshop on Recent Advances in Slavonic Natural Languages Processing, RASLAN 2019}, editor = {Horák, Aleš and Rychlý, Pavel and Rambousek, Adam}, keywords = {language identification; discriminating similar languages; building web corpora}, howpublished = {tištěná verze "print"}, language = {eng}, location = {Brno}, isbn = {978-80-263-1530-8}, pages = {129--135}, publisher = {Tribun EU}, title = {Discriminating Between Similar Languages Using Large Web Corpora}, url = {https://nlp.fi.muni.cz/raslan/2019/paper12-suchomel.pdf}, year = {2019} }

2018

  • ŘEŘUCHA, Šimon, Bretislav MIKEL, Zdeněk MATĚJ, Ondřej HERMAN, Miroslava HOLA, Michal JELINEK, Petr JEDLICKA, Ondrej CIP a Josef LAZAR. Linearized and compensated interferometric system for high-velocity traceable length calibration on a metre scale. In Proceedings Volume 10976, 21st Czech-Polish-Slovak Optical Conference on Wave and Quantum Aspects of Contemporary Optics. Lednice: SPIE. s. 1-8. ISBN 978-1-5106-2607-2. doi:10.1117/12.2519461. 2018. URL info
    @inproceedings{1490075, author = {Řeřucha, Šimon and Mikel, Bretislav and Matěj, Zdeněk and Herman, Ondřej and Hola, Miroslava and Jelinek, Michal and Jedlicka, Petr and Cip, Ondrej and Lazar, Josef}, address = {Lednice}, booktitle = {Proceedings Volume 10976, 21st Czech-Polish-Slovak Optical Conference on Wave and Quantum Aspects of Contemporary Optics}, doi = {10.1117/12.2519461}, keywords = {laser interferometry; displacement; optical metrology; homodyne detection; scale linearization; FPGA; reactor active zone chassis}, howpublished = {elektronická verze "online"}, language = {eng}, location = {Lednice}, isbn = {978-1-5106-2607-2}, pages = {1--8}, publisher = {SPIE}, title = {Linearized and compensated interferometric system for high-velocity traceable length calibration on a metre scale}, url = {http://dx.doi.org/10.1117/12.2519461}, year = {2018} }
  • MATĚJ, Zdeněk, Michal KOŠŤÁL, František CVACHOVEC, Filip MRAVEC, Martin PAVELEK, Ondřej HERMAN, Martin VEŠKRNA, Václav PŘENOSIL a Evžen LOSA. Fast Two Parametric Spectrometric System For Experimental MSR/FHR Reactor Dosimetry. In Mary Helen Sparks. Reactor Dosimetry - 16th international Symposium. Mayfield: STP: Selected Technical Papers. s. 63-73. ISBN 978-0-8031-7661-4. 2018. URL info
    @inproceedings{1388624, author = {Matěj, Zdeněk and Košťál, Michal and Cvachovec, František and Mravec, Filip and Pavelek, Martin and Herman, Ondřej and Veškrna, Martin and Přenosil, Václav and Losa, Evžen}, address = {Mayfield}, booktitle = {Reactor Dosimetry - 16th international Symposium}, editor = {Sparks, Mary Helen}, keywords = {Analog; Digital; Spectrometric; System; MSR; FHR}, howpublished = {tištěná verze "print"}, language = {eng}, location = {Mayfield}, isbn = {978-0-8031-7661-4}, pages = {63--73}, publisher = {STP: Selected Technical Papers}, title = {Fast Two Parametric Spectrometric System For Experimental MSR/FHR Reactor Dosimetry}, url = {http://isrd16.reactordosimetry.org/}, year = {2018} }
  • HA, Hien Thi, Aleš HORÁK, Marek MEDVEĎ a Zuzana NEVĚŘILOVÁ. OCRMiner. 2018. URL info
    @misc{1451656, author = {Ha, Hien Thi and Horák, Aleš and Medveď, Marek and Nevěřilová, Zuzana}, title = {OCRMiner}, year = {2018}, institution = {Masarykova univerzita}, organization = {Masarykova univerzita}, url = {https://nlp.fi.muni.cz/projekty/ocrminer}, language = {eng}, keywords = {data mining; information extraction; text classification; OCR} }
  • HA, Hien Thi, Aleš HORÁK, Marek MEDVEĎ a Zuzana NEVĚŘILOVÁ. Recognition of OCR Invoice Metadata Block Types. In P. Sojka, A. Horák, I. Kopeček, K. Pala. Text, Speech, and Dialogue, 21st International Conference, TSD 2018. Switzerland: Springer International Publishing. s. 304-312. ISBN 978-3-030-00793-5. doi:10.1007/978-3-030-00794-2_33. 2018. info
    @inproceedings{1421338, author = {Ha, Hien Thi and Horák, Aleš and Medveď, Marek and Nevěřilová, Zuzana}, address = {Switzerland}, booktitle = {Text, Speech, and Dialogue, 21st International Conference, TSD 2018}, doi = {10.1007/978-3-030-00794-2_33}, editor = {Sojka, Petr and Horák, Aleš and Kopeček, Ivan and Pala, Karel}, keywords = {OCR;scanned documents;document metadata;invoice metadata extraction}, howpublished = {tištěná verze "print"}, language = {eng}, location = {Switzerland}, isbn = {978-3-030-00793-5}, pages = {304--312}, publisher = {Springer International Publishing}, title = {Recognition of OCR Invoice Metadata Block Types}, year = {2018} }
  • RYCHLÝ, Pavel, Radoslav RÁBARA a Ondřej HERMAN. Distributed Corpus Search. In Piotr Banski, Marc Kupietz, Adrien Barbaresi, Hanno Biber, Evelyn Breiteneder, Simon Clematide, Andreas Witt. 6th Workshop on the Challenges in the Management of Large Corpora. Miyazaki, Japan: European Language Resource Association. s. 10-13. ISBN 979-1-09-554614-6. 2018. Sborník CMLC-6 info
    @inproceedings{1420812, author = {Rychlý, Pavel and Rábara, Radoslav and Herman, Ondřej}, address = {Miyazaki, Japan}, booktitle = {6th Workshop on the Challenges in the Management of Large Corpora}, editor = {Banski, Piotr and Kupietz, Marc and Barbaresi, Adrien and Biber, Hanno and Breiteneder, Evelyn and Clematide, Simon and Witt, Andreas}, keywords = {distributed corpus search}, howpublished = {elektronická verze "online"}, language = {eng}, location = {Miyazaki, Japan}, isbn = {979-1-09-554614-6}, pages = {10--13}, publisher = {European Language Resource Association}, title = {Distributed Corpus Search}, url = {http://lrec-conf.org/workshops/lrec2018/W17/pdf/book_of_proceedings.pdf}, year = {2018} }
  • SABOL, Radoslav, Marek MEDVEĎ a Aleš HORÁK. Recurrent Networks in AQA Answer Selection. In Aleš Horák, Pavel Rychlý and Adam Rambousek. Proceedings of the Twelfth Workshop on Recent Advances in Slavonic Natural Languages Processing, RASLAN 2018. Brno: Tribun EU. s. 53-62. ISBN 978-80-263-1517-9. 2018. URL info
    @inproceedings{1484740, author = {Sabol, Radoslav and Medveď, Marek and Horák, Aleš}, address = {Brno}, booktitle = {Proceedings of the Twelfth Workshop on Recent Advances in Slavonic Natural Languages Processing, RASLAN 2018}, editor = {Horák, Aleš and Rychlý, Pavel and Rambousek, Adam}, keywords = {question answering; answer selection; QA dataset; SQAD; AQA}, howpublished = {tištěná verze "print"}, language = {eng}, location = {Brno}, isbn = {978-80-263-1517-9}, pages = {53--62}, publisher = {Tribun EU}, title = {Recurrent Networks in AQA Answer Selection}, url = {https://nlp.fi.muni.cz/raslan/2018/paper12-Sabol_Medved_Horak.pdf}, year = {2018} }
  • MEDVEĎ, Marek a Aleš HORÁK. Sentence and Word Embedding Employed in Open Question-Answering. In Proceedings of the 10th International Conference on Agents and Artificial Intelligence (ICAART 2018). Setúbal, Portugal: SCITEPRESS - Science and Technology Publications. s. 486-492. ISBN 978-989-758-275-2. 2018. info
    @inproceedings{1393609, author = {Medveď, Marek and Horák, Aleš}, address = {Setúbal, Portugal}, booktitle = {Proceedings of the 10th International Conference on Agents and Artificial Intelligence (ICAART 2018)}, keywords = {question answering; word embedding; word2vec; AQA; Simple Question Answering Database; SQAD}, howpublished = {tištěná verze "print"}, language = {eng}, location = {Setúbal, Portugal}, isbn = {978-989-758-275-2}, pages = {486--492}, publisher = {SCITEPRESS - Science and Technology Publications}, title = {Sentence and Word Embedding Employed in Open Question-Answering}, year = {2018} }
  • JAKUBÍČEK, Miloš, Michal MĚCHURA, Vojtěch KOVÁŘ a Pavel RYCHLÝ. Practical Post-Editing Lexicography with Lexonomy and Sketch Engine. In XVIII EURALEX International Congress: Lexicography in Global Contexts. 2018. URL info
    @inproceedings{1433097, author = {Jakubíček, Miloš and Měchura, Michal and Kovář, Vojtěch and Rychlý, Pavel}, booktitle = {XVIII EURALEX International Congress: Lexicography in Global Contexts}, keywords = {corpora; post-editing; Lexonomy; Sketch Engine}, language = {eng}, title = {Practical Post-Editing Lexicography with Lexonomy and Sketch Engine}, url = {http://euralex2018.cjvt.si/}, year = {2018} }
  • KUŠNIRÁKOVÁ, Daša a Marek MEDVEĎ. Towards Czech Answer Type Analysis. In Aleš Horák, Pavel Rychlý and Adam Rambousek. Proceedings of the Twelfth Workshop on Recent Advances in Slavonic Natural Languages Processing, RASLAN 2018. Brno: Tribun EU. s. 41-51. ISBN 978-80-263-1517-9. 2018. URL info
    @inproceedings{1484738, author = {Kušniráková, Daša and Medveď, Marek}, address = {Brno}, booktitle = {Proceedings of the Twelfth Workshop on Recent Advances in Slavonic Natural Languages Processing, RASLAN 2018}, editor = {Horák, Aleš and Rychlý, Pavel and Rambousek, Adam}, keywords = {question answering; question classification; answer classification; Czech; Simple Question Answering Database; SQAD}, howpublished = {tištěná verze "print"}, language = {eng}, location = {Brno}, isbn = {978-80-263-1517-9}, pages = {41--51}, publisher = {Tribun EU}, title = {Towards Czech Answer Type Analysis}, url = {https://nlp.fi.muni.cz/raslan/2018/paper13-Kusnirakova_Medved.pdf}, year = {2018} }
  • SUCHOMEL, Vít. csTenTen17, a Recent Czech Web Corpus. In Aleš Horák, Pavel Rychlý and Adam Rambousek. Proceedings of the Twelfth Workshop on Recent Advances in Slavonic Natural Languages Processing, RASLAN 2018. Brno: Tribun EU. s. 111-123. ISBN 978-80-263-1517-9. 2018. URL info
    @inproceedings{1483790, author = {Suchomel, Vít}, address = {Brno}, booktitle = {Proceedings of the Twelfth Workshop on Recent Advances in Slavonic Natural Languages Processing, RASLAN 2018}, editor = {Horák, Aleš and Rychlý, Pavel and Rambousek, Adam}, keywords = {Czech corpus; web corpus; text processing}, howpublished = {tištěná verze "print"}, language = {eng}, location = {Brno}, isbn = {978-80-263-1517-9}, pages = {111--123}, publisher = {Tribun EU}, title = {csTenTen17, a Recent Czech Web Corpus}, url = {https://nlp.fi.muni.cz/raslan/2018/paper10-Suchomel.pdf}, year = {2018} }

2017

  • PALA, Karel, Aleš HORÁK, Pavel RYCHLÝ, Vít SUCHOMEL, Vít BAISA, Miloš JAKUBÍČEK, Vojtěch KOVÁŘ, Zuzana NEVĚŘILOVÁ, Adam RAMBOUSEK, Björn GAMBÄCK, Utpal SIKDAR a Lars BUNGUM. HaBiT system. 2017. URL info
    @misc{1381969, author = {Pala, Karel and Horák, Aleš and Rychlý, Pavel and Suchomel, Vít and Baisa, Vít and Jakubíček, Miloš and Kovář, Vojtěch and Nevěřilová, Zuzana and Rambousek, Adam and Gambäck, Björn and Sikdar, Utpal and Bungum, Lars}, keywords = {corpus tool; corpus manager; word list; word sketch; sketch difference; concordance}, language = {eng}, institution = {Masarykova univerzita}, organization = {Masarykova univerzita}, title = {HaBiT system}, url = {http://corpora.fi.muni.cz/habit/}, year = {2017} }
  • BAISA, Vít, Ondřej HERMAN a Aleš HORÁK. Manipulative Propaganda Techniques: Technical Report. In Horák A., Rychlý P., Rambousek, A. Proceedings of the Eleventh Workshop on Recent Advances in Slavonic Natural Language Processing, RASLAN 2017. Brno: Tribun EU. s. 111-118. ISBN 978-80-263-1340-3. 2017. URL info
    @inproceedings{1398004, author = {Baisa, Vít and Herman, Ondřej and Horák, Aleš}, address = {Brno}, booktitle = {Proceedings of the Eleventh Workshop on Recent Advances in Slavonic Natural Language Processing, RASLAN 2017}, editor = {Horák, Aleš and Rychlý, Pavel and Rambousek, Adam}, keywords = {propaganda; manipulative techniques in text; propaganda corpus; propaganda detection}, howpublished = {tištěná verze "print"}, language = {eng}, location = {Brno}, isbn = {978-80-263-1340-3}, pages = {111--118}, publisher = {Tribun EU}, title = {Manipulative Propaganda Techniques: Technical Report}, url = {http://nlp.fi.muni.cz/raslan/2017/paper07-Baisa_Herman_Horak.pdf}, year = {2017} }
  • BOHÁČ, Marek, Michal ROTT a Vojtěch KOVÁŘ. Text Punctuation: An Inter-annotator Agreement Study. In Ekštein, Kamil and Matoušek, Václav. Text, Speech, and Dialogue: 20th International Conference, TSD 2017. Cham: Springer International Publishing. s. 120-128. ISBN 978-3-319-64205-5. doi:10.1007/978-3-319-64206-2_14. 2017. URL info
    @inproceedings{1393439, author = {Boháč, Marek and Rott, Michal and Kovář, Vojtěch}, address = {Cham}, booktitle = {Text, Speech, and Dialogue: 20th International Conference, TSD 2017}, doi = {10.1007/978-3-319-64206-2_14}, editor = {Ekštein, Kamil and Matoušek, Václav}, keywords = {Comma adding;Spoken language;Inter-annotator agreement}, howpublished = {tištěná verze "print"}, language = {eng}, location = {Cham}, isbn = {978-3-319-64205-5}, pages = {120--128}, publisher = {Springer International Publishing}, title = {Text Punctuation: An Inter-annotator Agreement Study}, url = {https://link.springer.com/chapter/10.1007/978-3-319-64206-2_14}, year = {2017} }
  • ŠULGANOVÁ, Terézia, Marek MEDVEĎ a Aleš HORÁK. Enlargement of the Czech Question-Answering Dataset to SQAD v2.0. In Aleš Horák, Pavel Rychlý, Adam Rambousek. Proceedings of the Eleventh Workshop on Recent Advances in Slavonic Natural Language Processing, RASLAN 2017. Brno: Tribun EU. s. 79-84. ISBN 978-80-263-1340-3. 2017. URL info
    @inproceedings{1400970, author = {Šulganová, Terézia and Medveď, Marek and Horák, Aleš}, address = {Brno}, booktitle = {Proceedings of the Eleventh Workshop on Recent Advances in Slavonic Natural Language Processing, RASLAN 2017}, editor = {Horák, Aleš and Rychlý, Pavel and Rambousek, Adam}, keywords = {question answering; QA dataset; SQAD}, howpublished = {tištěná verze "print"}, language = {eng}, location = {Brno}, isbn = {978-80-263-1340-3}, pages = {79--84}, publisher = {Tribun EU}, title = {Enlargement of the Czech Question-Answering Dataset to SQAD v2.0}, url = {http://raslan2017.nlp-consulting.net/proceedings}, year = {2017} }
  • MEDVEĎ, Marek, Terézia ŠULGANOVÁ a Aleš HORÁK. Multilinguality Adaptations of Natural Language Logical Analyzer. In Aleš Horák, Pavel Rychlý, Adam Rambousek. Proceedings of the Eleventh Workshop on Recent Advances in Slavonic Natural Language Processing, RASLAN 2017. Brno: Tribun EU. s. 51-58. ISBN 978-80-263-1340-3. 2017. URL info
    @inproceedings{1400965, author = {Medveď, Marek and Šulganová, Terézia and Horák, Aleš}, address = {Brno}, booktitle = {Proceedings of the Eleventh Workshop on Recent Advances in Slavonic Natural Language Processing, RASLAN 2017}, editor = {Horák, Aleš and Rychlý, Pavel and Rambousek, Adam}, keywords = {Transparent Intensional Logic; TIL; logical analysis; natural language semantics}, howpublished = {tištěná verze "print"}, language = {eng}, location = {Brno}, isbn = {978-80-263-1340-3}, pages = {51--58}, publisher = {Tribun EU}, title = {Multilinguality Adaptations of Natural Language Logical Analyzer}, url = {http://raslan2017.nlp-consulting.net/proceedings}, year = {2017} }
  • PAVELEK, Martin, Zdeněk MATĚJ, Ondřej HERMAN, Filip MRAVEC, Martin VEŠKRNA, František CVACHOVEC, Michal KOŠŤÁL a Václav PŘENOSIL. Fast Digital Spectrometer for Mixed Radiation Fields. In 2017 IEEE SENSORS Proceedings. Piscataway, New Jersey, US: IEEE. s. 436-438. ISBN 978-1-5386-4056-2. doi:10.1109/ICSENS.2017.8234012. 2017. IEEE Xplore: Fast digital spectrometer for mixed radiation fields info
    @inproceedings{1388623, author = {Pavelek, Martin and Matěj, Zdeněk and Herman, Ondřej and Mravec, Filip and Veškrna, Martin and Cvachovec, František and Košťál, Michal and Přenosil, Václav}, address = {Piscataway, New Jersey, US}, booktitle = {2017 IEEE SENSORS Proceedings}, doi = {10.1109/ICSENS.2017.8234012}, keywords = {neutron spectrometry; mixed fields; pulse-shape discrimination; scintillation; FPGA; digitizer}, howpublished = {elektronická verze "online"}, language = {eng}, location = {Piscataway, New Jersey, US}, isbn = {978-1-5386-4056-2}, pages = {436--438}, publisher = {IEEE}, title = {Fast Digital Spectrometer for Mixed Radiation Fields}, url = {http://ieeexplore.ieee.org/document/8234012/}, year = {2017} }
  • KALLAS, Jelena, Vít SUCHOMEL a Maria KHOKHLOVA. Automated Identification of Domain Preferences of Collocations. In Iztok Kosem et al. Electronic Lexicography in the 21st Century. Proceedings of Elex 2017 Conference. Brno, Czech Republic: Lexical Computing CZ s.r.o. s. 309-320. ISSN 2533-5626. 2017. Sborník Článek info
    @inproceedings{1394199, author = {Kallas, Jelena and Suchomel, Vít and Khokhlova, Maria}, address = {Brno, Czech Republic}, booktitle = {Electronic Lexicography in the 21st Century. Proceedings of Elex 2017 Conference}, editor = {Kosem, Iztok and others}, keywords = {collocation; multiword terms; terminological collocation; Russian; Estonian}, howpublished = {elektronická verze "online"}, language = {eng}, location = {Brno, Czech Republic}, issn = {2533-5626}, pages = {309--320}, publisher = {Lexical Computing CZ s.r.o.}, title = {Automated Identification of Domain Preferences of Collocations}, url = {https://elex.link/elex2017/proceedings-download/}, year = {2017} }

2016

  • ROTH, Filip, Ahmad ABBADI, Ondřej HERMAN, Martin PAVELEK a Václav PŘENOSIL. Compact hybrid real-time hyperspectral imaging system with high effective spatial, spectral, and temporal resolution. In Qingming Luo; Xingde Li; Ying Gu; Yuguo Tang. Optics in Health Care and Biomedical Optics VII. Beijing, China: SPIE Proceedings. s. 112-123. ISBN 978-1-5106-0467-4. doi:10.1117/12.2246110. 2016. Online version info
    @inproceedings{1361508, author = {Roth, Filip and Abbadi, Ahmad and Herman, Ondřej and Pavelek, Martin and Přenosil, Václav}, address = {Beijing, China}, booktitle = {Optics in Health Care and Biomedical Optics VII}, doi = {10.1117/12.2246110}, editor = {Luo, Qingming and Li, Xingde and Gu, Ying and Tang, Yuguo}, keywords = {real-time imaging system; spatial-spectral resolution; hyperspectral endoscope; video rate processing; medical spectroscopy; image-guided surgery}, howpublished = {elektronická verze "online"}, language = {eng}, location = {Beijing, China}, isbn = {978-1-5106-0467-4}, pages = {112--123}, publisher = {SPIE Proceedings}, title = {Compact hybrid real-time hyperspectral imaging system with high effective spatial, spectral, and temporal resolution}, url = {http://dx.doi.org/10.1117/12.2246110}, year = {2016} }
  • HERMAN, Ondřej, Vít SUCHOMEL, Vít BAISA a Pavel RYCHLÝ. DSL Shared task 2016: Perfect Is The Enemy of Good Language Discrimination Through Expectation-Maximization and Chunk-based Language Model. In Preslav Nakov, Marcos Zampieri, Liling Tan, Nikola Ljubešić, Jörg Tiedemann, Shervin Malmasi. Proceedings of the Third Workshop on NLP for Similar Languages, Varieties and Dialects (VarDial3). Osaka: Association for Natural Language Processing (ANLP), Osaka, Japan. s. 114-118. ISBN 978-4-87974-716-7. 2016. URL info
    @inproceedings{1366107, author = {Herman, Ondřej and Suchomel, Vít and Baisa, Vít and Rychlý, Pavel}, address = {Osaka}, booktitle = {Proceedings of the Third Workshop on NLP for Similar Languages, Varieties and Dialects (VarDial3)}, editor = {Nakov, Preslav and Zampieri, Marcos and Tan, Liling and Ljubešić, Nikola and Tiedemann, Jörg and Malmasi, Shervin}, keywords = {language discrimination;expectation maximization;language model}, howpublished = {elektronická verze "online"}, language = {eng}, location = {Osaka}, isbn = {978-4-87974-716-7}, pages = {114--118}, publisher = {Association for Natural Language Processing (ANLP), Osaka, Japan}, title = {DSL Shared task 2016: Perfect Is The Enemy of Good Language Discrimination Through Expectation-Maximization and Chunk-based Language Model}, url = {https://aclanthology.info/pdf/W/W16/W16-4815.pdf}, year = {2016} }
  • BAISA, Vít, Jan MICHELFEIT, Marek MEDVEĎ a Miloš JAKUBÍČEK. European Union Language Resources in Sketch Engine. In Nicoletta Calzolari (Conference Chair) and Khalid Choukri and Thierry Declerck and Marko Grobelnik and Bente Maegaard and Joseph Mariani and Asuncion Moreno and Jan Odijk and Stelios Piperidis. Proceedings of the Tenth International Conference on Language Resources and Evaluation (LREC 2016). Portorož, Slovenia: European Language Resources Association (ELRA). s. 2799-2803. ISBN 978-2-9517408-9-1. 2016. URL info
    @inproceedings{1346032, author = {Baisa, Vít and Michelfeit, Jan and Medveď, Marek and Jakubíček, Miloš}, address = {Portorož, Slovenia}, booktitle = {Proceedings of the Tenth International Conference on Language Resources and Evaluation (LREC 2016)}, editor = {Calzolari, Nicoletta and Choukri, Khalid and Declerck, Thierry and Grobelnik, Marko and Maegaard, Bente and Mariani, Joseph and Moreno, Asuncion and Odijk, Jan and Piperidis, Stelios}, keywords = {JRC-Acquis; DCEP; DGT-TM; Europarl; EUR-Lex; Sketch Engine; parallel corpus; word sketch; parallel concordance}, howpublished = {elektronická verze "online"}, language = {eng}, location = {Portorož, Slovenia}, isbn = {978-2-9517408-9-1}, pages = {2799--2803}, publisher = {European Language Resources Association (ELRA)}, title = {European Union Language Resources in Sketch Engine}, url = {http://www.lrec-conf.org/proceedings/lrec2016/pdf/572_Paper.pdf}, year = {2016} }
  • KOVÁŘ, Vojtěch, Vít BAISA a Miloš JAKUBÍČEK. Sketch Engine for Bilingual Lexicography. International Journal of Lexicography. Oxford: Oxford University Press, roč. 29, č. 3, s. 339-352. ISSN 0950-3846. doi:10.1093/ijl/ecw029. 2016. URL info
    @article{1349930, author = {Kovář, Vojtěch and Baisa, Vít and Jakubíček, Miloš}, article_location = {Oxford}, article_number = {3}, doi = {10.1093/ijl/ecw029}, keywords = {bilingual lexicography; Sketch Engine; word sketch; parallel corpus; parallel concordance; bilingual terminology extraction; TMX; TBX}, language = {eng}, issn = {0950-3846}, journal = {International Journal of Lexicography}, number = {3}, pages = {339--352}, title = {Sketch Engine for Bilingual Lexicography}, url = {http://ijl.oxfordjournals.org/cgi/content/full/ecw029?ijkey=mOFypUskLgTX0jI&keytype=ref}, volume = {29}, year = {2016} }
  • PŘENOSIL, Václav, Ondřej HERMAN, Dominik SALVET, Jaroslav ČECHÁK a Petr KOPEČEK. Funkční vzorek rychlé analýzy přijímaných rádiových signálů modulárního odpověďového rušiče. 2016. info
    @techreport{1414528, author = {Přenosil, Václav and Herman, Ondřej and Salvet, Dominik and Čechák, Jaroslav and Kopeček, Petr}, title = {Funkční vzorek rychlé analýzy přijímaných rádiových signálů modulárního odpověďového rušiče}, year = {2016}, institution = {Masarykova univerzita (vlastnický podíl 12%); URC Systems, spol s r.o. (vlastnický podíl 88%)}, organization = {Masarykova univerzita (vlastnický podíl 12%); URC Systems, spol s r.o. (vlastnický podíl 88%)}, language = {cze}, keywords = {FPGA;Response jammer;Signal analysing;RCIED;SDR} }
  • FIŠER, Darja, Vít SUCHOMEL a Miloš JAKUBÍČEK. Terminology Extraction for Academic Slovene Using Sketch Engine. In Aleš Horák, Pavel Rychlý, Adam Rambousek. Tenth Workshop on Recent Advances in Slavonic Natural Language Processing, RASLAN 2016. Brno: Tribun EU. s. 135-141. ISBN 978-80-263-1095-2. 2016. URL info
    @inproceedings{1365044, author = {Fišer, Darja and Suchomel, Vít and Jakubíček, Miloš}, address = {Brno}, booktitle = {Tenth Workshop on Recent Advances in Slavonic Natural Language Processing, RASLAN 2016}, editor = {Horák, Aleš and Rychlý, Pavel and Rambousek, Adam}, keywords = {terminology; term extraction; Sketch Engine; academic discourse; Slovene}, howpublished = {tištěná verze "print"}, language = {eng}, location = {Brno}, isbn = {978-80-263-1095-2}, pages = {135--141}, publisher = {Tribun EU}, title = {Terminology Extraction for Academic Slovene Using Sketch Engine}, url = {https://nlp.fi.muni.cz/raslan/2016/paper14-Fiser_Suchomel_Jakubicek.pdf}, year = {2016} }
  • VEŠKRNA, Martin, Zdeněk MATĚJ, Ondřej HERMAN, Filip MRAVEC, Václav PŘENOSIL a Martin PAVELEK. Protokol o testování plastického detektoru v poli radionuklidu Cf-252. 2016. info
    @misc{1377690, author = {Veškrna, Martin and Matěj, Zdeněk and Herman, Ondřej and Mravec, Filip and Přenosil, Václav and Pavelek, Martin}, title = {Protokol o testování plastického detektoru v poli radionuklidu Cf-252}, year = {2016}, language = {cze}, keywords = {plastic detector; separative algorithm; digitizing card FD-11 and FD-17; figure of merit factor} }
  • VEŠKRNA, Martin, Zdeněk MATĚJ, Ondřej HERMAN, Filip MRAVEC, Václav PŘENOSIL a Martin PAVELEK. Protokol o testování proporcionálního detektoru v poli radionuklidu Cf-252. 2016. info
    @misc{1377692, author = {Veškrna, Martin and Matěj, Zdeněk and Herman, Ondřej and Mravec, Filip and Přenosil, Václav and Pavelek, Martin}, title = {Protokol o testování proporcionálního detektoru v poli radionuklidu Cf-252}, year = {2016}, language = {cze}, keywords = {proportional detector; separative algorithm; digitizer Acqiris U1066A DC440; unfoldingctor} }
  • HERMAN, Ondřej, Filip MRAVEC, Martin VEŠKRNA a Václav PŘENOSIL. Tool for apparatus spectrum deconvolution. 2016. URL info
    @misc{1366105, author = {Herman, Ondřej and Mravec, Filip and Veškrna, Martin and Přenosil, Václav}, title = {Tool for apparatus spectrum deconvolution}, year = {2016}, institution = {Masarykova univerzita}, organization = {Masarykova univerzita}, url = {https://is.muni.cz/publication/1366105}, language = {eng}, keywords = {deconvolution;neutron spectrometry;gamma spectrometry;expectation maximization;unfolding} }
  • MEDVEĎ, Marek a Aleš HORÁK. AQA: Automatic Question Answering System for Czech. In Sojka Petr, Horák Aleš, Kopeček Ivan, Pala Karel. Text, Speech, and Dialogue 19th International Conference, TSD 2016 Brno, Czech Republic, September 12–16, 2016 Proceedings. Switzerland: Springer International Publishing. s. 270-278. ISBN 978-3-319-45510-5. doi:10.1007/978-3-319-45510-5_31. 2016. URL info
    @inproceedings{1353405, author = {Medveď, Marek and Horák, Aleš}, address = {Switzerland}, booktitle = {Text, Speech, and Dialogue 19th International Conference, TSD 2016 Brno, Czech Republic, September 12–16, 2016 Proceedings}, doi = {10.1007/978-3-319-45510-5_31}, editor = {Sojka, Petr and Horák, Aleš and Kopeček, Ivan and Pala, Karel}, keywords = {Question Answering; AQA; Simple Question Answering Database; SQAD; Named entity recognition}, howpublished = {tištěná verze "print"}, language = {eng}, location = {Switzerland}, isbn = {978-3-319-45510-5}, pages = {270--278}, publisher = {Springer International Publishing}, title = {AQA: Automatic Question Answering System for Czech}, url = {http://dx.doi.org/10.1007/978-3-319-45510-5_31}, year = {2016} }
  • MEDVEĎ, Marek, Aleš HORÁK a Vojtěch KOVÁŘ. Bilingual Logical Analysis of Natural Language Sentences. In Aleš Horák, Pavel Rychlý, Adam Rambousek. Tenth Workshop on Recent Advances in Slavonic Natural Language Processing, RASLAN 2016. Brno: Tribun EU. s. 69-78. ISBN 978-80-263-1095-2. 2016. info
    @inproceedings{1365035, author = {Medveď, Marek and Horák, Aleš and Kovář, Vojtěch}, address = {Brno}, booktitle = {Tenth Workshop on Recent Advances in Slavonic Natural Language Processing, RASLAN 2016}, editor = {Horák, Aleš and Rychlý, Pavel and Rambousek, Adam}, keywords = {semantics; semantic analysis; logical analysis; Transparent Intensional Logic; TIL}, howpublished = {tištěná verze "print"}, language = {eng}, location = {Brno}, isbn = {978-80-263-1095-2}, pages = {69--78}, publisher = {Tribun EU}, title = {Bilingual Logical Analysis of Natural Language Sentences}, year = {2016} }
  • KOVÁŘ, Vojtěch, Miloš JAKUBÍČEK a Aleš HORÁK. On Evaluation of Natural Language Processing Tasks: Is Gold Standard Evaluation Methodology a Good Solution? In Jaap van den Herik and Joaquim Filipe. Proceedings of the 8th International Conference on Agents and Artificial Intelligence. Rome: SCITEPRESS. s. 540-545. ISBN 978-989-758-172-4. 2016. info
    @inproceedings{1322854, author = {Kovář, Vojtěch and Jakubíček, Miloš and Horák, Aleš}, address = {Rome}, booktitle = {Proceedings of the 8th International Conference on Agents and Artificial Intelligence}, editor = {Jaap van den Herik and Joaquim Filipe}, keywords = {Natural Language Processing; Applications; Evaluation}, howpublished = {paměťový nosič}, language = {eng}, location = {Rome}, isbn = {978-989-758-172-4}, pages = {540--545}, publisher = {SCITEPRESS}, title = {On Evaluation of Natural Language Processing Tasks: Is Gold Standard Evaluation Methodology a Good Solution?}, year = {2016} }
  • MEDVEĎ, Marek, Vojtěch KOVÁŘ a Miloš JAKUBÍČEK. English-French Document Alignment Based on Keywords and Statistical Translation. In Proceedings of the First Conference on Machine Translation, Volume 2: Shared Task Papers. Berlin: Association for Computational Linguistics. s. 728-732. ISBN 978-1-945626-10-4. 2016. info
    @inproceedings{1352922, author = {Medveď, Marek and Kovář, Vojtěch and Jakubíček, Miloš}, address = {Berlin}, booktitle = {Proceedings of the First Conference on Machine Translation, Volume 2: Shared Task Papers}, keywords = {bilingual document alignment}, howpublished = {elektronická verze "online"}, language = {eng}, location = {Berlin}, isbn = {978-1-945626-10-4}, pages = {728--732}, publisher = {Association for Computational Linguistics}, title = {English-French Document Alignment Based on Keywords and Statistical Translation}, year = {2016} }
  • JAKUBÍČEK, Miloš a Pavel ŠMERK. Large Scale Keyword Extraction using a Finite State Backend. In Aleš Horák, Pavel Rychlý, Adam Rambousek. Tenth Workshop on Recent Advances in Slavonic Natural Language Processing, RASLAN 2016. Brno: Tribun EU. s. 143-146. ISBN 978-80-263-1095-2. 2016. URL info
    @inproceedings{1365139,
      author = {Jakubíček, Miloš and Šmerk, Pavel},
      title = {Large Scale Keyword Extraction using a Finite State Backend},
      booktitle = {Tenth Workshop on Recent Advances in Slavonic Natural Language Processing, RASLAN 2016},
      editor = {Horák, Aleš and Rychlý, Pavel and Rambousek, Adam},
      publisher = {Tribun EU},
      address = {Brno},
      location = {Brno},
      pages = {143--146},
      year = {2016},
      isbn = {978-80-263-1095-2},
      url = {https://nlp.fi.muni.cz/raslan/2016/paper17-Jakubicek_Smerk.pdf},
      language = {eng},
      howpublished = {tištěná verze "print"},
      keywords = {terminology extraction; keyword extraction; fsa; Sketch Engine},
    }
  • KOVÁŘ, Vojtěch. Evaluating Natural Language Processing Tasks with Low Inter-Annotator Agreement: The Case of Corpus Applications. In Aleš Horák, Pavel Rychlý, Adam Rambousek. Tenth Workshop on Recent Advances in Slavonic Natural Language Processing, RASLAN 2016. Brno: Tribun EU. s. 127-134. ISBN 978-80-263-1095-2. 2016. info
    @inproceedings{1365039,
      author = {Kovář, Vojtěch},
      title = {Evaluating Natural Language Processing Tasks with Low Inter-Annotator Agreement: The Case of Corpus Applications},
      booktitle = {Tenth Workshop on Recent Advances in Slavonic Natural Language Processing, RASLAN 2016},
      editor = {Horák, Aleš and Rychlý, Pavel and Rambousek, Adam},
      publisher = {Tribun EU},
      address = {Brno},
      location = {Brno},
      pages = {127--134},
      year = {2016},
      isbn = {978-80-263-1095-2},
      language = {eng},
      howpublished = {tištěná verze "print"},
      keywords = {NLP; inter-annotator agreement; low inter-annotator agreement; evaluation; application; application-based evaluation; word sketch; thesaurus; terminology},
    }
  • KOVÁŘ, Vojtěch, Jakub MACHURA, Kristýna ZEMKOVÁ a Michal ROTT. Evaluation and Improvements in Punctuation Detection for Czech. In Sojka, Petr; Horák, Aleš; Kopeček, Ivan; Pala, Karel. Text, Speech, and Dialogue 19th International Conference, TSD 2016 Brno, Czech Republic, September 12–16, 2016 Proceedings. Cham (CH): Springer. s. 287-294. ISBN 978-3-319-45509-9. doi:10.1007/978-3-319-45510-5_33. 2016. info
    @inproceedings{1358120,
      author = {Kovář, Vojtěch and Machura, Jakub and Zemková, Kristýna and Rott, Michal},
      title = {Evaluation and Improvements in Punctuation Detection for Czech},
      booktitle = {Text, Speech, and Dialogue 19th International Conference, TSD 2016 Brno, Czech Republic, September 12–16, 2016 Proceedings},
      editor = {Sojka, Petr and Horák, Aleš and Kopeček, Ivan and Pala, Karel},
      publisher = {Springer},
      address = {Cham (CH)},
      location = {Cham (CH)},
      pages = {287--294},
      year = {2016},
      isbn = {978-3-319-45509-9},
      doi = {10.1007/978-3-319-45510-5_33},
      language = {eng},
      howpublished = {tištěná verze "print"},
      keywords = {automatic punctuation detection},
    }
  • KOVÁŘ, Vojtěch, Monika MOČIARIKOVÁ a Pavel RYCHLÝ. Finding Definitions in Large Corpora with Sketch Engine. In Nicoletta Calzolari (Conference Chair) et al. Proceedings of the Tenth International Conference on Language Resources and Evaluation (LREC 2016). Portorož, Slovenia: European Language Resources Association (ELRA). s. 391-394. ISBN 978-2-9517408-9-1. 2016. info
    @inproceedings{1360550,
      author = {Kovář, Vojtěch and Močiariková, Monika and Rychlý, Pavel},
      title = {Finding Definitions in Large Corpora with Sketch Engine},
      booktitle = {Proceedings of the Tenth International Conference on Language Resources and Evaluation (LREC 2016)},
      editor = {Calzolari, Nicoletta and others},
      publisher = {European Language Resources Association (ELRA)},
      address = {Portorož, Slovenia},
      location = {Portorož, Slovenia},
      pages = {391--394},
      year = {2016},
      isbn = {978-2-9517408-9-1},
      language = {eng},
      howpublished = {paměťový nosič},
      keywords = {Sketch Engine; definition; definitions; CQL; corpora},
    }
  • STARÁ, Marie a Vojtěch KOVÁŘ. Options for Automatic Creation of Dictionary Definitions from Corpora. In Aleš Horák, Pavel Rychlý, Adam Rambousek. Tenth Workshop on Recent Advances in Slavonic Natural Language Processing, RASLAN 2016. Brno: Tribun EU. s. 111-124. ISBN 978-80-263-1095-2. 2016. URL info
    @inproceedings{1365037,
      author = {Stará, Marie and Kovář, Vojtěch},
      title = {Options for Automatic Creation of Dictionary Definitions from Corpora},
      booktitle = {Tenth Workshop on Recent Advances in Slavonic Natural Language Processing, RASLAN 2016},
      editor = {Horák, Aleš and Rychlý, Pavel and Rambousek, Adam},
      publisher = {Tribun EU},
      address = {Brno},
      location = {Brno},
      pages = {111--124},
      year = {2016},
      isbn = {978-80-263-1095-2},
      url = {https://nlp.fi.muni.cz/raslan/2016/paper13-Stara_Kovar.pdf},
      language = {eng},
      howpublished = {tištěná verze "print"},
      keywords = {dictionary definition; corpora; word sketch},
    }
  • RYCHLÝ, Pavel a Vít SUCHOMEL. Annotated Amharic Corpora. In Petr Sojka, Aleš Horák, Ivan Kopeček, Karel Pala. Text, Speech, and Dialogue 19th International Conference, TSD 2016 Brno, Czech Republic, September 12–16, 2016 Proceedings. Switzerland: Springer International Publishing. s. 295-302. ISBN 978-3-319-45509-9. doi:10.1007/978-3-319-45510-5_34. 2016. Plný text výsledku info
    @inproceedings{1353390,
      author = {Rychlý, Pavel and Suchomel, Vít},
      title = {Annotated Amharic Corpora},
      booktitle = {Text, Speech, and Dialogue 19th International Conference, TSD 2016 Brno, Czech Republic, September 12–16, 2016 Proceedings},
      editor = {Sojka, Petr and Horák, Aleš and Kopeček, Ivan and Pala, Karel},
      publisher = {Springer International Publishing},
      address = {Switzerland},
      location = {Switzerland},
      pages = {295--302},
      year = {2016},
      isbn = {978-3-319-45509-9},
      doi = {10.1007/978-3-319-45510-5_34},
      url = {http://link.springer.com/chapter/10.1007/978-3-319-45510-5_34},
      language = {eng},
      howpublished = {tištěná verze "print"},
      keywords = {Amharic; text corpus; web corpus; under-resourced language; corpus annotation; morphological tagger},
    }
  • SUCHOMEL, Vít a Pavel RYCHLÝ. Set of Ethiopian Web Corpora. 2016. URL info
    @misc{1381970,
      author = {Suchomel, Vít and Rychlý, Pavel},
      title = {Set of Ethiopian Web Corpora},
      institution = {Masarykova univerzita},
      organization = {Masarykova univerzita},
      year = {2016},
      url = {http://habit-project.eu/wiki/SetOfEthiopianWebCorpora},
      language = {eng},
      keywords = {text corpora; Ethiopian languages},
    }

2015

  • BAISA, Vít a Vít SUCHOMEL. Corpus Based Extraction of Hypernyms in Terminological Thesaurus for Land Surveying Domain. In Ninth Workshop on Recent Advances in Slavonic Natural Language Processing. Brno: Tribun EU. s. 69-74. ISBN 978-80-263-0974-1. 2015. URL info
    @inproceedings{1318498,
      author = {Baisa, Vít and Suchomel, Vít},
      title = {Corpus Based Extraction of Hypernyms in Terminological Thesaurus for Land Surveying Domain},
      booktitle = {Ninth Workshop on Recent Advances in Slavonic Natural Language Processing},
      publisher = {Tribun EU},
      address = {Brno},
      location = {Brno},
      pages = {69--74},
      year = {2015},
      isbn = {978-80-263-0974-1},
      url = {https://nlp.fi.muni.cz/raslan/2015/paper09-Baisa_Suchomel.pdf},
      language = {eng},
      howpublished = {tištěná verze "print"},
      keywords = {Sketch Engine; concordance; thesaurus; word sketch; language learning; English language; corpus},
    }
  • MEDVEĎ, Marek, Vít BAISA a Aleš HORÁK. Increasing Coverage of Translation Memories with Linguistically Motivated Segment Combination Methods. In Constantin Orasan and Rohit Gupta. Proceedings of The Workshop on Natural Language Processing for Translation Memories (NLP4TM). Bulgaria: INCOMA Ltd. Shoumen. s. 31-35. ISBN 978-954-452-032-8. 2015. The workshop on Natural Language Processing for Translation Memories info
    @inproceedings{1311833,
      author = {Medveď, Marek and Baisa, Vít and Horák, Aleš},
      title = {Increasing Coverage of Translation Memories with Linguistically Motivated Segment Combination Methods},
      booktitle = {Proceedings of The Workshop on Natural Language Processing for Translation Memories (NLP4TM)},
      editor = {Orasan, Constantin and Gupta, Rohit},
      publisher = {INCOMA Ltd. Shoumen},
      address = {Bulgaria},
      location = {Bulgaria},
      pages = {31--35},
      year = {2015},
      isbn = {978-954-452-032-8},
      url = {http://rgcl.wlv.ac.uk/events/NLP4TM/3_Paper.pdf},
      language = {eng},
      howpublished = {tištěná verze "print"},
      keywords = {translation memories; DGT; MemoQ; Moses; segment; CAT},
    }
  • KOCINCOVÁ, Lucia, Miloš JAKUBÍČEK, Vojtěch KOVÁŘ a Vít BAISA. Interactive Visualizations of Corpus Data in Sketch Engine. In Gintaré Grigonyté, Simon Clematide, Andrius Utka, Martin Volk. Proceedings of the Workshop on Innovative Corpus Query and Visualization Tools at NODALIDA 2015. Vilnius, Lithuania: Linköping University Electronic Press, Linköpings universitet. s. 17-22. ISBN 978-91-7519-035-8. 2015. info
    @inproceedings{1299713,
      author = {Kocincová, Lucia and Jakubíček, Miloš and Kovář, Vojtěch and Baisa, Vít},
      title = {Interactive Visualizations of Corpus Data in Sketch Engine},
      booktitle = {Proceedings of the Workshop on Innovative Corpus Query and Visualization Tools at NODALIDA 2015},
      editor = {Grigonyté, Gintaré and Clematide, Simon and Utka, Andrius and Volk, Martin},
      publisher = {Linköping University Electronic Press, Linköpings universitet},
      address = {Vilnius, Lithuania},
      location = {Vilnius, Lithuania},
      pages = {17--22},
      year = {2015},
      isbn = {978-91-7519-035-8},
      language = {eng},
      howpublished = {elektronická verze "online"},
      keywords = {information visualization; interactive visualization; corpora; Sketch Engine; thesaurus; word sketch; Data-Driven Documents; generative design},
    }
  • KILGARRIFF, Adam, Vít BAISA, Miloš JAKUBÍČEK a Pavel RYCHLÝ. Longest-commonest Match. In Kosem, I., Jakubíček, M., Kallas, J., Krek, S. Electronic lexicography in the 21st century: linking lexical data in the digital age. Proceedings of the eLex 2015 conference, 11-13 August 2015, Herstmonceux Castle, United Kingdom. Ljubljana: Trojina, Institute for Applied Slovene Studies. s. 397-404. ISBN 978-961-93594-3-3. 2015. URL info
    @inproceedings{1308616,
      author = {Kilgarriff, Adam and Baisa, Vít and Jakubíček, Miloš and Rychlý, Pavel},
      title = {Longest-commonest Match},
      booktitle = {Electronic lexicography in the 21st century: linking lexical data in the digital age. Proceedings of the eLex 2015 conference, 11-13 August 2015, Herstmonceux Castle, United Kingdom},
      editor = {Kosem, I. and Jakubíček, M. and Kallas, J. and Krek, S.},
      publisher = {Trojina, Institute for Applied Slovene Studies},
      address = {Ljubljana},
      location = {Ljubljana},
      pages = {397--404},
      year = {2015},
      isbn = {978-961-93594-3-3},
      url = {https://elex.link/elex2015/proceedings/eLex_2015_26_Kilgarriff+etal.pdf},
      language = {eng},
      howpublished = {elektronická verze "online"},
      keywords = {multiword expression; collocation; word sketch; Sketch Engine},
    }
  • RAMBOUSEK, Adam, Vít BAISA, Vít SUCHOMEL a Aleš HORÁK. Technologie pro využití obsahu tezauru pro publikační účely. 2015. info
    @techreport{1321769,
      author = {Rambousek, Adam and Baisa, Vít and Suchomel, Vít and Horák, Aleš},
      title = {Technologie pro využití obsahu tezauru pro publikační účely},
      institution = {Technologická agentura České republiky},
      organization = {Technologická agentura České republiky},
      year = {2015},
      language = {cze},
      keywords = {thesaurus; application; web service; extraction of terms; corpus; term},
    }
  • RAMBOUSEK, Adam, Vít BAISA, Vít SUCHOMEL, Aleš HORÁK a Lucia KOCINCOVÁ. Terminologický tezaurus pro obor zeměměřictví a katastru nemovitostí: Certifikovaná metodika. 2015. info
    @misc{1321771,
      author = {Rambousek, Adam and Baisa, Vít and Suchomel, Vít and Horák, Aleš and Kocincová, Lucia},
      title = {Terminologický tezaurus pro obor zeměměřictví a katastru nemovitostí: Certifikovaná metodika},
      year = {2015},
      language = {cze},
      keywords = {certified methodology; thesaurus; automatic extractions of terms; corpus; concordance; application; web service; surveying; cadastre},
    }
  • BAISA, Vít, Ondřej HERMAN a Miloš JAKUBÍČEK. Towards Automatic Finding of Word Sense Changes in Time. In Aleš Horák, Pavel Rychlý, Adam Rambousek. Ninth Workshop on Recent Advances in Slavonic Natural Language Processing. Brno: Tribun EU. s. 33-41. ISBN 978-80-263-0974-1. 2015. URL info
    @inproceedings{1318600,
      author = {Baisa, Vít and Herman, Ondřej and Jakubíček, Miloš},
      title = {Towards Automatic Finding of Word Sense Changes in Time},
      booktitle = {Ninth Workshop on Recent Advances in Slavonic Natural Language Processing},
      editor = {Horák, Aleš and Rychlý, Pavel and Rambousek, Adam},
      publisher = {Tribun EU},
      address = {Brno},
      location = {Brno},
      pages = {33--41},
      year = {2015},
      isbn = {978-80-263-0974-1},
      url = {https://nlp.fi.muni.cz/raslan/2015/paper13-Baisa_Herman_Jakubicek.pdf},
      language = {eng},
      howpublished = {tištěná verze "print"},
      keywords = {neologism; Sketch Engine; word sense; word sketch},
    }
  • BAISA, Vít a Vít SUCHOMEL. Turkic Language Support in Sketch Engine. In Proceedings of the international conference "Turkic Languages processing: TurkLang 2015". Kazan: Academy of Sciences of the Republic of Tatarstan Press. s. 214-223. ISBN 978-5-9690-0262-3. 2015. info
    @inproceedings{1311893,
      author = {Baisa, Vít and Suchomel, Vít},
      title = {Turkic Language Support in Sketch Engine},
      booktitle = {Proceedings of the international conference "Turkic Languages processing: TurkLang 2015"},
      publisher = {Academy of Sciences of the Republic of Tatarstan Press},
      address = {Kazan},
      location = {Kazan},
      pages = {214--223},
      year = {2015},
      isbn = {978-5-9690-0262-3},
      language = {eng},
      howpublished = {tištěná verze "print"},
      keywords = {corpus; Sketch Engine; Turkic language; Turkish; Kazakh; Kyrgyz; Turkmen; Azeri; Tatar},
    }
  • OSOLSOBĚ, Klára, Pavel ŠMERK, Karel PALA a Dana HLAVÁČKOVÁ. Deriv— softwarový nástroj pro testování mezí a možností automatické slovotvorné analýzy. In Hlaváčová, Jaroslava. Sborník semináře o digitálních zdrojích a službách ve společenských a humanitních vědách. 1. vyd. Praha: ÚFAL MFF UK. s. 42-46. ISBN 978-80-904571-9-5. 2015. URL info
    @inproceedings{1313051,
      author = {Osolsobě, Klára and Šmerk, Pavel and Pala, Karel and Hlaváčková, Dana},
      title = {Deriv— softwarový nástroj pro testování mezí a možností automatické slovotvorné analýzy},
      booktitle = {Sborník semináře o digitálních zdrojích a službách ve společenských a humanitních vědách},
      editor = {Hlaváčová, Jaroslava},
      edition = {1.},
      publisher = {ÚFAL MFF UK},
      address = {Praha},
      location = {Praha},
      pages = {42--46},
      year = {2015},
      isbn = {978-80-904571-9-5},
      url = {http://ufallab.ms.mff.cuni.cz/~hlavacova/WDH2015/wdh2015_sbornik.pdf},
      language = {cze},
      howpublished = {tištěná verze "print"},
      keywords = {derivational morphology; software tool},
    }
  • OSOLSOBĚ, Klára, Pavel ŠMERK, Karel PALA a Dana HLAVÁČKOVÁ. Deriv— softwarový nástroj pro testování mezí a možností automatické slovotvorné analýzy. In Seminář o digitálních zdrojích a službách ve společenských a humanitních vědách, Praha, 24. 9. 2015. 2015. info
    @inproceedings{1324068,
      author = {Osolsobě, Klára and Šmerk, Pavel and Pala, Karel and Hlaváčková, Dana},
      title = {Deriv— softwarový nástroj pro testování mezí a možností automatické slovotvorné analýzy},
      booktitle = {Seminář o digitálních zdrojích a službách ve společenských a humanitních vědách, Praha, 24. 9. 2015},
      year = {2015},
      language = {cze},
      keywords = {derivational morphology; software tool},
    }
  • MEDVEĎ, Marek a Aleš HORÁK. AST: New Tool for Logical Analysis of Sentences based on Transparent Intensional Logic. In Aleš Horák, Pavel Rychlý, Adam Rambousek. Ninth Workshop on Recent Advances in Slavonic Natural Language Processing. Brno: Tribun EU. s. 95-102. ISBN 978-80-263-0974-1. 2015. info
    @inproceedings{1320592,
      author = {Medveď, Marek and Horák, Aleš},
      title = {AST: New Tool for Logical Analysis of Sentences based on Transparent Intensional Logic},
      booktitle = {Ninth Workshop on Recent Advances in Slavonic Natural Language Processing},
      editor = {Horák, Aleš and Rychlý, Pavel and Rambousek, Adam},
      publisher = {Tribun EU},
      address = {Brno},
      location = {Brno},
      pages = {95--102},
      year = {2015},
      isbn = {978-80-263-0974-1},
      language = {eng},
      howpublished = {tištěná verze "print"},
      keywords = {semantics; semantic analysis; logical analysis; Transparent Intensional Logic; TIL},
    }
  • PALA, Karel a Pavel ŠMERK. Derivancze - Derivational Analyzer of Czech. In P. Král, V.Matoušek. International Conference on Text, Speech, and Dialogue, TSD 2015. Berlin, Heidelberg: Springer Verlag. s. 515-523. ISBN 978-3-319-24032-9. doi:10.1007/978-3-319-24033-6_58. 2015. info
    @inproceedings{1322843,
      author = {Pala, Karel and Šmerk, Pavel},
      title = {Derivancze - Derivational Analyzer of Czech},
      booktitle = {International Conference on Text, Speech, and Dialogue, TSD 2015},
      editor = {Král, P. and Matoušek, V.},
      publisher = {Springer Verlag},
      address = {Berlin, Heidelberg},
      location = {Berlin, Heidelberg},
      pages = {515--523},
      year = {2015},
      isbn = {978-3-319-24032-9},
      doi = {10.1007/978-3-319-24033-6_58},
      language = {eng},
      howpublished = {tištěná verze "print"},
      keywords = {derivational morphology; word formation; Czech language},
    }
  • ŠMERK, Pavel. Semantic Regularity of Derivational Relations. In Aleš Horák, Pavel Rychlý, Adam Rambousek. Ninth Workshop on Recent Advances in Slavonic Natural Language Processing. Brno: Tribun EU. s. 87-92. ISBN 978-80-263-0974-1. 2015. URL info
    @inproceedings{1320591,
      author = {Šmerk, Pavel},
      title = {Semantic Regularity of Derivational Relations},
      booktitle = {Ninth Workshop on Recent Advances in Slavonic Natural Language Processing},
      editor = {Horák, Aleš and Rychlý, Pavel and Rambousek, Adam},
      publisher = {Tribun EU},
      address = {Brno},
      location = {Brno},
      pages = {87--92},
      year = {2015},
      isbn = {978-80-263-0974-1},
      url = {https://nlp.fi.muni.cz/raslan/2015/paper14-Smerk.pdf},
      language = {eng},
      howpublished = {tištěná verze "print"},
      keywords = {derivational morphology; semantics of the derivational relations; word2vec},
    }

Before 2015

  • ARTS, Tressy, Yonatan BELINKOV, Nizar HABASH, Adam KILGARRIFF a Vít SUCHOMEL. arTenTen: Arabic Corpus and Word Sketches. Journal of King Saud University-Computer and Information Sciences. Elsevier, roč. 2014, č. 26, s. 381-395. ISSN 1319-1578. doi:10.1016/j.jksuci.2014.06.009. 2014. plný text článku info
    @article{1210667,
      author = {Arts, Tressy and Belinkov, Yonatan and Habash, Nizar and Kilgarriff, Adam and Suchomel, Vít},
      title = {arTenTen: Arabic Corpus and Word Sketches},
      journal = {Journal of King Saud University-Computer and Information Sciences},
      volume = {2014},
      number = {26},
      pages = {381--395},
      year = {2014},
      issn = {1319-1578},
      doi = {10.1016/j.jksuci.2014.06.009},
      url = {http://www.sciencedirect.com/science/article/pii/S1319157814000330},
      language = {eng},
      keywords = {Corpora; Lexicography; Morphology; Concordance; Arabic},
    }
  • KILGARRIFF, Adam, Pavel RYCHLÝ, Miloš JAKUBÍČEK, Vojtěch KOVÁŘ, Vít BAISA a Lucia KOCINCOVÁ. Extrinsic Corpus Evaluation with a Collocation Dictionary Task. In Nicoletta Calzolari (Conference Chair) and Khalid Choukri and Thierry Declerck and Hrafn Loftsson and Bente Maegaard and Joseph Mariani and Asuncion Moreno and Jan Odijk and Stelios Piperidis. Proceedings of the Ninth International Conference on Language Resources and Evaluation (LREC'14). Reykjavik, Iceland: European Language Resources Association (ELRA). s. 1-8. ISBN 978-2-9517408-8-4. 2014. URL info
    @inproceedings{1186170,
      author = {Kilgarriff, Adam and Rychlý, Pavel and Jakubíček, Miloš and Kovář, Vojtěch and Baisa, Vít and Kocincová, Lucia},
      title = {Extrinsic Corpus Evaluation with a Collocation Dictionary Task},
      booktitle = {Proceedings of the Ninth International Conference on Language Resources and Evaluation (LREC'14)},
      editor = {Calzolari, Nicoletta and Choukri, Khalid and Declerck, Thierry and Loftsson, Hrafn and Maegaard, Bente and Mariani, Joseph and Moreno, Asuncion and Odijk, Jan and Piperidis, Stelios},
      publisher = {European Language Resources Association (ELRA)},
      address = {Reykjavik, Iceland},
      location = {Reykjavik, Iceland},
      pages = {1--8},
      year = {2014},
      isbn = {978-2-9517408-8-4},
      url = {http://www.lrec-conf.org/proceedings/lrec2014/summaries/52.html},
      language = {eng},
      howpublished = {elektronická verze "online"},
      keywords = {corpus; evaluation; collocation},
    }
  • BAISA, Vít a Vojtěch KOVÁŘ. Information Extraction for Czech Based on Syntactic Analysis. In Zygmunt Vetulani, Joseph Mariani. Human Language Technology Challenges for Computer Science and Linguistics. Cham: Springer. s. 155-165. ISBN 978-3-319-08957-7. doi:10.1007/978-3-319-08958-4_13. 2014. info
    @inproceedings{1210672,
      author = {Baisa, Vít and Kovář, Vojtěch},
      title = {Information Extraction for Czech Based on Syntactic Analysis},
      booktitle = {Human Language Technology Challenges for Computer Science and Linguistics},
      editor = {Vetulani, Zygmunt and Mariani, Joseph},
      publisher = {Springer},
      address = {Cham},
      location = {Cham},
      pages = {155--165},
      year = {2014},
      isbn = {978-3-319-08957-7},
      doi = {10.1007/978-3-319-08958-4_13},
      language = {eng},
      howpublished = {tištěná verze "print"},
      keywords = {information extraction; Czech language; syntactic analysis},
    }
  • BAISA, Vít a Vít SUCHOMEL. SkELL: Web Interface for English Language Learning. In Eighth Workshop on Recent Advances in Slavonic Natural Language Processing. Brno: Tribun EU. s. 63-70. ISSN 2336-4289. 2014. URL info
    @inproceedings{1210697,
      author = {Baisa, Vít and Suchomel, Vít},
      title = {SkELL: Web Interface for English Language Learning},
      booktitle = {Eighth Workshop on Recent Advances in Slavonic Natural Language Processing},
      publisher = {Tribun EU},
      address = {Brno},
      location = {Brno},
      pages = {63--70},
      year = {2014},
      issn = {2336-4289},
      url = {https://nlp.fi.muni.cz/raslan/2014/12.pdf},
      language = {eng},
      howpublished = {tištěná verze "print"},
      keywords = {Sketch Engine; concordance; thesaurus; word sketch; language learning; English language; corpus},
    }
  • KILGARRIFF, Adam, Vít BAISA, Jan BUŠTA, Miloš JAKUBÍČEK, Vojtěch KOVÁŘ, Jan MICHELFEIT, Pavel RYCHLÝ a Vít SUCHOMEL. The Sketch Engine: ten years on. Lexicography. Springer Berlin Heidelberg, roč. 1, č. 1, s. 7-36. ISSN 2197-4292. doi:10.1007/s40607-014-0009-9. 2014. URL info
    @article{1193200,
      author = {Kilgarriff, Adam and Baisa, Vít and Bušta, Jan and Jakubíček, Miloš and Kovář, Vojtěch and Michelfeit, Jan and Rychlý, Pavel and Suchomel, Vít},
      title = {The Sketch Engine: ten years on},
      journal = {Lexicography},
      volume = {1},
      number = {1},
      pages = {7--36},
      year = {2014},
      issn = {2197-4292},
      doi = {10.1007/s40607-014-0009-9},
      url = {http://dx.doi.org/10.1007/s40607-014-0009-9},
      language = {eng},
      keywords = {Corpora; Corpus lexicography; Corpus tools; Word sketches; Sketch Engine},
    }
  • BAISA, Vít a Vít SUCHOMEL. Intrinsic Methods for Comparison of Corpora. In A. Horák, P. Rychlý. RASLAN 2013 Recent Advances in Slavonic Natural Language Processing. první. Brno: Tribun EU. s. 51-58. ISBN 978-80-263-0520-0. 2013. URL info
    @inproceedings{1131260,
      author = {Baisa, Vít and Suchomel, Vít},
      title = {Intrinsic Methods for Comparison of Corpora},
      booktitle = {RASLAN 2013 Recent Advances in Slavonic Natural Language Processing},
      editor = {Horák, A. and Rychlý, P.},
      edition = {první},
      publisher = {Tribun EU},
      address = {Brno},
      location = {Brno},
      pages = {51--58},
      year = {2013},
      isbn = {978-80-263-0520-0},
      url = {https://nlp.fi.muni.cz/raslan/2013/paper05.pdf},
      language = {eng},
      howpublished = {tištěná verze "print"},
      keywords = {text corpus; corpora comparison},
    }
  • BAISA, Vít a Vít SUCHOMEL. Detecting Spam in Web Corpora. In Aleš Horák, Pavel Rychlý. 6th Workshop on Recent Advances in Slavonic Natural Language Processing. Brno: Tribun EU. s. 69-76. ISBN 978-80-263-0313-8. 2012. URL info
    @inproceedings{1077953,
      author = {Baisa, Vít and Suchomel, Vít},
      title = {Detecting Spam in Web Corpora},
      booktitle = {6th Workshop on Recent Advances in Slavonic Natural Language Processing},
      editor = {Horák, Aleš and Rychlý, Pavel},
      publisher = {Tribun EU},
      address = {Brno},
      location = {Brno},
      pages = {69--76},
      year = {2012},
      isbn = {978-80-263-0313-8},
      url = {https://nlp.fi.muni.cz/raslan/2012/paper05.pdf},
      language = {eng},
      howpublished = {tištěná verze "print"},
      keywords = {spam detection; web corpora; n-gram},
    }
  • KILGARRIFF, Adam, Pavel RYCHLÝ, Vojtěch KOVÁŘ a Vít BAISA. Finding Multiwords of More Than Two Words. In Proceedings of the 15th EURALEX International Congress. Oslo: Department of Linguistics and Scandinavian Studies, University of Oslo. s. 693-700. ISBN 978-82-303-2095-2. 2012. info
    @inproceedings{982493,
      author = {Kilgarriff, Adam and Rychlý, Pavel and Kovář, Vojtěch and Baisa, Vít},
      title = {Finding Multiwords of More Than Two Words},
      booktitle = {Proceedings of the 15th EURALEX International Congress},
      publisher = {Department of Linguistics and Scandinavian Studies, University of Oslo},
      address = {Oslo},
      location = {Oslo},
      pages = {693--700},
      year = {2012},
      isbn = {978-82-303-2095-2},
      language = {eng},
      howpublished = {tištěná verze "print"},
      keywords = {collocations; multiword expressions; multiwords; corpus lexicography; word sketches},
    }
  • BAISA, Vít a Vít SUCHOMEL. Large Corpora for Turkic Languages and Unsupervised Morphological Analysis. In Seniz Demir, Ilknur Durgar El-Kahlout, Mehmet Ugur Dogan. Proceedings of the Eight International Conference on Language Resources and Evaluation (LREC'12). Istanbul, Turkey: European Language Resources Association (ELRA). s. 28-32. ISBN 978-2-9517408-7-7. 2012. URL info
    @inproceedings{982494,
      author = {Baisa, Vít and Suchomel, Vít},
      title = {Large Corpora for Turkic Languages and Unsupervised Morphological Analysis},
      booktitle = {Proceedings of the Eight International Conference on Language Resources and Evaluation (LREC'12)},
      editor = {Demir, Seniz and Durgar El-Kahlout, Ilknur and Dogan, Mehmet Ugur},
      publisher = {European Language Resources Association (ELRA)},
      address = {Istanbul, Turkey},
      location = {Istanbul, Turkey},
      pages = {28--32},
      year = {2012},
      isbn = {978-2-9517408-7-7},
      url = {http://www.lrec-conf.org/proceedings/lrec2012/workshops/02.Turkic%20Languages%20Proceedings.pdf},
      language = {eng},
      howpublished = {elektronická verze "online"},
      keywords = {corpus; turkic languages; unsupervised morphological analysis},
    }
  • BAISA, Vít a Vojtěch KOVÁŘ. Information Extraction for Czech Based on Syntactic Analysis. In Zygmunt Vetulani. Human Language Technologies as a Challenge for Computer Science and Linguistics, Proceedings of 5th Language and Technology Conference. Poznań: Fundacja Uniwersytetu im. A. Mickiewicza. s. 466-470. ISBN 978-83-932640-1-8. 2011. info
    @inproceedings{959033,
      author = {Baisa, Vít and Kovář, Vojtěch},
      title = {Information Extraction for Czech Based on Syntactic Analysis},
      booktitle = {Human Language Technologies as a Challenge for Computer Science and Linguistics, Proceedings of 5th Language and Technology Conference},
      editor = {Vetulani, Zygmunt},
      publisher = {Fundacja Uniwersytetu im. A. Mickiewicza},
      location = {Poznań},
      pages = {466--470},
      year = {2011},
      isbn = {978-83-932640-1-8},
      language = {eng},
      keywords = {information extraction; syntactic analysis; semantic classification; morphological disambiguation},
    }
  • BOJAR, Ondřej, Vojtěch DIATKA, Pavel RYCHLÝ, Pavel STRAŇÁK, Vít SUCHOMEL, Aleš TAMCHYNA a Daniel ZEMAN. HindEnCorp – Hindi-English and Hindi-only Corpus for Machine Translation. In Nicoletta Calzolari (Conference Chair) and Khalid Choukri and Thierry Declerck and Hrafn Loftsson and Bente Maegaard and Joseph Mariani and Asuncion Moreno and Jan Odijk and Stelios Piperidis. Proceedings of the Ninth International Conference on Language Resources and Evaluation (LREC'14). Reykjavik, Iceland: European Language Resources Association (ELRA). s. 3550-3555. ISBN 978-2-9517408-8-4. 2014. URL info
    @inproceedings{1195822,
      author = {Bojar, Ondřej and Diatka, Vojtěch and Rychlý, Pavel and Straňák, Pavel and Suchomel, Vít and Tamchyna, Aleš and Zeman, Daniel},
      title = {HindEnCorp – Hindi-English and Hindi-only Corpus for Machine Translation},
      booktitle = {Proceedings of the Ninth International Conference on Language Resources and Evaluation (LREC'14)},
      editor = {Calzolari, Nicoletta and Choukri, Khalid and Declerck, Thierry and Loftsson, Hrafn and Maegaard, Bente and Mariani, Joseph and Moreno, Asuncion and Odijk, Jan and Piperidis, Stelios},
      publisher = {European Language Resources Association (ELRA)},
      address = {Reykjavik, Iceland},
      location = {Reykjavik, Iceland},
      pages = {3550--3555},
      year = {2014},
      isbn = {978-2-9517408-8-4},
      url = {http://www.lrec-conf.org/proceedings/lrec2014/summaries/835.html},
      language = {eng},
      howpublished = {elektronická verze "online"},
      keywords = {Machine Translation; SpeechToSpeech Translation; Metadata},
    }
  • KASPRZAK, Jan, Michal BRANDEJS, Miroslav KŘIPAČ a Pavel ŠMERK. Distributed System for Discovering Similar Documents: From a Relational Database to the Custom-Developed Parallel Solution. In ICEIS 2008: Proceedings of the Tenth International Conference on Enterprise Information Systems, Vol. DISI - Databases and Informations Systems Integration. Setúbal, Portugal: INSTICC (Institute for Systems and Technologies of Information, Control and Communication). s. 437-440. ISBN 978-989-8111-36-4. 2008. info
    @inproceedings{838694,
      author = {Kasprzak, Jan and Brandejs, Michal and Křipač, Miroslav and Šmerk, Pavel},
      title = {Distributed System for Discovering Similar Documents: From a Relational Database to the Custom-Developed Parallel Solution},
      booktitle = {ICEIS 2008: Proceedings of the Tenth International Conference on Enterprise Information Systems, Vol. DISI - Databases and Informations Systems Integration},
      publisher = {INSTICC (Institute for Systems and Technologies of Information, Control and Communication)},
      address = {Setúbal, Portugal},
      location = {Setúbal, Portugal},
      pages = {437--440},
      year = {2008},
      isbn = {978-989-8111-36-4},
      language = {eng},
      keywords = {University; Plagiarism; Similar Documents; Cluster; Information System; Theses},
    }
  • BUŠTA, Jan. Type-based Search of Idiomatic Expression. In Aleš Horák, Pavel Rychlý. Seventh Workshop on Recent Advances in Slavonic Natural Language Processing, RASLAN 2013. Brno: Tribun EU. s. 93-96. ISBN 978-80-263-0520-0. 2013. URL info
    @inproceedings{1131878,
      author = {Bušta, Jan},
      title = {Type-based Search of Idiomatic Expression},
      booktitle = {Seventh Workshop on Recent Advances in Slavonic Natural Language Processing, RASLAN 2013},
      editor = {Horák, Aleš and Rychlý, Pavel},
      publisher = {Tribun EU},
      address = {Brno},
      location = {Brno},
      pages = {93--96},
      year = {2013},
      isbn = {978-80-263-0520-0},
      url = {https://nlp.fi.muni.cz/raslan/2013/paper12.pdf},
      language = {eng},
      howpublished = {tištěná verze "print"},
      keywords = {idioms; idiomatic candidates; syntactic fixedness; lexical fixedness; transitive verbs; thesaurus},
    }
  • BUŠTA, Jan a Miloš JAKUBÍČEK. E-learning punctuation test based on the error corpus. 2010. URL info
    @misc{935745,
      author = {Bušta, Jan and Jakubíček, Miloš},
      title = {E-learning punctuation test based on the error corpus},
      institution = {Masarykova univerzita},
      organization = {Masarykova univerzita},
      year = {2010},
      url = {http://is.muni.cz/el/1433/jaro2009/VB000/odp/interpunkce.qref},
      language = {eng},
      keywords = {e-learning;punctuation;text errors; corpus},
    }
  • MORAVEC, Jaroslav, Vojtěch KOVÁŘ, Jan BUŠTA a Miloš JAKUBÍČEK. OOCorr. 2010. URL info
    @misc{935743,
      author = {Moravec, Jaroslav and Kovář, Vojtěch and Bušta, Jan and Jakubíček, Miloš},
      title = {OOCorr},
      institution = {Masarykova univerzita},
      organization = {Masarykova univerzita},
      year = {2010},
      url = {http://nlp.fi.muni.cz/projekty/oocorr/},
      language = {eng},
      keywords = {text corpus; text errors; annotation; OpenOffice.org},
    }
  • BUŠTA, Jan a Miloš JAKUBÍČEK. Building of Corpus Based E-learning Materials for Czech. In SCO 2009 : Sharable Content Objects : 6. ročník konference o elektronické podpoře výuky. 1. vyd. Brno: Masarykova univerzita. s. 144-149. ISBN 978-80-210-4878-2. 2009. SCO 2009 info
    @inproceedings{836948,
      author = {Bušta, Jan and Jakubíček, Miloš},
      title = {Building of Corpus Based E-learning Materials for Czech},
      booktitle = {SCO 2009 : Sharable Content Objects : 6. ročník konference o elektronické podpoře výuky},
      edition = {1},
      pages = {144--149},
      publisher = {Masarykova univerzita},
      address = {Brno},
      location = {Brno},
      year = {2009},
      isbn = {978-80-210-4878-2},
      url = {http://sco.muni.cz/2009},
      language = {eng},
      keywords = {corpus;e-learning;real-world examples;writing of Czech texts;categorization of mistakes},
    }
  • JAKUBÍČEK, Miloš, Jan BUŠTA, Dana HLAVÁČKOVÁ a Karel PALA. Classification of Errors in Text. In RASLAN 2009 : Recent Advances in Slavonic Natural Language Processing. 1. vyd. Brno: Masaryk University. s. 109-119. ISBN 978-80-210-5048-8. 2009. URL info
    @inproceedings{866439,
      author = {Jakubíček, Miloš and Bušta, Jan and Hlaváčková, Dana and Pala, Karel},
      title = {Classification of Errors in Text},
      booktitle = {RASLAN 2009 : Recent Advances in Slavonic Natural Language Processing},
      edition = {1},
      pages = {109--119},
      publisher = {Masaryk University},
      address = {Brno},
      location = {Brno},
      year = {2009},
      isbn = {978-80-210-5048-8},
      url = {http://nlp.fi.muni.cz/raslan/2009/},
      howpublished = {tištěná verze "print"},
      language = {eng},
      keywords = {errors in text; classification of errors},
    }
  • KOVÁŘ, Vojtěch, Miloš JAKUBÍČEK a Jan BUŠTA. Czech Vulgarisms in Text Corpora. In After Half a Century of Slavonic Natural Language Processing. 1. vyd. Brno: Tribun EU s.r.o. s. 141-145. ISBN 978-80-7399-815-8. 2009. info
    @incollection{847703,
      author = {Kovář, Vojtěch and Jakubíček, Miloš and Bušta, Jan},
      title = {Czech Vulgarisms in Text Corpora},
      booktitle = {After Half a Century of Slavonic Natural Language Processing},
      edition = {1},
      pages = {141--145},
      publisher = {Tribun EU s.r.o.},
      address = {Brno},
      location = {Brno},
      year = {2009},
      isbn = {978-80-7399-815-8},
      language = {eng},
      keywords = {vulgarism; text corpus},
    }
  • BUŠTA, Jan. Četnost idiomů v textovém korpusu. In VARIA XVIII Zborník príspevkov z XVIII. kolokvia mladých jazykovedcov. Prešov: Filozofická fakulta Prešovskej univerzity v Prešove. s. 89-92, 3 s. ISBN 978-80-555-0083-6. 2009. info
    @inproceedings{866663,
      author = {Bušta, Jan},
      title = {Četnost idiomů v textovém korpusu},
      booktitle = {VARIA XVIII Zborník príspevkov z XVIII. kolokvia mladých jazykovedcov},
      pages = {89--92},
      publisher = {Filozofická fakulta Prešovskej univerzity v Prešove},
      address = {Prešov},
      location = {Prešov},
      year = {2009},
      isbn = {978-80-555-0083-6},
      language = {cze},
      keywords = {idioms; MWE; corpora},
    }
  • BUŠTA, Jan. Computing Idioms Frequency in Text Corpora. In Proceedings of Recent Advances in Slavonic Natural Language Processing 2008. Brno: Masaryk University. s. 0-0, 4 s. ISBN 978-80-210-4741-9. 2008. URL info
    @inproceedings{806007,
      author = {Bušta, Jan},
      title = {Computing Idioms Frequency in Text Corpora},
      booktitle = {Proceedings of Recent Advances in Slavonic Natural Language Processing 2008},
      publisher = {Masaryk University},
      address = {Brno},
      location = {Brno},
      year = {2008},
      isbn = {978-80-210-4741-9},
      url = {https://nlp.fi.muni.cz/raslan/2008/papers/12.pdf},
      howpublished = {tištěná verze "print"},
      language = {eng},
      keywords = {frequency of idioms; headwords; text corpora; czech language},
    }
  • ČAPEK, Tomáš a Pavel ŠMERK. Towards Partial Word Sense Disambiguation Tools for Czech. In Proceedings of Fourth Workshop on Recent Advances in Slavonic Natural Language Processing, RASLAN 2010. Brno: Tribun EU. 6 s. ISBN 978-80-7399-246-0. 2010. URL info
    @inproceedings{914408,
      author = {Čapek, Tomáš and Šmerk, Pavel},
      title = {Towards Partial Word Sense Disambiguation Tools for Czech},
      booktitle = {Proceedings of Fourth Workshop on Recent Advances in Slavonic Natural Language Processing, RASLAN 2010},
      publisher = {Tribun EU},
      address = {Brno},
      location = {Brno},
      year = {2010},
      isbn = {978-80-7399-246-0},
      url = {https://nlp.fi.muni.cz/raslan/2010/paper13.pdf},
      howpublished = {tištěná verze "print"},
      language = {eng},
      keywords = {word sense disambiguation; morphological disambiguation; multi-word expression recognition},
    }
  • ČAPEK, Tomáš a Pavel ŠMERK. SAFT - sémantický anotátor volného textu. 2009. URL info
    @misc{928565,
      author = {Čapek, Tomáš and Šmerk, Pavel},
      title = {SAFT - sémantický anotátor volného textu},
      year = {2009},
      url = {http://nlp.fi.muni.cz/projekty/saft/},
      institution = {Masarykova univerzita},
      organization = {Masarykova univerzita},
      language = {cze},
      keywords = {semantic annotation; wordnet; morphological analysis},
    }
  • ČERNÁ, Anna, Hana KONEČNÁ, Hana MŽOURKOVÁ, Markéta PRAVDOVÁ, Martin PROŠEK, Kamila SMEJKALOVÁ, Ivana SVOBODOVÁ, Ludmila UHLÍŘOVÁ, Jan CHROMÝ, Dana HLAVÁČKOVÁ, Karel PALA a Pavel ŠMERK. Internetová jazyková příručka. Praha: Ústav pro jazyk český AV ČR, v. v. i., 2011. URL info
    @misc{1344319,
      author = {Černá, Anna and Konečná, Hana and Mžourková, Hana and Pravdová, Markéta and Prošek, Martin and Smejkalová, Kamila and Svobodová, Ivana and Uhlířová, Ludmila and Chromý, Jan and Hlaváčková, Dana and Pala, Karel and Šmerk, Pavel},
      title = {Internetová jazyková příručka},
      publisher = {Ústav pro jazyk český AV ČR, v. v. i.},
      address = {Praha},
      location = {Praha},
      year = {2011},
      url = {http://prirucka.ujc.cas.cz/},
      language = {cze},
      keywords = {dictionary; orthography; grammar},
    }
  • DOVUDOV, Gulshan, Vít SUCHOMEL a Pavel ŠMERK. POS Annotated 50M Corpus of Tajik Language. In Proceedings of the Workshop on Language Technology for Normalisation of Less-Resourced Languages (SALTMIL 8/AfLaT 2012). Istanbul: European Language Resources Association (ELRA). s. 93-98. ISBN 978-2-9517408-7-7. 2012. URL info
    @inproceedings{1073390,
      author = {Dovudov, Gulshan and Suchomel, Vít and Šmerk, Pavel},
      title = {POS Annotated 50M Corpus of Tajik Language},
      booktitle = {Proceedings of the Workshop on Language Technology for Normalisation of Less-Resourced Languages (SALTMIL 8/AfLaT 2012)},
      pages = {93--98},
      publisher = {European Language Resources Association (ELRA)},
      address = {Istanbul},
      location = {Istanbul},
      year = {2012},
      isbn = {978-2-9517408-7-7},
      url = {http://www.cnts.ua.ac.be/sites/default/files/saltmil8-aflat2012.pdf},
      howpublished = {elektronická verze "online"},
      language = {eng},
      keywords = {Tajik language; Tajik corpus; morphological analysis of Tajik},
    }
  • DOVUDOV, Gulshan, Vít SUCHOMEL a Pavel ŠMERK. Towards 100M Morphologically Annotated Corpus of Tajik. In Aleš Horák, Pavel Rychlý. Proceedings of Recent Advances in Slavonic Natural Language Processing, RASLAN 2012. Brno: Tribun EU. s. 91-94. ISBN 978-80-263-0313-8. 2012. URL info
    @inproceedings{1096012,
      author = {Dovudov, Gulshan and Suchomel, Vít and Šmerk, Pavel},
      title = {Towards 100M Morphologically Annotated Corpus of Tajik},
      booktitle = {Proceedings of Recent Advances in Slavonic Natural Language Processing, RASLAN 2012},
      editor = {Horák, Aleš and Rychlý, Pavel},
      pages = {91--94},
      publisher = {Tribun EU},
      address = {Brno},
      location = {Brno},
      year = {2012},
      isbn = {978-80-263-0313-8},
      url = {https://nlp.fi.muni.cz/raslan/2012/paper15.pdf},
      howpublished = {tištěná verze "print"},
      language = {eng},
      keywords = {web corpora; Tajik},
    }
  • DOVUDOV, Gulshan, Jan POMIKÁLEK, Vít SUCHOMEL a Pavel ŠMERK. Building a 50M Corpus of Tajik Language. In Aleš Horák, Pavel Rychlý. Proceedings of Recent Advances in Slavonic Natural Language Processing, RASLAN 2011. Brno: Tribun EU. s. 89-95. ISBN 978-80-263-0077-9. 2011. URL info
    @inproceedings{959067,
      author = {Dovudov, Gulshan and Pomikálek, Jan and Suchomel, Vít and Šmerk, Pavel},
      title = {Building a 50M Corpus of Tajik Language},
      booktitle = {Proceedings of Recent Advances in Slavonic Natural Language Processing, RASLAN 2011},
      editor = {Horák, Aleš and Rychlý, Pavel},
      pages = {89--95},
      publisher = {Tribun EU},
      address = {Brno},
      location = {Brno},
      year = {2011},
      isbn = {978-80-263-0077-9},
      url = {https://nlp.fi.muni.cz/raslan/2011/paper07.pdf},
      howpublished = {tištěná verze "print"},
      language = {eng},
      keywords = {language corpora; corpus; corpus building; tajik},
    }
  • GOLEMBIOVSKÝ, Jiří, Aleš HORÁK a Miloš JAKUBÍČEK. wwwsynt - webové rozhraní analyzátoru synt. 2010. URL info
    @misc{935708,
      author = {Golembiovský, Jiří and Horák, Aleš and Jakubíček, Miloš},
      title = {wwwsynt - webové rozhraní analyzátoru synt},
      year = {2010},
      url = {http://nlp.fi.muni.cz/projekty/wwwsynt/},
      institution = {Masarykova univerzita},
      organization = {Masarykova univerzita},
      language = {cze},
      keywords = {syntactic analysis;Czech;parsing;synt},
    }
  • JAKUBÍČEK, Miloš, Vojtěch KOVÁŘ a Marek GRÁC. Through Low-Cost Annotation to Reliable Parsing Evaluation. In PACLIC 24 Proceedings of the 24th Pacific Asia Conference on Language, Information and Computation. Tokyo: Waseda University. s. 555-562. ISBN 978-4-905166-00-9. 2010. URL info
    @inproceedings{908010,
      author = {Jakubíček, Miloš and Kovář, Vojtěch and Grác, Marek},
      title = {Through Low-Cost Annotation to Reliable Parsing Evaluation},
      booktitle = {PACLIC 24 Proceedings of the 24th Pacific Asia Conference on Language, Information and Computation},
      pages = {555--562},
      publisher = {Waseda University},
      address = {Tokyo},
      location = {Tokyo},
      year = {2010},
      isbn = {978-4-905166-00-9},
      url = {http://aclweb.org/anthology/Y/Y10/Y10-1064.pdf},
      howpublished = {tištěná verze "print"},
      language = {eng},
      keywords = {noun phrases;parsing;parser evaluation;annotation;inter-annotator agreement},
    }
  • KOVÁŘ, Vojtěch a Ondřej HERMAN. Methods for Detection of Word Usage over Time. In Seventh Workshop on Recent Advances in Slavonic Natural Language Processing, RASLAN 2013. Brno: Tribun EU. s. 79-85. ISBN 978-80-263-0520-0. 2013. URL info
    @inproceedings{1131909,
      author = {Kovář, Vojtěch and Herman, Ondřej},
      title = {Methods for Detection of Word Usage over Time},
      booktitle = {Seventh Workshop on Recent Advances in Slavonic Natural Language Processing, RASLAN 2013},
      pages = {79--85},
      publisher = {Tribun EU},
      address = {Brno},
      location = {Brno},
      year = {2013},
      isbn = {978-80-263-0520-0},
      url = {https://nlp.fi.muni.cz/raslan/2013/paper11.pdf},
      howpublished = {tištěná verze "print"},
      language = {eng},
      keywords = {word usage; time series; regression methods; Theil-Sen estimator; Mann-Kendall test},
    }
  • ŠMERK, Pavel a Dana HLAVÁČKOVÁ. Derivační analyzátor češtiny. 2011. URL info
    @misc{979827,
      author = {Šmerk, Pavel and Hlaváčková, Dana},
      title = {Derivační analyzátor češtiny},
      year = {2011},
      url = {http://nlp.fi.muni.cz/projekty/derivance},
      institution = {Masarykova univerzita},
      organization = {Masarykova univerzita},
      language = {cze},
      keywords = {derivational morphology; derivational analysis; Czech morphology},
    }
  • OSOLSOBĚ, Klára, Dana HLAVÁČKOVÁ, Karel PALA a Pavel ŠMERK. Exploring Derivational Relations in Czech with the Deriv Tool. In NLP, Corpus Linguistics, Corpus Based Grammar Research. Bratislava, Slovakia: Tribun. s. 152-161. ISBN 978-80-7399-875-2. 2009. info
    @inproceedings{857324,
      author = {Osolsobě, Klára and Hlaváčková, Dana and Pala, Karel and Šmerk, Pavel},
      title = {Exploring Derivational Relations in Czech with the Deriv Tool},
      booktitle = {NLP, Corpus Linguistics, Corpus Based Grammar Research},
      pages = {152--161},
      publisher = {Tribun},
      address = {Bratislava, Slovakia},
      location = {Bratislava, Slovakia},
      year = {2009},
      isbn = {978-80-7399-875-2},
      language = {eng},
      keywords = {NLP; word derivation; corpus linguistics},
    }
  • OSOLSOBĚ, Klára, Karel PALA, Pavel ŠMERK a Dana HLAVÁČKOVÁ. Relations between Formal and Derivational Morphology in Czech. In Czech in Formal Grammar. Mnichov: Lincom. s. 79-87. ISBN 978-3-89586-282-3. 2009. info
    @inproceedings{862414,
      author = {Osolsobě, Klára and Pala, Karel and Šmerk, Pavel and Hlaváčková, Dana},
      title = {Relations between Formal and Derivational Morphology in Czech},
      booktitle = {Czech in Formal Grammar},
      pages = {79--87},
      publisher = {Lincom},
      address = {Mnichov},
      location = {Mnichov},
      year = {2009},
      isbn = {978-3-89586-282-3},
      language = {eng},
      keywords = {formal morphology; derivational morphology; NLP},
    }
  • HORÁK, Aleš, Tomáš HOLAN, Vladimír KADLEC a Vojtěch KOVÁŘ. Dependency and Phrasal Parsers of the Czech Language: A Comparison. In Proceedings of 10th International Conference on Text, Speech, and Dialogue (TSD 2007). Berlin, Heidelberg: Springer. s. 76-84. ISBN 978-3-540-74627-0. 2007. info
    @inproceedings{746063,
      author = {Horák, Aleš and Holan, Tomáš and Kadlec, Vladimír and Kovář, Vojtěch},
      title = {Dependency and Phrasal Parsers of the Czech Language: A Comparison},
      booktitle = {Proceedings of 10th International Conference on Text, Speech, and Dialogue (TSD 2007)},
      pages = {76--84},
      publisher = {Springer},
      address = {Berlin, Heidelberg},
      location = {Berlin, Heidelberg},
      year = {2007},
      isbn = {978-3-540-74627-0},
      language = {eng},
      keywords = {parsing; Czech},
    }
  • HORÁK, Aleš, Adam RAMBOUSEK, Vít SUCHOMEL a Lucia KOCINCOVÁ. Semiautomatic Building and Extension of Terminological Thesaurus for Land Surveying Domain. In Aleš Horák, Pavel Rychlý. Eighth Workshop on Recent Advances in Slavonic Natural Language Processing. Brno: Tribun EU. s. 129-137. ISSN 2336-4289. 2014. PDF full paper info
    @inproceedings{1210709,
      author = {Horák, Aleš and Rambousek, Adam and Suchomel, Vít and Kocincová, Lucia},
      title = {Semiautomatic Building and Extension of Terminological Thesaurus for Land Surveying Domain},
      booktitle = {Eighth Workshop on Recent Advances in Slavonic Natural Language Processing},
      editor = {Horák, Aleš and Rychlý, Pavel},
      pages = {129--137},
      publisher = {Tribun EU},
      address = {Brno},
      location = {Brno},
      year = {2014},
      url = {https://nlp.fi.muni.cz/raslan/2014/2.pdf},
      howpublished = {tištěná verze "print"},
      language = {eng},
      keywords = {corpus building; thesaurus; terminological dictionary; term extraction; DEB platform},
    }
  • HORÁK, Aleš a Marek MEDVEĎ. SQAD: Simple Question Answering Database. In Eighth Workshop on Recent Advances in Slavonic Natural Language Processing. Brno: Tribun EU. s. 121-128. ISSN 2336-4289. 2014. info
    @inproceedings{1210707,
      author = {Horák, Aleš and Medveď, Marek},
      title = {SQAD: Simple Question Answering Database},
      booktitle = {Eighth Workshop on Recent Advances in Slavonic Natural Language Processing},
      pages = {121--128},
      publisher = {Tribun EU},
      address = {Brno},
      location = {Brno},
      year = {2014},
      howpublished = {tištěná verze "print"},
      language = {eng},
      keywords = {question answering; Simple Question Answering Database; SQAD; syntax-based question answering; SBQA},
    }
  • HORÁK, Aleš, Miloš JAKUBÍČEK a Vojtěch KOVÁŘ. Linguistic Logical Analysis of Direct Speech. In Aleš Horák, Pavel Rychlý. RASLAN 2012 Recent Advances in Slavonic Natural Language Processing. Brno, Czech Republic: Tribun EU. s. 51-59. ISBN 978-80-263-0313-8. 2012. URL info
    @inproceedings{1079842,
      author = {Horák, Aleš and Jakubíček, Miloš and Kovář, Vojtěch},
      title = {Linguistic Logical Analysis of Direct Speech},
      booktitle = {RASLAN 2012 Recent Advances in Slavonic Natural Language Processing},
      editor = {Horák, Aleš and Rychlý, Pavel},
      pages = {51--59},
      publisher = {Tribun EU},
      address = {Brno, Czech Republic},
      location = {Brno, Czech Republic},
      year = {2012},
      isbn = {978-80-263-0313-8},
      url = {https://nlp.fi.muni.cz/raslan/2012/paper09.pdf},
      howpublished = {tištěná verze "print"},
      language = {eng},
      keywords = {direct speech; indirect speech; Transparent Intensional Logic; TIL; Normal Translation Algorithm; NTA; logical analysis; syntactic analysis; parsing},
    }
  • KOVÁŘ, Vojtěch, Miloš JAKUBÍČEK a Aleš HORÁK. Syntactic parser SET. 2012. URL info
    @misc{1083242,
      author = {Kovář, Vojtěch and Jakubíček, Miloš and Horák, Aleš},
      title = {Syntactic parser SET},
      year = {2012},
      url = {http://nlp.fi.muni.cz/projects/set},
      institution = {Masarykova univerzita},
      organization = {Masarykova univerzita},
      language = {eng},
      keywords = {syntax;parser;syntactic analysis;pattern matching},
    }
  • HORÁK, Aleš, Miloš JAKUBÍČEK a Vojtěch KOVÁŘ. Analyzing Time-Related Clauses in Transparent Intensional Logic. In Aleš Horák, Pavel Rychlý. Proceedings of Recent Advances in Slavonic Natural Language Processing 2011. Brno: Tribun EU. s. 3-9. ISBN 978-80-263-0077-9. 2011. info
    @inproceedings{959105,
      author = {Horák, Aleš and Jakubíček, Miloš and Kovář, Vojtěch},
      title = {Analyzing Time-Related Clauses in Transparent Intensional Logic},
      booktitle = {Proceedings of Recent Advances in Slavonic Natural Language Processing 2011},
      editor = {Horák, Aleš and Rychlý, Pavel},
      pages = {3--9},
      publisher = {Tribun EU},
      address = {Brno},
      location = {Brno},
      year = {2011},
      isbn = {978-80-263-0077-9},
      howpublished = {tištěná verze "print"},
      language = {eng},
      keywords = {Transparent Intensional Logic;TIL;Normal Translation Algorithm;NTA;logical analysis;temporal analysis;time-related clauses},
    }
  • KOVÁŘ, Vojtěch, Aleš HORÁK a Miloš JAKUBÍČEK. Syntactic Analysis Using Finite Patterns: A New Parsing System for Czech. In Human Language Technology. Challenges for Computer Science and Linguistics. Berlin/Heidelberg: Springer. s. 161-171. ISBN 978-3-642-20094-6. 2011. URL info
    @inproceedings{932481,
      author = {Kovář, Vojtěch and Horák, Aleš and Jakubíček, Miloš},
      title = {Syntactic Analysis Using Finite Patterns: A New Parsing System for Czech},
      booktitle = {Human Language Technology. Challenges for Computer Science and Linguistics},
      pages = {161--171},
      publisher = {Springer},
      address = {Berlin/Heidelberg},
      location = {Berlin/Heidelberg},
      year = {2011},
      isbn = {978-3-642-20094-6},
      doi = {10.1007/978-3-642-20095-3_15},
      url = {http://dx.doi.org/10.1007/978-3-642-20095-3_15},
      howpublished = {tištěná verze "print"},
      language = {eng},
      keywords = {syntactic analysis; free-word-order languages; an alternative approach; natural language processing},
    }
  • KOVÁŘ, Vojtěch, Aleš HORÁK a Miloš JAKUBÍČEK. How to Analyze Natural Language with Transparent Intensional Logic? In Proceedings of Recent Advances in Slavonic Natural Language Processing 2010. Brno: Masaryk University. s. 69-76. ISBN 978-80-7399-246-0. 2010. info
    @inproceedings{914266,
      author = {Kovář, Vojtěch and Horák, Aleš and Jakubíček, Miloš},
      title = {How to Analyze Natural Language with Transparent Intensional Logic?},
      booktitle = {Proceedings of Recent Advances in Slavonic Natural Language Processing 2010},
      pages = {69--76},
      publisher = {Masaryk University},
      address = {Brno},
      location = {Brno},
      year = {2010},
      isbn = {978-80-7399-246-0},
      howpublished = {tištěná verze "print"},
      language = {eng},
      keywords = {TIL;transparent intensional logic;syntactic analysis;valency frames;logic},
    }
  • JAKUBÍČEK, Miloš a Aleš HORÁK. Punctuation Detection with Full Syntactic Parsing. Research in Computing Science, Special issue: Natural Language Processing and its Applications. Mexiko: Instituto Politécnico Nacional, roč. 46, March 2010, s. 335-343. ISSN 1870-4069. 2010. URL info
    @article{876509,
      author = {Jakubíček, Miloš and Horák, Aleš},
      title = {Punctuation Detection with Full Syntactic Parsing},
      journal = {Research in Computing Science, Special issue: Natural Language Processing and its Applications},
      volume = {46},
      pages = {335--343},
      year = {2010},
      issn = {1870-4069},
      url = {http://www.cicling.org/2010/Vol46.pdf},
      language = {eng},
      keywords = {punctuation; grammar checking; parsing; syntactic analysis},
      article_location = {Mexiko},
      article_number = {March 2010},
    }
  • JAKUBÍČEK, Miloš, Vojtěch KOVÁŘ a Aleš HORÁK. Measuring Coverage of a Valency Lexicon using Full Syntactic Analysis. In RASLAN 2009 : Recent Advances in Slavonic Natural Language Processing. 1. vyd. Brno: Masaryk University. s. 75-79. ISBN 978-80-210-5048-8. 2009. URL info
    @inproceedings{866435,
      author = {Jakubíček, Miloš and Kovář, Vojtěch and Horák, Aleš},
      title = {Measuring Coverage of a Valency Lexicon using Full Syntactic Analysis},
      booktitle = {RASLAN 2009 : Recent Advances in Slavonic Natural Language Processing},
      edition = {1},
      pages = {75--79},
      publisher = {Masaryk University},
      address = {Brno},
      location = {Brno},
      year = {2009},
      isbn = {978-80-210-5048-8},
      url = {http://nlp.fi.muni.cz/raslan/2009/},
      language = {eng},
      keywords = {verb valency; valency lexicon; parsing; syntactic analysis},
    }
  • JAKUBÍČEK, Miloš, Aleš HORÁK a Vojtěch KOVÁŘ. Mining Phrases from Syntactic Analysis. In Text, Speech, Dialogue 2009. 1. vyd. Berlin Heidelberg: Springer Verlag. s. 124-130. ISBN 978-3-642-04207-2. doi:10.1007/978-3-642-04208-9_20. 2009. URL info
    @inproceedings{847718,
      author = {Jakubíček, Miloš and Horák, Aleš and Kovář, Vojtěch},
      title = {Mining Phrases from Syntactic Analysis},
      booktitle = {Text, Speech, Dialogue 2009},
      edition = {1},
      pages = {124--130},
      publisher = {Springer Verlag},
      address = {Berlin Heidelberg},
      location = {Berlin Heidelberg},
      year = {2009},
      isbn = {978-3-642-04207-2},
      doi = {10.1007/978-3-642-04208-9_20},
      url = {http://www.springerlink.com/content/p153184279t56250/},
      howpublished = {tištěná verze "print"},
      language = {eng},
      keywords = {parsing; syntactic structures; mining phrases},
    }
  • KOVÁŘ, Vojtěch, Aleš HORÁK a Miloš JAKUBÍČEK. Syntactic Analysis as Pattern Matching: The SET Parsing System. In Proceedings of 4th Language & Technology Conference. Poznań (Poland): Wydawnictwo Poznańskie. s. 100-104. ISBN 978-83-7177-746-2. 2009. info
    @inproceedings{855311,
      author = {Kovář, Vojtěch and Horák, Aleš and Jakubíček, Miloš},
      title = {Syntactic Analysis as Pattern Matching: The SET Parsing System},
      booktitle = {Proceedings of 4th Language \& Technology Conference},
      pages = {100--104},
      publisher = {Wydawnictwo Poznańskie},
      address = {Poznań (Poland)},
      location = {Poznań (Poland)},
      year = {2009},
      isbn = {978-83-7177-746-2},
      language = {eng},
      keywords = {syntactic analysis;pattern matching;SET},
    }
  • KOVÁŘ, Vojtěch, Aleš HORÁK a Vladimír KADLEC. New Methods for Pruning and Ordering of Syntax Parsing Trees. In Proceedings of Text, Speech and Dialogue 2008. Berlin, Heidelberg: Springer. s. 125-131. ISBN 978-3-540-87390-7. 2008. info
    @inproceedings{789416,
      author = {Kovář, Vojtěch and Horák, Aleš and Kadlec, Vladimír},
      title = {New Methods for Pruning and Ordering of Syntax Parsing Trees},
      booktitle = {Proceedings of Text, Speech and Dialogue 2008},
      pages = {125--131},
      publisher = {Springer},
      address = {Berlin, Heidelberg},
      location = {Berlin, Heidelberg},
      year = {2008},
      isbn = {978-3-540-87390-7},
      language = {eng},
      keywords = {syntactic analysis; parsing; natural language processing},
    }
  • KOVÁŘ, Vojtěch, Aleš HORÁK a Miloš JAKUBÍČEK. Power Networks Dialogs - Enhancing Domain-Specific Text Processing Techniques and Resources. In Proceedings of ELNET 2008. Ostrava: Faculty of Electrical Engineering and Computer Science, VŠB - Technical University of Ostrava. s. 72-80. ISBN 978-80-248-1875-7. 2008. info
    @inproceedings{806006,
      author = {Kovář, Vojtěch and Horák, Aleš and Jakubíček, Miloš},
      title = {Power Networks Dialogs - Enhancing Domain-Specific Text Processing Techniques and Resources},
      booktitle = {Proceedings of ELNET 2008},
      pages = {72--80},
      publisher = {Faculty of Electrical Engineering and Computer Science, VŠB - Technical University of Ostrava},
      address = {Ostrava},
      location = {Ostrava},
      year = {2008},
      isbn = {978-80-248-1875-7},
      language = {eng},
      keywords = {electrical power networks;czech domain-specific resources;syntax analysis;text corpora},
    }
  • KOVÁŘ, Vojtěch a Aleš HORÁK. Power Networks Dialogues - Automatic Analysis and Evaluation of a Domain-Specific Text Corpus. In Proceedings of ELNET 2007. Ostrava: Faculty of Electrical Engineering and Computer Science, VŠB - Technical University of Ostrava. s. 30-37. ISBN 978-80-248-1681-4. 2007. info
    @inproceedings{746344,
      author = {Kovář, Vojtěch and Horák, Aleš},
      title = {Power Networks Dialogues - Automatic Analysis and Evaluation of a Domain-Specific Text Corpus},
      booktitle = {Proceedings of ELNET 2007},
      pages = {30--37},
      publisher = {Faculty of Electrical Engineering and Computer Science, VŠB - Technical University of Ostrava},
      address = {Ostrava},
      location = {Ostrava},
      year = {2007},
      isbn = {978-80-248-1681-4},
      language = {eng},
      keywords = {power network; corpus; dialogue; domain-specific; synt; syntactic analysis},
    }
  • KOVÁŘ, Vojtěch a Aleš HORÁK. Reducing the Number of Resulting Parsing Trees for the Czech Language Using the Beautified Chart Method. In Proceedings of 3rd Language and Technology Conference. Poznań: Wydawnictwo Poznańskie. s. 433-437. ISBN 978-83-7177-407-2. 2007. info
    @inproceedings{746082,
      author = {Kovář, Vojtěch and Horák, Aleš},
      title = {Reducing the Number of Resulting Parsing Trees for the Czech Language Using the Beautified Chart Method},
      booktitle = {Proceedings of 3rd Language and Technology Conference},
      pages = {433--437},
      publisher = {Wydawnictwo Poznańskie},
      address = {Poznań},
      location = {Poznań},
      year = {2007},
      isbn = {978-83-7177-407-2},
      language = {eng},
      keywords = {syntactic analysis; parser; chart; forest of values; beautified chart},
    }
  • KOVÁŘ, Vojtěch, Vladimír KADLEC a Aleš HORÁK. Grammar Development for Czech Syntactic Parser with Corpus-based Techniques. In Proceedings of Corpus Linguistic 2006. Saint-Petersburg: Saint-Petersburg State University. s. 159-165. ISBN 5-288-04181-4. 2006. info
    @inproceedings{707744,
      author = {Kovář, Vojtěch and Kadlec, Vladimír and Horák, Aleš},
      title = {Grammar Development for Czech Syntactic Parser with Corpus-based Techniques},
      booktitle = {Proceedings of Corpus Linguistic 2006},
      pages = {159--165},
      publisher = {Saint-Petersburg State University},
      address = {Saint-Petersburg},
      location = {Saint-Petersburg},
      year = {2006},
      isbn = {5-288-04181-4},
      language = {eng},
      keywords = {parsing; grammar; czech; corpus},
    }
  • ŠMERK, Pavel, Vít HOTÁREK a Pavel RYCHLÝ. WWWAjka. 2010. URL info
    @misc{935737,
      author = {Šmerk, Pavel and Hotárek, Vít and Rychlý, Pavel},
      title = {WWWAjka},
      year = {2010},
      url = {http://nlp.fi.muni.cz/projekty/wwwajka},
      institution = {Masarykova univerzita},
      organization = {Masarykova univerzita},
      language = {cze},
      keywords = {morphological analysis},
    }
  • SRDANOVIĆ, Irena, Naomi IDA, Chikako SHIGEMORI BUČAR, Adam KILGARRIFF a Vojtěch KOVÁŘ. Japanese Word Sketches: Advances and Problems. Acta Linguistica Asiatica. Ljubljana: University of Ljubljana, roč. 1/2011, č. 2, s. 63-82. ISSN 2232-3317. 2011. URL info
    @article{954282,
      author = {Srdanović, Irena and Ida, Naomi and Shigemori Bučar, Chikako and Kilgarriff, Adam and Kovář, Vojtěch},
      title = {Japanese Word Sketches: Advances and Problems},
      journal = {Acta Linguistica Asiatica},
      volume = {1},
      number = {2},
      pages = {63--82},
      year = {2011},
      issn = {2232-3317},
      url = {http://revije.ff.uni-lj.si/ala/article/view/38},
      language = {eng},
      keywords = {word sketches;evaluation;japanese},
      article_location = {Ljubljana},
    }
  • INUMELLA, Abhilash, Adam KILGARRIFF a Vojtěch KOVÁŘ. Associating Collocations with Dictionary Senses. In Proceedings of 6th Biennial Conference of the Asian Association for Lexicography. 2009. URL info
    @inproceedings{873881,
      author = {Inumella, Abhilash and Kilgarriff, Adam and Kovář, Vojtěch},
      title = {Associating Collocations with Dictionary Senses},
      booktitle = {Proceedings of 6th Biennial Conference of the Asian Association for Lexicography},
      year = {2009},
      url = {http://nlp.fi.muni.cz/publications/asialex2009_yabhil_kilgarriff_xkovar3/AbhilashKilgKovar_30jun09.pdf},
      language = {eng},
      keywords = {collocation;collocations;dictionary;sense;dictionary sense},
    }
  • JAKUBÍČEK, Miloš, Pavel RYCHLÝ a Adam KILGARRIFF. Effective Corpus Virtualization. In Marc Kupietz, Hanno Biber, Harald Lüngen, Piotr Bański, Evelyn Breiteneder, Karlheinz Mörth, Andreas Witt, Jani Takhsha. Challenges in the Management of Large Corpora (CMLC-2). Reykjavik: European Language Resources Association (ELRA). s. 7-9. ISBN 978-2-9517408-8-4. 2014. URL info
    @inproceedings{1186171,
      author = {Jakubíček, Miloš and Rychlý, Pavel and Kilgarriff, Adam},
      title = {Effective Corpus Virtualization},
      booktitle = {Challenges in the Management of Large Corpora (CMLC-2)},
      editor = {Kupietz, Marc and Biber, Hanno and Lüngen, Harald and Bański, Piotr and Breiteneder, Evelyn and Mörth, Karlheinz and Witt, Andreas and Takhsha, Jani},
      pages = {7--9},
      publisher = {European Language Resources Association (ELRA)},
      address = {Reykjavik},
      location = {Reykjavik},
      year = {2014},
      isbn = {978-2-9517408-8-4},
      url = {http://corpora.ids-mannheim.de/cmlc.html},
      howpublished = {elektronická verze "online"},
      language = {eng},
      keywords = {corpus; corpus linguistics; virtualization; indexing; database},
    }
  • KILGARRIFF, Adam, Miloš JAKUBÍČEK, Vojtěch KOVÁŘ, Pavel RYCHLÝ a Vít SUCHOMEL. Finding Terms in Corpora for Many Languages with the Sketch Engine. In Proceedings of the Demonstrations at the 14th Conference of the European Chapter of the Association for Computational Linguistics. Gothenburg, Sweden: The Association for Computational Linguistics. s. 53-56. ISBN 978-1-937284-75-6. 2014. Plný text výsledku info
    @inproceedings{1181590,
      author = {Kilgarriff, Adam and Jakubíček, Miloš and Kovář, Vojtěch and Rychlý, Pavel and Suchomel, Vít},
      title = {Finding Terms in Corpora for Many Languages with the Sketch Engine},
      booktitle = {Proceedings of the Demonstrations at the 14th Conference of the European Chapter of the Association for Computational Linguistics},
      pages = {53--56},
      publisher = {The Association for Computational Linguistics},
      address = {Gothenburg, Sweden},
      location = {Gothenburg, Sweden},
      year = {2014},
      isbn = {978-1-937284-75-6},
      url = {http://aclweb.org/anthology/E/E14/E14-2014.pdf},
      howpublished = {elektronická verze "online"},
      language = {eng},
      keywords = {terminology; terms; corpora; sketch engine},
    }
  • KOVÁŘ, Vojtěch, Pavel RYCHLÝ a Miloš JAKUBÍČEK. Low Inter-Annotator Agreement = An Ill-Defined Problem? In Eighth Workshop on Recent Advances in Slavonic Natural Language Processing. Brno: Tribun EU. s. 57-62. ISSN 2336-4289. 2014. URL info
    @inproceedings{1210696,
      author = {Kovář, Vojtěch and Rychlý, Pavel and Jakubíček, Miloš},
      title = {Low Inter-Annotator Agreement = An Ill-Defined Problem?},
      booktitle = {Eighth Workshop on Recent Advances in Slavonic Natural Language Processing},
      pages = {57--62},
      publisher = {Tribun EU},
      address = {Brno},
      location = {Brno},
      year = {2014},
      url = {https://nlp.fi.muni.cz/raslan/2014/13.pdf},
      howpublished = {tištěná verze "print"},
      language = {eng},
      keywords = {NLP; inter-annotator agreement; low inter-annotator agreement; evaluation},
    }
  • JAKUBÍČEK, Miloš a Pavel RYCHLÝ. Optimization of Regular Expression Evaluation within the Manatee Corpus Management System. In Eighth Workshop on Recent Advances in Slavonic Natural Language Processing. Brno: Tribun EU. s. 37-48. ISSN 2336-4289. 2014. info
    @inproceedings{1210693,
      author = {Jakubíček, Miloš and Rychlý, Pavel},
      title = {Optimization of Regular Expression Evaluation within the Manatee Corpus Management System},
      booktitle = {Eighth Workshop on Recent Advances in Slavonic Natural Language Processing},
      pages = {37--48},
      publisher = {Tribun EU},
      address = {Brno},
      location = {Brno},
      year = {2014},
      howpublished = {tištěná verze "print"},
      language = {eng},
      keywords = {text corpus; regular expression; Manatee},
    }
  • KILGARRIFF, Adam, Miloš JAKUBÍČEK, Jan POMIKÁLEK, Tony Berber SARDINHA a Pete WHITELOCK. PtTenTen: A corpus for Portuguese lexicography. In Tony Berber Sardinha, Telma de Lurdes São Bento Ferreira. Working with Portuguese Corpora. 1. vyd. London: Bloomsbury Publishing. s. 280-287. Bloomsbury Academic. ISBN 978-1-4411-9050-5. 2014. URL info
    @incollection{1173363,
      author = {Kilgarriff, Adam and Jakubíček, Miloš and Pomikálek, Jan and Sardinha, Tony Berber and Whitelock, Pete},
      title = {PtTenTen: A corpus for Portuguese lexicography},
      booktitle = {Working with Portuguese Corpora},
      editor = {Sardinha, Tony Berber and Ferreira, Telma de Lurdes São Bento},
      edition = {1},
      pages = {280--287},
      publisher = {Bloomsbury Publishing},
      address = {London},
      location = {London},
      year = {2014},
      isbn = {978-1-4411-9050-5},
      url = {http://www.bloomsbury.com/uk/working-with-portuguese-corpora-9781441190505/},
      howpublished = {tištěná verze "print"},
      language = {eng},
      keywords = {pttenten; portuguese; lexicography; corpus; corpora},
    }
  • JAKUBÍČEK, Miloš a Vojtěch KOVÁŘ. Enhancing Czech Parsing with Verb Valency Frames. In CICLing 2013. Greece: Springer Verlag. s. 282-293. ISBN 978-3-642-37246-9. doi:10.1007/978-3-642-37247-6_23. 2013. info
    @inproceedings{1081576,
      author = {Jakubíček, Miloš and Kovář, Vojtěch},
      address = {Greece},
      booktitle = {CICLing 2013},
      doi = {10.1007/978-3-642-37247-6_23},
      keywords = {parsing; syntactic analysis; verb valencies; valency frames; Czech},
      howpublished = {tištěná verze "print"},
      language = {eng},
      location = {Greece},
      isbn = {978-3-642-37246-9},
      pages = {282--293},
      publisher = {Springer Verlag},
      title = {Enhancing {Czech} Parsing with Verb Valency Frames},
      year = {2013}
    }
  • JAKUBÍČEK, Miloš, Pavel ŠMERK a Pavel RYCHLÝ. Fast Construction of a Word-Number Index for Large Data. In A. Horák, P. Rychlý. RASLAN 2013 Recent Advances in Slavonic Natural Language Processing. Brno: Tribun EU. s. 63-67. ISBN 978-80-263-0520-0. 2013. URL info
    @inproceedings{1131334,
      author = {Jakubíček, Miloš and Šmerk, Pavel and Rychlý, Pavel},
      address = {Brno},
      booktitle = {RASLAN 2013 Recent Advances in Slavonic Natural Language Processing},
      editor = {Horák, A. and Rychlý, P.},
      keywords = {word to number index; number to word index; finite state automata; hat-trie},
      howpublished = {tištěná verze "print"},
      language = {eng},
      location = {Brno},
      isbn = {978-80-263-0520-0},
      pages = {63--67},
      publisher = {Tribun EU},
      title = {Fast Construction of a Word-Number Index for Large Data},
      url = {https://nlp.fi.muni.cz/raslan/2013/paper10.pdf},
      year = {2013}
    }
  • JAKUBÍČEK, Miloš a Marek MEDVEĎ. Portable Lexical Analysis for Parsing of Morphologically-Rich Languages. In A. Horák, P. Rychlý. RASLAN 2013 Recent Advances in Slavonic Natural Language Processing. Brno: Tribun EU. s. 21-26. ISBN 978-80-263-0520-0. 2013. info
    @inproceedings{1131336,
      author = {Jakubíček, Miloš and Medveď, Marek},
      address = {Brno},
      booktitle = {RASLAN 2013 Recent Advances in Slavonic Natural Language Processing},
      editor = {Horák, A. and Rychlý, P.},
      keywords = {lexical analysis; synt parser},
      howpublished = {tištěná verze "print"},
      language = {eng},
      location = {Brno},
      isbn = {978-80-263-0520-0},
      pages = {21--26},
      publisher = {Tribun EU},
      title = {Portable Lexical Analysis for Parsing of Morphologically-Rich Languages},
      year = {2013}
    }
  • MEDVEĎ, Marek, Miloš JAKUBÍČEK a Vojtěch KOVÁŘ. Towards taggers and parsers for Slovak. In Zygmunt Vetulani & Hans Uszkoreit. Human Language Technologies as a Challenge for Computer Science and Linguistics. Proceedings of the 6th Language and Technology Conference. Poznań, Poland: Fundacja Uniwersytetu im. A. Mickiewicza. s. 527-530. ISBN 978-83-932640-3-2. 2013. LTC website info
    @inproceedings{1131339,
      author = {Medveď, Marek and Jakubíček, Miloš and Kovář, Vojtěch},
      address = {Poznań, Poland},
      booktitle = {Human Language Technologies as a Challenge for Computer Science and Linguistics. Proceedings of the 6th Language and Technology Conference},
      editor = {Vetulani, Zygmunt and Uszkoreit, Hans},
      keywords = {Slovak; parsing; tagging; parser adaptation},
      howpublished = {tištěná verze "print"},
      language = {eng},
      location = {Poznań, Poland},
      isbn = {978-83-932640-3-2},
      pages = {527--530},
      publisher = {Fundacja Uniwersytetu im. A. Mickiewicza},
      title = {Towards taggers and parsers for {Slovak}},
      url = {http://www.ltc.amu.edu.pl},
      year = {2013}
    }
  • MEDVEĎ, Marek, Miloš JAKUBÍČEK, Vojtěch KOVÁŘ a Václav NĚMČÍK. Adaptation of Czech Parsers for Slovak. In Aleš Horák, Pavel Rychlý. RASLAN 2012 Recent Advances in Slavonic Natural Language Processing. Brno, Czech Republic: Tribun EU. s. 23-30. ISBN 978-80-263-0313-8. 2012. URL info
    @inproceedings{1079840,
      author = {Medveď, Marek and Jakubíček, Miloš and Kovář, Vojtěch and Němčík, Václav},
      address = {Brno, Czech Republic},
      booktitle = {RASLAN 2012 Recent Advances in Slavonic Natural Language Processing},
      editor = {Horák, Aleš and Rychlý, Pavel},
      keywords = {syntactic analysis; parsing; Slovak},
      howpublished = {tištěná verze "print"},
      language = {eng},
      location = {Brno, Czech Republic},
      isbn = {978-80-263-0313-8},
      pages = {23--30},
      publisher = {Tribun EU},
      title = {Adaptation of {Czech} Parsers for {Slovak}},
      url = {https://nlp.fi.muni.cz/raslan/2012/paper16.pdf},
      year = {2012}
    }
  • POMIKÁLEK, Jan, Pavel RYCHLÝ a Miloš JAKUBÍČEK. Building a 70 billion word corpus of English from ClueWeb. In Nicoletta Calzolari (Conference Chair) and Khalid Choukri and Thierry Declerck and Mehmet Ugur Dogan and Bente Maegaard and Joseph Mariani and Jan Odijk and Stelios Piperidis. Proceedings of the Eight International Conference on Language Resources and Evaluation (LREC'12). Istanbul, Turkey: European Language Resources Association (ELRA). s. 502-506. ISBN 978-2-9517408-7-7. 2012. URL info
    @inproceedings{991165,
      author = {Pomikálek, Jan and Rychlý, Pavel and Jakubíček, Miloš},
      address = {Istanbul, Turkey},
      booktitle = {Proceedings of the Eight International Conference on Language Resources and Evaluation (LREC'12)},
      editor = {Calzolari, Nicoletta and Choukri, Khalid and Declerck, Thierry and Dogan, Mehmet Ugur and Maegaard, Bente and Mariani, Joseph and Odijk, Jan and Piperidis, Stelios},
      keywords = {corpus; clueweb; English; encoding; word sketch},
      howpublished = {tištěná verze "print"},
      language = {eng},
      location = {Istanbul, Turkey},
      isbn = {978-2-9517408-7-7},
      pages = {502--506},
      publisher = {European Language Resources Association (ELRA)},
      title = {Building a 70 billion word corpus of {English} from {ClueWeb}},
      url = {http://nlp.fi.muni.cz/publications/lrec2012_xpomikal_pary_xjakub/lrec2012.pdf},
      year = {2012}
    }
  • KILGARRIFF, Adam, Jan POMIKÁLEK, Miloš JAKUBÍČEK a Pete WHITELOCK. Setting up for corpus lexicography. In Ruth Vatvedt Fjeld and Julie Matilde Torjusen. Proceedings of the 15th EURALEX International Congress. Oslo, Norway: Department of Linguistics and Scandinavian Studies, University of Oslo. s. 606-612. ISBN 978-82-303-2228-4. 2012. URL info
    @inproceedings{991176,
      author = {Kilgarriff, Adam and Pomikálek, Jan and Jakubíček, Miloš and Whitelock, Pete},
      address = {Oslo, Norway},
      booktitle = {Proceedings of the 15th EURALEX International Congress},
      editor = {Fjeld, Ruth Vatvedt and Torjusen, Julie Matilde},
      keywords = {corpora; corpus lexicography; web crawling; dependency parsing},
      howpublished = {tištěná verze "print"},
      language = {eng},
      location = {Oslo, Norway},
      isbn = {978-82-303-2228-4},
      pages = {606--612},
      publisher = {Department of Linguistics and Scandinavian Studies, University of Oslo},
      title = {Setting up for corpus lexicography},
      url = {http://trac.sketchengine.co.uk/attachment/wiki/AK/Papers/pt_31may2012.doc?format=raw},
      year = {2012}
    }
  • JAKUBÍČEK, Miloš, Vojtěch KOVÁŘ a Pavel ŠMERK. Czech Morphological Tagset Revisited. In Horák, Rychlý. Proceedings of Recent Advances in Slavonic Natural Language Processing 2011. Brno: Tribun EU. s. 29-42. ISBN 978-80-263-0077-9. 2011. URL info
    @inproceedings{959110,
      author = {Jakubíček, Miloš and Kovář, Vojtěch and Šmerk, Pavel},
      address = {Brno},
      booktitle = {Proceedings of Recent Advances in Slavonic Natural Language Processing 2011},
      editor = {Horák, Aleš and Rychlý, Pavel},
      keywords = {morphology;tag;tagset;annotation;Czech},
      howpublished = {tištěná verze "print"},
      language = {eng},
      location = {Brno},
      isbn = {978-80-263-0077-9},
      pages = {29--42},
      publisher = {Tribun EU},
      title = {Czech Morphological Tagset Revisited},
      url = {https://nlp.fi.muni.cz/raslan/2011/paper05.pdf},
      year = {2011}
    }
  • JAKUBÍČEK, Miloš. Effective Parsing Using Competing CFG Rules. In Habernal, Matoušek. Proceedings of Text, Speech and Dialogue 2011. Berlin, Heidelberg: Springer Verlag. s. 115-122. ISBN 978-3-642-23537-5. 2011. URL info
    @inproceedings{949222,
      author = {Jakubíček, Miloš},
      address = {Berlin, Heidelberg},
      booktitle = {Proceedings of Text, Speech and Dialogue 2011},
      editor = {Habernal and Matoušek},
      keywords = {parsing; syntactic analysis; CFG; competing rule},
      language = {eng},
      location = {Berlin, Heidelberg},
      isbn = {978-3-642-23537-5},
      pages = {115--122},
      publisher = {Springer Verlag},
      title = {Effective Parsing Using Competing {CFG} Rules},
      url = {http://www.kiv.zcu.cz/tsd2011/},
      year = {2011}
    }
  • JAKUBÍČEK, Miloš a Vojtěch KOVÁŘ. CzechParl: Corpus of Stenographic Protocols from Czech Parliament. In Proceedings of Recent Advances in Slavonic Natural Language Processing 2010. Brno: Masaryk University. s. 41-46. ISBN 978-80-7399-246-0. 2010. info
    @inproceedings{914268,
      author = {Jakubíček, Miloš and Kovář, Vojtěch},
      address = {Brno},
      booktitle = {Proceedings of Recent Advances in Slavonic Natural Language Processing 2010},
      keywords = {corpus;corpora;parliament;stenographic protocol},
      language = {eng},
      location = {Brno},
      isbn = {978-80-7399-246-0},
      pages = {41--46},
      publisher = {Masaryk University},
      title = {{CzechParl}: Corpus of Stenographic Protocols from {Czech} {Parliament}},
      year = {2010}
    }
  • JAKUBÍČEK, Miloš, Pavel RYCHLÝ, Adam KILGARRIFF a Diana MCCARTHY. Fast syntactic searching in very large corpora for many languages. In PACLIC 24 Proceedings of the 24th Pacific Asia Conference on Language, Information and Computation. Tokyo: Waseda University. s. 741-747. ISBN 978-4-905166-00-9. 2010. info
    @inproceedings{908008,
      author = {Jakubíček, Miloš and Rychlý, Pavel and Kilgarriff, Adam and McCarthy, Diana},
      address = {Tokyo},
      booktitle = {PACLIC 24 Proceedings of the 24th Pacific Asia Conference on Language, Information and Computation},
      keywords = {corpus search; large corpora; CQL; syntactic search},
      language = {eng},
      location = {Tokyo},
      isbn = {978-4-905166-00-9},
      pages = {741--747},
      publisher = {Waseda University},
      title = {Fast syntactic searching in very large corpora for many languages},
      year = {2010}
    }
  • KOVÁŘ, Vojtěch a Miloš JAKUBÍČEK. Prague Dependency Treebank Annotation Errors: A Preliminary Analysis. In RASLAN 2009 : Recent Advances in Slavonic Natural Language Processing. 1. vyd. Brno: Masaryk University. s. 101-108. ISBN 978-80-210-5048-8. 2009. URL info
    @inproceedings{866437,
      author = {Kovář, Vojtěch and Jakubíček, Miloš},
      address = {Brno},
      booktitle = {RASLAN 2009 : Recent Advances in Slavonic Natural Language Processing},
      edition = {1},
      keywords = {error in text; annotation; Prague Dependency Treebank; PDT},
      language = {eng},
      location = {Brno},
      isbn = {978-80-210-5048-8},
      pages = {101--108},
      publisher = {Masaryk University},
      title = {{Prague} {Dependency} {Treebank} Annotation Errors: A Preliminary Analysis},
      url = {http://nlp.fi.muni.cz/raslan/2009/},
      year = {2009}
    }
  • JAKUBÍČEK, Miloš. Extraction of Syntactic Structures Based on the Czech Parser Synt. In Proceedings of Recent Advances in Slavonic Natural Language Processing 2008. Brno: Masaryk University. s. 56-62. ISBN 978-80-210-4741-9. 2008. URL info
    @inproceedings{806050,
      author = {Jakubíček, Miloš},
      address = {Brno},
      booktitle = {Proceedings of Recent Advances in Slavonic Natural Language Processing 2008},
      keywords = {synt;syntactic analysis;syntactic structures;parsing},
      language = {eng},
      location = {Brno},
      isbn = {978-80-210-4741-9},
      pages = {56--62},
      publisher = {Masaryk University},
      title = {Extraction of Syntactic Structures Based on the {Czech} Parser {Synt}},
      url = {http://nlp.fi.muni.cz/raslan/2008/papers/8.pdf},
      year = {2008}
    }
  • KOVÁŘ, Vojtěch a Miloš JAKUBÍČEK. Test Suite for the Czech Parser Synt. In Proceedings of Recent Advances in Slavonic Natural Language Processing 2008. Brno: Masaryk University. s. 63-70. ISBN 978-80-210-4741-9. 2008. URL info
    @inproceedings{806003,
      author = {Kovář, Vojtěch and Jakubíček, Miloš},
      address = {Brno},
      booktitle = {Proceedings of Recent Advances in Slavonic Natural Language Processing 2008},
      keywords = {synt;syntactic analysis;parsing;test suite;brno phrasal treebank},
      language = {eng},
      location = {Brno},
      isbn = {978-80-210-4741-9},
      pages = {63--70},
      publisher = {Masaryk University},
      title = {Test Suite for the {Czech} Parser {Synt}},
      url = {http://nlp.fi.muni.cz/raslan/2008/papers/9.pdf},
      year = {2008}
    }
  • KILGARRIFF, Adam, Vojtěch KOVÁŘ, Simon KREK, Irena SRDANOVIĆ a Carole TIBERIUS. A Quantitative Evaluation of Word Sketches. In Proceedings of the XIV Euralex International Congress. Leeuwarden: Fryske Academy. 7 s. ISBN 978-90-6273-840-3. 2010. URL info
    @inproceedings{900029,
      author = {Kilgarriff, Adam and Kovář, Vojtěch and Krek, Simon and Srdanović, Irena and Tiberius, Carole},
      title = {A Quantitative Evaluation of Word Sketches},
      booktitle = {Proceedings of the XIV Euralex International Congress},
      year = {2010},
      publisher = {Fryske Academy},
      address = {Leeuwarden},
      location = {Leeuwarden},
      isbn = {978-90-6273-840-3},
      language = {eng},
      keywords = {word sketches evaluation},
      url = {http://nlp.fi.muni.cz/publications/kilgarriff_xkovar3_etal/kilgarriff_xkovar3_etal.pdf}
    }
  • KILGARRIFF, Adam, Vojtěch KOVÁŘ a Pavel RYCHLÝ. Tickbox Lexicography. In Sylviane Granger, Magali Paquot. eLexicography in the 21st century: New challenges, new applications. Brussels: Presses universitaires de Louvain. s. 411-418. ISBN 2-87463-211-2. 2010. URL info
    @inproceedings{934177,
      author = {Kilgarriff, Adam and Kovář, Vojtěch and Rychlý, Pavel},
      address = {Brussels},
      booktitle = {eLexicography in the 21st century: New challenges, new applications},
      editor = {Granger, Sylviane and Paquot, Magali},
      keywords = {corpus lexicography; dictionary editing},
      language = {eng},
      location = {Brussels},
      isbn = {2-87463-211-2},
      pages = {411--418},
      publisher = {Presses universitaires de Louvain},
      title = {Tickbox Lexicography},
      url = {http://www.i6doc.com/en/livre/?GCOI=28001100345140},
      year = {2010}
    }
  • KOVÁŘ, Vojtěch. Partial Grammar Checking for Czech Using the SET Parser. In 17th International Conference, TSD 2014. prvni. Berlin Heidelberg: Springer Verlag. s. 308-314. ISBN 978-3-319-10815-5. doi:10.1007/978-3-319-10816-2_38. 2014. info
    @inproceedings{1211584,
      author = {Kovář, Vojtěch},
      address = {Berlin Heidelberg},
      booktitle = {17th International Conference, TSD 2014},
      doi = {10.1007/978-3-319-10816-2_38},
      edition = {1},
      keywords = {parser; SET; Czech; grammar checking; punctuation detection; syntactic analysis},
      howpublished = {tištěná verze "print"},
      language = {eng},
      location = {Berlin Heidelberg},
      isbn = {978-3-319-10815-5},
      pages = {308--314},
      publisher = {Springer Verlag},
      title = {Partial Grammar Checking for {Czech} Using the {SET} Parser},
      year = {2014}
    }
  • RYGL, Jan, Kristýna ZEMKOVÁ a Vojtěch KOVÁŘ. Authorship Verification based on Syntax Features. In Aleš Horák, Pavel Rychlý. Proceedings of the Sixth Workshop on Recent Advances in Slavonic Natural Language Processing, RASLAN 2012. 1st ed. Brno (Czech Republic): Tribun EU. s. 111-119. ISBN 978-80-263-0313-8. 2012. paper conference page info
    @inproceedings{1077977,
      author = {Rygl, Jan and Zemková, Kristýna and Kovář, Vojtěch},
      address = {Brno (Czech Republic)},
      booktitle = {Proceedings of the Sixth Workshop on Recent Advances in Slavonic Natural Language Processing, RASLAN 2012},
      edition = {1},
      editor = {Horák, Aleš and Rychlý, Pavel},
      keywords = {authorship verification;syntactic analysis;SET;machine learning},
      howpublished = {tištěná verze "print"},
      language = {eng},
      location = {Brno (Czech Republic)},
      isbn = {978-80-263-0313-8},
      pages = {111--119},
      publisher = {Tribun EU},
      title = {Authorship Verification based on Syntax Features},
      url = {https://nlp.fi.muni.cz/raslan/2012/paper06.pdf},
      year = {2012}
    }
  • KOVÁŘ, Vojtěch. Corpus Query System Bonito - Recent Development. In Proceedings of Recent Advances in Slavonic Natural Language Processing. Brno: Masaryk University. s. 71-76. ISBN 978-80-210-4471-5. 2007. URL info
    @inproceedings{746083,
      author = {Kovář, Vojtěch},
      address = {Brno},
      booktitle = {Proceedings of Recent Advances in Slavonic Natural Language Processing},
      keywords = {corpus; cqs; manatee; bonito; xml; localization},
      howpublished = {tištěná verze "print"},
      language = {eng},
      location = {Brno},
      isbn = {978-80-210-4471-5},
      pages = {71--76},
      publisher = {Masaryk University},
      title = {Corpus Query System {Bonito} - Recent Development},
      url = {https://nlp.fi.muni.cz/raslan/2007/papers/2.pdf},
      year = {2007}
    }
  • RYCHLÝ, Pavel a Vojtěch KOVÁŘ. Displaying Bidirectional Text Concordances in KWIC format. 2007. info
    @misc{746341,
      author = {Rychlý, Pavel and Kovář, Vojtěch},
      keywords = {bidirectional; KWIC; corpus},
      language = {eng},
      title = {Displaying Bidirectional Text Concordances in {KWIC} format},
      year = {2007}
    }
  • LINKOV, Václav, Pavel ŠMERK, Bingbing LI a David ŠMAHEL. Personality Perception in Instant Messenger Communication in the Czech Republic and People’s Republic of China. Studia psychologica : an international journal of research and theory in psychological sciences. roč. 56, č. 4, s. 287-300. ISSN 0039-3320. doi:10.21909/sp.2014.04.667. 2014. info
    @article{1215468,
      author = {Linkov, Václav and Šmerk, Pavel and Li, Bingbing and Šmahel, David},
      article_number = {4},
      doi = {10.21909/sp.2014.04.667},
      keywords = {personality perception accuracy; cues for personality perception; Big Five; social perception; computer mediated communication},
      language = {eng},
      issn = {0039-3320},
      journal = {Studia psychologica : an international journal of research and theory in psychological sciences},
      number = {4},
      pages = {287--300},
      title = {Personality Perception in Instant Messenger Communication in the {Czech Republic} and {People’s Republic of China}},
      volume = {56},
      year = {2014}
    }
  • LINKOV, Václav a Pavel ŠMERK. Rozdíly mezi pravdivou a lživou online textovou komunikací. Sociální studia. Brno: Fakulta sociálních studií MU Brno, roč. 6, č. 2, s. 73-95. ISSN 1214-813X. 2009. URL info
    @article{849797,
      author = {Linkov, Václav and Šmerk, Pavel},
      article_location = {Brno},
      article_number = {2},
      keywords = {computer-mediated communication; cues; deception detection; linguistic analysis},
      language = {cze},
      issn = {1214-813X},
      journal = {Sociální studia},
      number = {2},
      pages = {73--95},
      title = {Rozdíly mezi pravdivou a lživou online textovou komunikací},
      url = {http://socstudia.fss.muni.cz/Eng/index.php?ukol=1&clanek=290},
      volume = {6},
      year = {2009}
    }
  • RYGL, Jan a Marek MEDVEĎ. Style Markers Based on Stop-word List. In Eighth Workshop on Recent Advances in Slavonic Natural Language Processing. Brno: Tribun EU. s. 85-89. ISSN 2336-4289. 2014. paper info
    @inproceedings{1210701,
      author = {Rygl, Jan and Medveď, Marek},
      address = {Brno},
      booktitle = {Eighth Workshop on Recent Advances in Slavonic Natural Language Processing},
      keywords = {style marker; stop-word list; corpus},
      howpublished = {tištěná verze "print"},
      language = {eng},
      location = {Brno},
      issn = {2336-4289},
      pages = {85--89},
      publisher = {Tribun EU},
      title = {Style Markers Based on Stop-word List},
      url = {https://nlp.fi.muni.cz/raslan/2014/8.pdf},
      year = {2014}
    }
  • SUCHOMEL, Vít, Jan MICHELFEIT a Jan POMIKÁLEK. Text Tokenisation Using unitok. In Eighth Workshop on Recent Advances in Slavonic Natural Language Processing. Brno: Tribun EU. s. 71-75. ISSN 2336-4289. 2014. URL info
    @inproceedings{1210699,
      author = {Suchomel, Vít and Michelfeit, Jan and Pomikálek, Jan},
      address = {Brno},
      booktitle = {Eighth Workshop on Recent Advances in Slavonic Natural Language Processing},
      keywords = {tokenisation; corpus tool},
      howpublished = {tištěná verze "print"},
      language = {eng},
      location = {Brno},
      issn = {2336-4289},
      pages = {71--75},
      publisher = {Tribun EU},
      title = {Text Tokenisation Using unitok},
      url = {https://nlp.fi.muni.cz/raslan/2014/14.pdf},
      year = {2014}
    }
  • NEVĚŘILOVÁ, Zuzana a Vít SUCHOMEL. Intelligent Search and Replace for Czech Phrases. In Eighth Workshop on Recent Advances in Slavonic Natural Language Processing. Brno: Tribun EU. s. 97-105. ISSN 2336-4289. 2014. URL info
    @inproceedings{1210703,
      author = {Nevěřilová, Zuzana and Suchomel, Vít},
      address = {Brno},
      booktitle = {Eighth Workshop on Recent Advances in Slavonic Natural Language Processing},
      keywords = {search and replace; detecting phrases; generating phrases; subject-predicative complement},
      howpublished = {tištěná verze "print"},
      language = {eng},
      location = {Brno},
      issn = {2336-4289},
      pages = {97--105},
      publisher = {Tribun EU},
      title = {Intelligent Search and Replace for {Czech} Phrases},
      url = {https://nlp.fi.muni.cz/raslan/2014/16.pdf},
      year = {2014}
    }
  • PALA, Karel, Pavel RYCHLÝ a Pavel ŠMERK. Automatic Identification of Legal Terms in Czech Law Texts. In Semantic Processing of Legal Texts. Berlin: Springer. s. 83-94. ISBN 978-3-642-12836-3. doi:10.1007/978-3-642-12837-0_5. 2010. info
    @inproceedings{884809,
      author = {Pala, Karel and Rychlý, Pavel and Šmerk, Pavel},
      address = {Berlin},
      booktitle = {Semantic Processing of Legal Texts},
      doi = {10.1007/978-3-642-12837-0_5},
      keywords = {terminology extraction; natural language processing; legal language},
      howpublished = {tištěná verze "print"},
      language = {eng},
      location = {Berlin},
      isbn = {978-3-642-12836-3},
      pages = {83--94},
      publisher = {Springer},
      title = {Automatic Identification of Legal Terms in {Czech} Law Texts},
      year = {2010}
    }
  • RYCHLÝ, Pavel, Pavel ŠMERK a Karel PALA. DESAM – morfologicky označkovaný korpus českých textů. 2010. URL info
    @techreport{935754,
      author = {Rychlý, Pavel and Šmerk, Pavel and Pala, Karel},
      keywords = {morphology; annotation; Czech; lemmatization; grammatical tags},
      language = {cze},
      institution = {Masarykova univerzita},
      organization = {Masarykova univerzita},
      title = {{DESAM} – morfologicky označkovaný korpus českých textů},
      url = {http://nlp.fi.muni.cz/projects/desam},
      year = {2010}
    }
  • ŠMERK, Pavel, Karel PALA a Markéta PRAVDOVÁ. Internetová jazyková příručka. 2010. URL info
    @misc{935738,
      author = {Šmerk, Pavel and Pala, Karel and Pravdová, Markéta},
      title = {Internetová jazyková příručka},
      year = {2010},
      institution = {Masarykova univerzita},
      organization = {Masarykova univerzita},
      language = {cze},
      keywords = {internet language reference book; orthography; language norm; codification},
      url = {http://prirucka.ujc.cas.cz}
    }
  • PALA, Karel a Pavel ŠMERK. Multiword Expressions in Czech (a case study). In Aleš Bičan, Jan Klaška, Petra Macurová, Jana Zmrzlíková. Karlík a továrna na lingvistiku. Prof. Petru Karlíkovi k šedesátým narozeninám. Brno: Host. s. 331-344. ISBN 978-80-7294-412-5. 2010. info
    @inproceedings{913082,
      author = {Pala, Karel and Šmerk, Pavel},
      address = {Brno},
      booktitle = {Karlík a továrna na lingvistiku. Prof. Petru Karlíkovi k šedesátým narozeninám},
      editor = {Bičan, Aleš and Klaška, Jan and Macurová, Petra and Zmrzlíková, Jana},
      keywords = {Czech Multiword Expressions; Word Sketches; n-grams},
      language = {eng},
      location = {Brno},
      isbn = {978-80-7294-412-5},
      pages = {331--344},
      publisher = {Host},
      title = {Multiword Expressions in {Czech} (a case study)},
      year = {2010}
    }
  • PALA, Karel, Pavel RYCHLÝ a Pavel ŠMERK. Automatic Identification of Legal Terms in Czech Legal Texts. In Proceedings of the Workshop on Semantic processing of legal texts, LREC 2008. Marrakech, Morocco: European Language Resources Association (ELRA). s. 11-15. ISBN 2-9517408-4-0. 2008. URL info
    @inproceedings{770626,
      author = {Pala, Karel and Rychlý, Pavel and Šmerk, Pavel},
      address = {Marrakech, Morocco},
      booktitle = {Proceedings of the Workshop on Semantic processing of legal texts, LREC 2008},
      keywords = {legal texts; law terms; recognition; morphological and syntactic analysis},
      language = {eng},
      location = {Marrakech, Morocco},
      isbn = {2-9517408-4-0},
      pages = {11--15},
      publisher = {European Language Resources Association (ELRA)},
      title = {Automatic Identification of Legal Terms in {Czech} Legal Texts},
      url = {http://www.lrec-conf.org/proceedings/lrec2008/workshops/W9_Proceedings.pdf},
      year = {2008}
    }
  • PALA, Karel, Lukáš SVOBODA a Pavel ŠMERK. Czech MWE Database. In Proceedings of the Sixth International Language Resources and Evaluation Conference (LREC '08). Marrakech, Morocco: European Language Resources Association (ELRA). s. 1-5. ISBN 2-9517408-4-0. 2008. URL info
    @inproceedings{769845,
      author = {Pala, Karel and Svoboda, Lukáš and Šmerk, Pavel},
      address = {Marrakech, Morocco},
      booktitle = {Proceedings of the Sixth International Language Resources and Evaluation Conference (LREC '08)},
      keywords = {multiword expressions;word sketch engine},
      language = {eng},
      location = {Marrakech, Morocco},
      isbn = {2-9517408-4-0},
      pages = {1--5},
      publisher = {European Language Resources Association (ELRA)},
      title = {Czech {MWE} Database},
      url = {http://www.lrec-conf.org/proceedings/lrec2008/summaries/746.html},
      year = {2008}
    }
  • RYCHLÝ, Pavel, Pavel ŠMERK, Karel PALA a Radek SEDLÁČEK. Morphological Analyzer Ajka. 2008. URL info
    @techreport{836478,
      author = {Rychlý, Pavel and Šmerk, Pavel and Pala, Karel and Sedláček, Radek},
      keywords = {morphology; annotation; Czech; lemmatization; grammatical tags},
      language = {eng},
      institution = {NLPC FI MU},
      organization = {NLPC FI MU},
      title = {Morphological Analyzer {Ajka}},
      url = {http://nlp.fi.muni.cz/projects/ajka},
      year = {2008}
    }
  • PALA, Karel, Pavel RYCHLÝ a Pavel ŠMERK. Morphological Analysis of Law texts. In Petr Sojka, Aleš Horák. First Workshop on Recent Advances in Slavonic Natural Languages Processing, RASLAN 2007. Brno: Masaryk University. s. 21-26, 7 s. ISBN 978-80-210-4471-5. 2007. URL RASLAN 2007 Workshop web page info
    @inproceedings{746343,
      author = {Pala, Karel and Rychlý, Pavel and Šmerk, Pavel},
      address = {Brno},
      booktitle = {First Workshop on Recent Advances in Slavonic Natural Languages Processing, RASLAN 2007},
      editor = {Sojka, Petr and Horák, Aleš},
      keywords = {morphological analysis; partial syntactic analysis; noun groups detection},
      howpublished = {tištěná verze "print"},
      language = {eng},
      location = {Brno},
      isbn = {978-80-210-4471-5},
      pages = {21--26},
      publisher = {Masaryk University},
      title = {Morphological Analysis of Law texts},
      url = {http://nlp.fi.muni.cz/raslan/2007/papers/14.pdf},
      year = {2007}
    }
  • POMIKÁLEK, Jan a Vít SUCHOMEL. Chared. 2011. Domovská stránka software, online demo Repozitář zdrojového kódu, instalační balíček ke stažení info
    @misc{979276,
      author = {Pomikálek, Jan and Suchomel, Vít},
      title = {Chared},
      year = {2011},
      institution = {Masarykova univerzita},
      organization = {Masarykova univerzita},
      language = {eng},
      keywords = {character encoding; character encoding detection; charset; Unicode},
      url = {http://nlp.fi.muni.cz/projects/chared/}
    }
  • POMIKÁLEK, Jan a Vít SUCHOMEL. chared: Character Encoding Detection with a Known Language. In Aleš Horák, Pavel Rychlý. RASLAN 2011. 5. vyd. Brno, Czech Republic: Tribun EU. s. 125-129. ISBN 978-80-263-0077-9. 2011. URL info
    @inproceedings{959065,
      author = {Pomikálek, Jan and Suchomel, Vít},
      address = {Brno, Czech Republic},
      booktitle = {RASLAN 2011},
      edition = {5},
      editor = {Horák, Aleš and Rychlý, Pavel},
      keywords = {character encoding; character encoding detection; charset; Unicode},
      howpublished = {tištěná verze "print"},
      language = {eng},
      location = {Brno, Czech Republic},
      isbn = {978-80-263-0077-9},
      pages = {125--129},
      publisher = {Tribun EU},
      title = {chared: Character Encoding Detection with a Known Language},
      url = {https://nlp.fi.muni.cz/raslan/2011/paper16.pdf},
      year = {2011}
    }
  • SUCHOMEL, Vít a Jan POMIKÁLEK. Practical Web Crawling for Text Corpora. In A. Horák, P. Rychlý. Proceedings of Recent Advances in Slavonic Natural Language Processing, RASLAN 2011. Brno: Tribun EU. s. 97-108. ISBN 978-80-263-0077-9. 2011. URL info
    @inproceedings{959084,
      author = {Suchomel, Vít and Pomikálek, Jan},
      address = {Brno},
      booktitle = {Proceedings of Recent Advances in Slavonic Natural Language Processing, RASLAN 2011},
      editor = {Horák, Aleš and Rychlý, Pavel},
      keywords = {crawler; web crawling; corpus; web corpus; text corpus},
      howpublished = {tištěná verze "print"},
      language = {eng},
      location = {Brno},
      isbn = {978-80-263-0077-9},
      pages = {97--108},
      publisher = {Tribun EU},
      title = {Practical Web Crawling for Text Corpora},
      url = {https://nlp.fi.muni.cz/raslan/2011/paper09.pdf},
      year = {2011}
    }
  • ŠMERK, Pavel a Pavel RYCHLÝ. Majka – rychlý morfologický analyzátor. 2009. URL info
    @techreport{935762,
      author = {Šmerk, Pavel and Rychlý, Pavel},
      title = {Majka – rychlý morfologický analyzátor},
      year = {2009},
      institution = {Masarykova univerzita},
      organization = {Masarykova univerzita},
      language = {cze},
      keywords = {morphology; annotation; Czech; lemmatization; grammatical tags},
      url = {http://nlp.fi.muni.cz/ma/}
    }
  • SUCHOMEL, Vít. Recent Czech Web Corpora. In Aleš Horák, Pavel Rychlý. 6th Workshop on Recent Advances in Slavonic Natural Language Processing. Brno: Tribun EU. s. 77-83. ISBN 978-80-263-0313-8. 2012. URL info
    @inproceedings{1079512,
      author = {Suchomel, Vít},
      address = {Brno},
      booktitle = {6th Workshop on Recent Advances in Slavonic Natural Language Processing},
      editor = {Horák, Aleš and Rychlý, Pavel},
      keywords = {web corpora; czech corpus},
      howpublished = {tištěná verze "print"},
      language = {eng},
      location = {Brno},
      isbn = {978-80-263-0313-8},
      pages = {77--83},
      publisher = {Tribun EU},
      title = {Recent {Czech} Web Corpora},
      url = {https://nlp.fi.muni.cz/raslan/2012/paper11.pdf},
      year = {2012}
    }
  • SUCHOMEL, Vít. SpiderLing. 2012. Domovská stránka software, zdrojový kód info
    @misc{1095720,
      author = {Suchomel, Vít},
      keywords = {web crawler; web spider; text corpora},
      language = {eng},
      institution = {Masarykova univerzita},
      organization = {Masarykova univerzita},
      title = {{SpiderLing}},
      url = {http://nlp.fi.muni.cz/trac/spiderling/},
      year = {2012}
    }
  • ŠMERK, Pavel. Tools for Fast Morphological Analysis Based on Finite State Automata. In Eighth Workshop on Recent Advances in Slavonic Natural Language Processing. Brno: Tribun EU. s. 147-150. ISSN 2336-4289. 2014. URL info
    @inproceedings{1210712,
      author = {Šmerk, Pavel},
      address = {Brno},
      booktitle = {Eighth Workshop on Recent Advances in Slavonic Natural Language Processing},
      keywords = {morphological analysis; minimal deterministic finite state automata},
      howpublished = {tištěná verze "print"},
      language = {eng},
      location = {Brno},
      issn = {2336-4289},
      pages = {147--150},
      publisher = {Tribun EU},
      title = {Tools for Fast Morphological Analysis Based on Finite State Automata},
      url = {https://nlp.fi.muni.cz/raslan/2014/17.pdf},
      year = {2014}
    }
  • ŠMERK, Pavel. A New Data Format for Czech Morphological Analysis. In Petr Sojka, Aleš Horák. Proceedings of Fourth Workshop on Recent Advances in Slavonic Natural Languages Processing, RASLAN 2010. Brno: Tribun EU. s. 3-8. ISBN 978-80-7399-246-0. 2010. URL info
    @inproceedings{914403,
      author = {Šmerk, Pavel},
      address = {Brno},
      booktitle = {Proceedings of Fourth Workshop on Recent Advances in Slavonic Natural Languages Processing, RASLAN 2010},
      editor = {Sojka, Petr and Horák, Aleš},
      keywords = {morphology analysis; czech morphology},
      howpublished = {tištěná verze "print"},
      language = {eng},
      location = {Brno},
      isbn = {978-80-7399-246-0},
      pages = {3--8},
      publisher = {Tribun EU},
      title = {A New Data Format for {Czech} Morphological Analysis},
      url = {https://nlp.fi.muni.cz/raslan/2010/paper14.pdf},
      year = {2010}
    }
  • ŠMERK, Pavel. Deriv. 2010. URL info
    @misc{935735,
      author = {Šmerk, Pavel},
      title = {Deriv},
      year = {2010},
      institution = {Masarykova univerzita},
      organization = {Masarykova univerzita},
      language = {cze},
      keywords = {derivational relations; morphological analysis},
      url = {http://deb.fi.muni.cz/deriv}
    }
  • ŠMERK, Pavel. Fast Morphological Analysis of Czech. In Proceedings of the Raslan Workshop 2009. Brno: Masarykova univerzita. 4 s. ISBN 978-80-210-5048-8. 2009. URL info
    @inproceedings{866518,
      author = {Šmerk, Pavel},
      address = {Brno},
      booktitle = {Proceedings of the Raslan Workshop 2009},
      keywords = {morphological analysis; finite state automata},
      howpublished = {tištěná verze "print"},
      language = {eng},
      location = {Brno},
      isbn = {978-80-210-5048-8},
      publisher = {Masarykova univerzita},
      title = {Fast Morphological Analysis of {Czech}},
      url = {https://nlp.fi.muni.cz/raslan/2009/papers/13.pdf},
      year = {2009}
    }
  • ŠMERK, Pavel. Towards Czech Morphological Guesser. In Petr Sojka, Aleš Horák. Proceedings of Recent Advances in Slavonic Natural Language Processing, RASLAN 2008. Brno: Masarykova univerzita. s. 1-4. ISBN 978-80-210-4741-9. 2008. URL RASLAN 2008 Workshop web page info
    @inproceedings{805962,
      author       = {Šmerk, Pavel},
      title        = {Towards {Czech} Morphological Guesser},
      booktitle    = {Proceedings of Recent Advances in Slavonic Natural Language Processing, RASLAN 2008},
      editor       = {Sojka, Petr and Horák, Aleš},
      publisher    = {Masarykova univerzita},
      address      = {Brno},
      location     = {Brno},
      pages        = {1--4},
      year         = {2008},
      isbn         = {978-80-210-4741-9},
      url          = {http://nlp.fi.muni.cz/raslan/2008/papers/10.pdf},
      language     = {eng},
      keywords     = {morphological guesser; morphological analysis; morphological guessing},
      howpublished = {tištěná verze "print"}
    }
  • ŠMERK, Pavel. Morphemic Analysis: A Dictionary Lookup Instead of Real Analysis. In Petr Sojka, Aleš Horák. First Workshop on Recent Advances in Slavonic Natural Languages Processing, RASLAN 2007. Brno: Masaryk University. s. 77-85. ISBN 978-80-210-4471-5. 2007. URL RASLAN 2007 Workshop web page info
    @inproceedings{746346,
      author       = {Šmerk, Pavel},
      title        = {Morphemic Analysis: A Dictionary Lookup Instead of Real Analysis},
      booktitle    = {First Workshop on Recent Advances in Slavonic Natural Languages Processing, RASLAN 2007},
      editor       = {Sojka, Petr and Horák, Aleš},
      publisher    = {Masaryk University},
      address      = {Brno},
      location     = {Brno},
      pages        = {77--85},
      year         = {2007},
      isbn         = {978-80-210-4471-5},
      url          = {http://nlp.fi.muni.cz/raslan/2007/papers/8.pdf},
      language     = {eng},
      keywords     = {morphological analysis; morphemic analysis},
      howpublished = {tištěná verze "print"}
    }
  • ŠMERK, Pavel. Unsupervised Learning of Rules for Morphological Disambiguation. Lecture Notes in Computer Science. Berlin: Springer Verlag, roč. 3206, č. 1, s. 211-216. ISSN 0302-9743. 2004. info
    @article{558001,
      author           = {Šmerk, Pavel},
      title            = {Unsupervised Learning of Rules for Morphological Disambiguation},
      journal          = {Lecture Notes in Computer Science},
      volume           = {3206},
      pages            = {211--216},
      year             = {2004},
      issn             = {0302-9743},
      article_location = {Berlin},
      article_number   = {1},
      language         = {eng},
      keywords         = {morphological disambiguation; tagging; morphological tagging; unsupervised learning}
    }