
@article{Masciolini-EtAl:2025,
  author    = {A. Masciolini and A. Caines and O. D. Clercq and J. Kruijsbergen and M. Kurfalı and R. M. Sanchez and E. Volodina and R. Ostling and K. Allkivi and S. A. Holdt and I. Auzina and R. Dargis and E. Drakonaki and J. Frey and I. Glisic and P. Kikilintza and L. Nicolas and M. Romanyshyn and A. Rosen and A. Rozovskaya and K. Suluste and O. Syvokon and A. Tantos and D. Touriki and K. Tsiotskas and E. Tsourilla and V. Varsamopoulos and K. Wisniewski and A. Zagar and T. Zesch},
  title     = {Towards better language representation in Natural Language Processing},
  journal   = {International Journal of Learner Corpus Research},
  publisher = {John Benjamins Publishing Company},
  volume    = 11,
  number    = 2,
  pages     = {309--335},
  year      = 2025,
  month     = may,
  doi       = {10.1075/ijlcr.24033.mas},
  url       = {https://www.jbe-platform.com/docserver/fulltext/ijlcr.24033.mas.pdf}
}


@inproceedings{Skadina-EtAl:2025,
  author    = {I. Skadina and B. Bakanovs and R. Dargis},
  title     = {First Steps in Benchmarking Latvian in Large Language Models},
  booktitle = {Proceedings of the Third Workshop on Resources and Representations for Under-Resourced Languages and Domains (RESOURCEFUL)},
  publisher = {University of Tartu Library},
  pages     = {86--95},
  year      = 2025,
  month     = mar,
  url       = {https://hdl.handle.net/10062/107120}
}


@inproceedings{Saulīte2025a,
  author    = {B. Saulite and R. Dargis and K. Pokratniece},
  title     = {Error Types in the Latvian Grammatical Error Correction and Fluency Corpus "Norma"},
  booktitle = {3rd UniDive Workshop in Budapest},
  year      = 2025,
  month     = jan,
  url       = {https://unidive.lisn.upsaclay.fr/lib/exe/fetch.php?media=meetings:general_meetings:3rd_unidive_general_meeting:16_error_types_in_the_latvian_.pdf}
}


@inproceedings{Znotins-EtAl-2025-WNUT,
  author    = {A. Znotins and N. Gruzitis and R. Dargis},
  title     = {From Conversational Speech to Readable Text: Post-Processing Noisy Transcripts in a Low-Resource Setting},
  booktitle = {Proceedings of the Tenth Workshop on Noisy and User-generated Text},
  publisher = {Association for Computational Linguistics},
  pages     = {143--148},
  year      = 2025,
  url       = {https://aclanthology.org/2025.wnut-1.15/}
}


@inproceedings{dargis-etal-2024-evaluating,
  author    = {R. Dargis and G. Barzdins and I. Skadina and N. Gruzitis and B. Saulite},
  title     = {Evaluating Open-Source LLMs in Low-Resource Languages: Insights from Latvian High School Exams},
  booktitle = {Proceedings of the 4th International Conference on Natural Language Processing for Digital Humanities},
  publisher = {Association for Computational Linguistics},
  pages     = {289--293},
  year      = 2024,
  month     = nov,
  url       = {https://aclanthology.org/2024.nlp4dh-1.28.pdf}
}


@inproceedings{dargis-etal-2024-balsutalka-lv,
  author    = {R. Dargis and A. Znotins and I. Auzina and B. Saulite and S. Reinsone and R. Dejus and A. Klavinska and N. Gruzitis},
  title     = {BalsuTalka.lv – Boosting the Common Voice Corpus for Low-Resource Languages},
  booktitle = {Joint International Conference on Computational Linguistics, Language Resources and Evaluation (LREC-COLING)},
  pages     = {2080},
  year      = 2024,
  month     = may,
  url       = {https://aclanthology.org/2024.lrec-main.187}
}


@article{Erjavec-EtAl:2024-LRE,
  author    = {T. Erjavec and M. Kopp and N. Ljubesic and T. Kuzman and P. Rayson and P. Osenova and M. Ogrodniczuk and C. Coltekin and D. Korzinek and K. Meden and J. Skubic and P. Rupnik and T. Agnoloni and J. Aires and S. Barkarson and R. Bartolini and N. Bel and M. C. Perez and R. Dargis and others},
  title     = {ParlaMint II: advancing comparable parliamentary corpora across Europe},
  journal   = {Language Resources and Evaluation},
  year      = 2024,
  doi       = {10.1007/s10579-024-09798-w},
  url       = {https://link.springer.com/article/10.1007/s10579-024-09798-w}
}


@article{Auzina-EtAl:2024,
  author    = {I. Auzina and N. Gruzitis and R. Dargis and G. Rabante-Busa and D. Gosko and J. Vempers and R. Kivkucans and A. Znotins},
  title     = {Recent Latvian Speech Corpora for Linguistic Research and Technology Development},
  journal   = {Baltic Journal of Modern Computing},
  publisher = {University of Latvia},
  volume    = 12,
  number    = 4,
  pages     = {646--658},
  year      = 2024,
  doi       = {10.22364/bjmc.2024.12.4.24},
  url       = {https://www.bjmc.lu.lv/fileadmin/user_upload/lu_portal/projekti/bjmc/Contents/12_4_24_Auzina.pdf}
}


@article{Dargis-Saulite:2024,
  author    = {R. Dargis and B. Saulite},
  title     = {Korpuss.lv – a Versatile Platform for Digital Humanities},
  journal   = {Baltic Journal of Modern Computing},
  publisher = {University of Latvia},
  volume    = 12,
  number    = 4,
  pages     = {636--645},
  year      = 2024,
  doi       = {10.22364/bjmc.2024.12.4.23},
  url       = {https://www.bjmc.lu.lv/fileadmin/user_upload/lu_portal/projekti/bjmc/Contents/12_4_23_Dargis.pdf}
}


@article{T.Erjavec2023a,
  author    = {T. Erjavec and M. Ogrodniczuk and P. Osenova and N. Ljubesic and K. Simov and A. Pancur and M. Rudolf and M. Kopp and S. Barkarson and S. Steingrimsson and C. Coltekin and J. de Does and K. Depuydt and T. Agnoloni and G. Venturi and M. C. Perez and L. de Macedo and C. Navarretta and G. Luxardo and M. Coole and P. Rayson and V. Morkevicius and T. Krilavicius and R. Dargis and O. Ring and R. van Heusden and M. Marx and D. Fiser},
  title     = {The ParlaMint corpora of parliamentary proceedings},
  journal   = {Language Resources and Evaluation},
  publisher = {Springer},
  volume    = 57,
  pages     = {415--448},
  year      = 2023,
  doi       = {10.1007/s10579-021-09574-0},
  url       = {https://link.springer.com/content/pdf/10.1007/s10579-021-09574-0.pdf}
}


@article{Saulite-EtAl:2023,
  author    = {B. Saulite and I. Auzina and R. Dargis},
  title     = {Nacionālā korpusu kolekcija Korpuss.lv},
  journal   = {Linguistica Lettica},
  publisher = {LU Latviešu valodas institūts},
  volume    = 31,
  number    = 1,
  pages     = {202--223},
  year      = 2023,
  doi       = {10.22364/lingualet.31.1},
  url       = {https://dspace.lu.lv/dspace/bitstream/handle/7/65577/Linguistica_Lettica_31-1.pdf?sequence=1&isAllowed=y}
}


@inproceedings{Znotins2022a,
  author    = {A. Znotins and R. Dargis and N. Gruzitis and G. Barzdins and D. Gosko},
  title     = {RUTA:MED – Dual Workflow Medical Speech Transcription Pipeline and Editor},
  booktitle = {Natural Language Processing and Information Systems},
  publisher = {Springer},
  volume    = 13286,
  pages     = {209--214},
  year      = 2022,
  month     = jun,
  doi       = {10.1007/978-3-031-08473-7_19}
}


@article{Skestere-Dargis:2022,
  author    = {L. Skestere and R. Dargis},
  title     = {Agenda-Setting Dynamics during COVID-19: Who Leads and Who Follows?},
  journal   = {Social Sciences},
  volume    = 11,
  number    = 12,
  pages     = {556},
  year      = 2022,
  doi       = {10.3390/socsci11120556},
  url       = {https://www.mdpi.com/2076-0760/11/12/556}
}


@inproceedings{Skadina-EtAl:2022:CLARIN,
  author    = {I. Skadina and I. Auzina and R. Dargis and E. Lasmanis and A. Voitkans},
  title     = {CLARIN-LV: Many Steps till Operation},
  booktitle = {CLARIN Annual Conference},
  pages     = {9--13},
  year      = 2022,
  url       = {https://office.clarin.eu/v/CE-2022-2118-CLARIN2022_ConferenceProceedings.pdf}
}


@article{Dargis-EtAl:2022:BalticHLT,
  author    = {R. Dargis and I. Auzina and I. Kaija and K. Levane-Petrova and K. Pokratniece},
  title     = {Corpus Based Self-Assessment Platform for Latvian Language Learners},
  journal   = {Baltic Journal of Modern Computing},
  volume    = 10,
  number    = 3,
  pages     = {392--401},
  year      = 2022,
  url       = {https://www.bjmc.lu.lv/fileadmin/user_upload/lu_portal/projekti/bjmc/Contents/10_3_12_Dargis.pdf}
}


@article{Auziņa-EtAl:2022b:Letonica,
  author    = {I. Auzina and R. Dargis and B. Saulite and N. Gruzitis and M. Grasmanis and A. Spektors and K. Stepanovs},
  title     = {Specializēta latviešu valodas runas korpusa un izrunas vārdnīcas izveide vizuālās diagnostikas izmeklējumu lingvistiskai analīzei un sistemātiskai transkribēšanai},
  journal   = {Letonica},
  volume    = 47,
  pages     = {244--262},
  year      = 2022,
  url       = {https://lulfmi.lv/files/letonica/47/13-development-of-a-specialized-latvian-speech-corpus-and-pronunciation-dictionary-for-the-linguistic-analysis-and-systematic-transcription-of-visual-diagnostic-exa}
}


@article{Auziņa-EtAl:2022a:Letonica,
  author    = {I. Auzina and R. Dargis and I. Kaija and K. Levane-Petrova and K. Pokratniece},
  title     = {Valodas korpusu izmantošana latviešu valodas uzdevumu automātiskā ģenerēšanā},
  journal   = {Letonica},
  volume    = 47,
  pages     = {264--282},
  year      = 2022,
  url       = {https://lulfmi.lv/files/letonica/47/14-use-of-the-language-corpora-in-automatic-generation-of-latvian-language-exercises.pdf}
}


@article{Skadina-EtAl:2022:Letonica,
  author    = {I. Skadina and I. Auzina and R. Dargis and A. Voitkans},
  title     = {CLARIN valodas resursu un rīku pētniecības infrastruktūra humanitārajām un sociālajām zinātnēm},
  journal   = {Letonica},
  volume    = 47,
  pages     = {312--327},
  year      = 2022,
  url       = {https://lulfmi.lv/files/letonica/47/17-clarin-language-resources-and-technology-infrastructure-for-the-humanities-and-social-sciences.pdf}
}


@inproceedings{Gruzitis-EtAl:2022:WorldS4,
  author    = {N. Gruzitis and R. Dargis and V. Lasmanis and G. Garkaje and D. Gosko},
  title     = {Adapting Automatic Speech Recognition to the Radiology Domain for a Less-Resourced Language: The Case of Latvian},
  booktitle = {Intelligent Sustainable Systems},
  publisher = {Springer},
  volume    = 333,
  pages     = {267--276},
  year      = 2022,
  doi       = {10.1007/978-981-16-6309-3_27},
  url       = {https://www.researchgate.net/publication/357554153_Adapting_Automatic_Speech_Recognition_to_the_Radiology_Domain_for_a_Less-Resourced_Language_The_Case_of_Latvian}
}


@inproceedings{Saulite-EtAl:2022:LREC,
  author    = {B. Saulite and R. Dargis and N. Gruzitis and I. Auzina and K. Levane-Petrova and L. Pretkalnina and L. Rituma and P. Paikens and A. Znotins and L. Strankale and K. Pokratniece and I. Poikans and G. Barzdins and I. Skadina and A. Baklane and V. Saulespurens and J. Ziedins},
  title     = {Latvian National Corpora Collection – Korpuss.lv},
  booktitle = {13th Language Resources and Evaluation Conference (LREC)},
  pages     = {5123--5129},
  year      = 2022,
  url       = {http://www.lrec-conf.org/proceedings/lrec2022/pdf/2022.lrec-1.548.pdf}
}


@inproceedings{Dargis-EtAl:2022:LREC,
  author    = {R. Dargis and I. Auzina and I. Kaija and K. Levane-Petrova and K. Pokratniece},
  title     = {LaVA – Latvian Language Learner corpus},
  booktitle = {13th Language Resources and Evaluation Conference (LREC)},
  pages     = {727--731},
  year      = 2022,
  url       = {http://www.lrec-conf.org/proceedings/lrec2022/pdf/2022.lrec-1.77.pdf}
}


@inproceedings{Auziņa-EtAl:2021:kongress,
  author    = {I. Auzina and I. Kaija and K. Levane-Petrova and K. Pokratniece and R. Dargis},
  title     = {Latviešu valodas apguvēju korpusa (LaVA) izmantošana pētniecībā un mācību uzdevumu izstrādē},
  booktitle = {Latviešu valodas apguve. XIII Starptautiskais baltistu kongress},
  publisher = {LiePA},
  pages     = {142--161},
  year      = 2021,
  doi       = {10.37384/LVA.2021.142},
  url       = {https://www.researchgate.net/publication/356607926_Latviesu_valodas_apguveju_korpusa_LaVA_izmantosana_petnieciba_un_macibu_uzdevumu_izstrade}
}


@inproceedings{Dargis-EtAl:2020c:BalticHLT,
  author    = {R. Dargis and I. Auzina and K. Levane-Petrova and I. Kaija},
  title     = {Detailed Error Annotation for Morphologically Rich Languages: Latvian Use Case},
  booktitle = {Human Language Technologies - The Baltic Perspective},
  publisher = {IOS Press},
  volume    = 328,
  pages     = {241--244},
  year      = 2020,
  doi       = {10.3233/FAIA200629},
  url       = {http://ebooks.iospress.nl/volumearticle/55550}
}


@inproceedings{Dargis-EtAl:2020b:BalticHLT,
  author    = {R. Dargis and N. Gruzitis and I. Auzina and K. Stepanovs},
  title     = {Creation of Language Resources for the Development of a Medical Speech Recognition System for Latvian},
  booktitle = {Human Language Technologies - The Baltic Perspective},
  publisher = {IOS Press},
  volume    = 328,
  pages     = {135--141},
  year      = 2020,
  doi       = {10.3233/FAIA200615},
  url       = {https://ebooks.iospress.nl/volumearticle/55536}
}


@inproceedings{Gruzitis-EtAl:2020:IFNW,
  author    = {N. Gruzitis and R. Dargis and L. Rituma and G. Nespore-Berzkalne and B. Saulite},
  title     = {Deriving a PropBank Corpus from Parallel FrameNet and UD Corpora},
  booktitle = {Proceedings of the International FrameNet Workshop 2020: Towards a Global, Multilingual FrameNet},
  pages     = {63--69},
  year      = 2020,
  url       = {https://www.aclweb.org/anthology/2020.framenet-1.9.pdf}
}


@inproceedings{Dargis-EtAl:2020a:BalticHLT,
  author    = {R. Dargis and K. Levane-Petrova and I. Poikans},
  title     = {Lessons Learned from Creating a Balanced Corpus from Online Data},
  booktitle = {Human Language Technologies - The Baltic Perspective},
  publisher = {IOS Press},
  volume    = 328,
  pages     = {127--134},
  year      = 2020,
  doi       = {10.3233/FAIA200614},
  url       = {https://ebooks.iospress.nl/volumearticle/55535}
}


@inproceedings{Dargis-EtAl:2020b:LREC,
  author    = {R. Dargis and I. Auzina and K. Levane-Petrova and I. Kaija},
  title     = {Quality Focused Approach to a Learner Corpus Development},
  booktitle = {Proceedings of The 12th Language Resources and Evaluation Conference (LREC)},
  pages     = {392--396},
  year      = 2020,
  url       = {https://www.aclweb.org/anthology/2020.lrec-1.49.pdf}
}


@inproceedings{Dargis-EtAl:2020a:LREC,
  author    = {R. Dargis and P. Paikens and N. Gruzitis and I. Auzina and A. Akmane},
  title     = {Development and Evaluation of Speech Synthesis Corpora for Latvian},
  booktitle = {Proceedings of The 12th Language Resources and Evaluation Conference (LREC)},
  pages     = {6633--6637},
  year      = 2020,
  url       = {https://www.aclweb.org/anthology/2020.lrec-1.818.pdf}
}


@inproceedings{Bojars-EtAl:2019:SEMANTiCS,
  author    = {U. Bojars and R. Dargis and U. Lavrinovics and P. Paikens},
  title     = {LinkedSaeima: a Linked Open Dataset of Latvia's Parliamentary Debates},
  booktitle = {Proceedings of the 15th SEMANTiCS Conference},
  publisher = {Springer},
  volume    = 11702,
  pages     = {50--56},
  year      = 2019,
  doi       = {10.1007/978-3-030-33220-4_4},
  url       = {https://link.springer.com/chapter/10.1007/978-3-030-33220-4_4}
}


@article{Urek-EtAl:2019:JBS,
  author    = {O. Urek and A. Vulane and R. Dargis and A. Taurina and T. Zirina and H. G. Simonsen},
  title     = {Latvian CDI: methodology, developmental trends and cross-linguistic comparison},
  journal   = {Journal of Baltic Studies},
  publisher = {Routledge},
  volume    = 50,
  number    = 3,
  pages     = {285--305},
  year      = 2019,
  doi       = {10.1080/01629778.2019.1590433}
}


@inproceedings{Auzina-EtAl:2019,
  author    = {I. Auzina and R. Dargis and K. Levane-Petrova},
  title     = {Latviešu valodas apguvēju kļūdu analīze: pareizrakstības kļūdas},
  booktitle = {Vārds un tā pētīšanas aspekti},
  publisher = {LiePA},
  number    = 23,
  pages     = {220--227},
  year      = 2019
}


@inproceedings{Dargis-Auzina:2018:BalticHLT,
  author    = {R. Dargis and I. Auzina},
  title     = {Towards a Modern Text-to-Speech System for Latvian},
  booktitle = {Human Language Technologies - The Baltic Perspective},
  publisher = {IOS Press},
  volume    = 307,
  pages     = {26--29},
  year      = 2018,
  doi       = {10.3233/978-1-61499-912-6-26},
  url       = {http://ebooks.iospress.nl/volumearticle/50300}
}


@inproceedings{Dargis-EtAl:2018:ParlaCLARIN,
  author    = {R. Dargis and I. Auzina and U. Bojars and P. Paikens and A. Znotins},
  title     = {Annotation of the Corpus of the Saeima with Multilingual Standards},
  booktitle = {Proceedings of the 2018 ParlaCLARIN Workshop},
  year      = 2018,
  url       = {http://lrec-conf.org/workshops/lrec2018/W2/pdf/21_W2.pdf}
}


@inproceedings{Dargis-EtAl:2018:LREC,
  author    = {R. Dargis and I. Auzina and K. Levane-Petrova},
  title     = {The Use of Text Alignment in Semi-Automatic Error Analysis: Use Case in the Development of the Corpus of the Latvian Language Learners},
  booktitle = {Proceedings of the 11th International Conference on Language Resources and Evaluation (LREC)},
  pages     = {4111--4115},
  year      = 2018,
  url       = {http://www.lrec-conf.org/proceedings/lrec2018/pdf/933.pdf}
}


@inproceedings{Spektors-EtAl:2016:LREC,
  author    = {A. Spektors and I. Auzina and R. Dargis and N. Gruzitis and P. Paikens and L. Pretkalnina and L. Rituma and B. Saulite},
  title     = {Tezaurs.lv: the largest open lexical database for Latvian},
  booktitle = {Proceedings of the 10th International Conference on Language Resources and Evaluation (LREC)},
  year      = 2016,
  url       = {http://www.lrec-conf.org/proceedings/lrec2016/pdf/1095_Paper.pdf}
}


@inproceedings{Auzina-EtAl:2016:BalticHLT,
  author    = {I. Auzina and K. Levane-Petrova and G. Rabante-Busa and R. Dargis and A. Fabregas},
  title     = {Designing an annotated longitudinal Latvian children's speech corpus},
  booktitle = {Human Language Technologies - The Baltic Perspective},
  publisher = {IOS Press},
  volume    = 289,
  year      = 2016,
  doi       = {10.3233/978-1-61499-701-6-46},
  url       = {http://ebooks.iospress.nl/volumearticle/45513}
}


@inproceedings{Dargis-EtAl:2016:BalticHLT,
  author    = {R. Dargis and G. Rabante-Busa and I. Auzina and S. Kruks},
  title     = {ParliSearch - A system for large text corpus discourse analysis},
  booktitle = {Human Language Technologies - The Baltic Perspective},
  publisher = {IOS Press},
  volume    = 289,
  year      = 2016,
  doi       = {10.3233/978-1-61499-701-6-115},
  url       = {http://ebooks.iospress.nl/volumearticle/45524}
}


@inproceedings{Znotins-EtAl:2015:INTERSPEECH,
  author    = {A. Znotins and K. Polis and R. Dargis},
  title     = {Media monitoring system for Latvian radio and TV broadcasts},
  booktitle = {Proceedings of the 16th Annual Conference of the International Speech Communication Association (INTERSPEECH)},
  year      = 2015,
  url       = {https://www.isca-archive.org/interspeech_2015/znotins15_interspeech.pdf}
}


@inproceedings{Dargis-Znotins:2014:BalticHLT,
  author    = {R. Dargis and A. Znotins},
  title     = {Baseline for keyword spotting in Latvian broadcast speech},
  booktitle = {Human Language Technologies - The Baltic Perspective},
  publisher = {IOS Press},
  volume    = 268,
  year      = 2014,
  doi       = {10.3233/978-1-61499-442-8-75},
  url       = {http://ebooks.iospress.nl/volumearticle/38007}
}


@inproceedings{Garkaje-EtAl:2014:BalticHLT,
  author    = {G. Garkaje and E. Zilgalve and R. Dargis},
  title     = {Normalization and automatized sentiment analysis of contemporary online Latvian Language},
  booktitle = {Human Language Technologies - The Baltic Perspective},
  publisher = {IOS Press},
  volume    = 268,
  year      = 2014,
  doi       = {10.3233/978-1-61499-442-8-83},
  url       = {http://ebooks.iospress.nl/volumearticle/38008}
}


@inproceedings{Auzina-EtAl:2014:BalticHLT,
  author    = {I. Auzina and M. Pinnis and R. Dargis},
  title     = {Comparison of rule-based and statistical methods for grapheme to phoneme modelling},
  booktitle = {Human Language Technologies - The Baltic Perspective},
  publisher = {IOS Press},
  volume    = 268,
  year      = 2014,
  doi       = {10.3233/978-1-61499-442-8-57},
  url       = {http://ebooks.iospress.nl/volumearticle/38004}
}


