{"?xml":{"@version":"1.0"},"edm:RDF":{"@xmlns:dc":"http://purl.org/dc/elements/1.1/","@xmlns:edm":"http://www.europeana.eu/schemas/edm/","@xmlns:wgs84_pos":"http://www.w3.org/2003/01/geo/wgs84_pos","@xmlns:foaf":"http://xmlns.com/foaf/0.1/","@xmlns:rdaGr2":"http://rdvocab.info/ElementsGr2","@xmlns:oai":"http://www.openarchives.org/OAI/2.0/","@xmlns:owl":"http://www.w3.org/2002/07/owl#","@xmlns:rdf":"http://www.w3.org/1999/02/22-rdf-syntax-ns#","@xmlns:ore":"http://www.openarchives.org/ore/terms/","@xmlns:skos":"http://www.w3.org/2004/02/skos/core#","@xmlns:dcterms":"http://purl.org/dc/terms/","edm:WebResource":{"@rdf:about":"http://www.dlib.si/stream/URN:NBN:SI:doc-I9685A02/e038c2e7-c7ad-4686-9f5f-9df0b59189b5/PDF","dcterms:extent":"283 KB"},"edm:TimeSpan":{"@rdf:about":"2005-2025","edm:begin":{"@xml:lang":"en","#text":"2005"},"edm:end":{"@xml:lang":"en","#text":"2025"}},"edm:ProvidedCHO":{"@rdf:about":"URN:NBN:SI:doc-I9685A02","dcterms:isPartOf":[{"@rdf:resource":"https://www.dlib.si/details/URN:NBN:SI:spr-M10OPZYO"},{"@xml:lang":"sl","#text":"Sodobna pedagogika"}],"dcterms:issued":"2025","dc:creator":["Arhar Holdt, Špela","Božič, Martin","Klemen, Matej","Robnik Šikonja, Marko"],"dc:format":[{"@xml:lang":"sl","#text":"številka:3"},{"@xml:lang":"sl","#text":"letnik:76"},{"@xml:lang":"sl","#text":"str. 
162–176"}],"dc:identifier":["ISSN:0038-0474","DOI:10.63384/sptB53z793a","COBISSID_HOST:259208195","URN:URN:NBN:SI:doc-I9685A02"],"dc:language":"en","dc:publisher":{"@xml:lang":"sl","#text":"Zveza društev pedagoških delavcev Slovenije"},"dc:subject":[{"@xml:lang":"en","#text":"educational domain"},{"@xml:lang":"en","#text":"grammatical error correction"},{"@xml:lang":"sl","#text":"izobraževalna domena"},{"@xml:lang":"en","#text":"large language models"},{"@xml:lang":"sl","#text":"popravljanje slovničnih napak"},{"@xml:lang":"sl","#text":"sintetiziranje podatkov"},{"@xml:lang":"en","#text":"synthetic data construction"},{"@xml:lang":"sl","#text":"veliki jezikovni modeli"}],"dcterms:temporal":{"@rdf:resource":"2005-2025"},"dc:title":{"@xml:lang":"en","#text":"Grammatical error correction of Slovenian school essays using large language models"},"dc:description":[{"@xml:lang":"en","#text":"Grammatical error correction (GEC) is the task of automatically detecting and correcting grammatical errors in text. Large language models have enabled the development of accurate automated methods for detecting and correcting certain types of errors. In the educational domain, the aim of GEC is to aid teachers in correcting student errors. Excessive paraphrasing is a property of Generative Pre-trained Transformer-based models and is undesirable in the language education context. To avoid this, we develop multiple Slovenian models for correcting errors in spelling, word case (capitalization), word form, and word order. We describe the training data construction, training process, and model evaluation approach using the Šolar-Eval 1.0 corpus of school essays authored by primary and secondary school students. Our quantitative evaluation shows that the developed models have reasonably high accuracy levels, and our qualitative evaluation highlights the strengths and weaknesses of the models and the evaluation process. 
The analysis reveals multiple challenges and promising future directions for improving both model development and the evaluation process."},{"@xml:lang":"sl","#text":"Strojno popravljanje slovničnih napak je naloga, ki zajema samodejno zaznavanje in popravljanje slovničnih napak v besedilu. Na področju izobraževanja je cilj metod pomagati učiteljem pri popravljanju napak učencev. Veliki jezikovni modeli omogočajo razvoj natančnih avtomatskih metod za zaznavanje in popravljanje določenih vrst napak. Da bi se izognili pretiranemu parafraziranju, ki je značilno za modele tipa GPT, in je v kontekstu poučevanja jezika nezaželeno, predstavimo več razvitih slovenskih modelov tipa BERT in T5 za popravljanje različnih vrst napak. Te vključujejo črkovalne napake, napake v rabi velikih začetnic, besednih oblik in besednega reda. V članku opišemo postopek ustvarjanja učnih podatkov, postopek učenja ter postopek evalvacije modelov na korpusu Šolar-Eval 1.0, ki vsebuje šolske spise osnovnošolcev in srednješolcev. Avtomatska evalvacija kaže razmeroma visoko natančnost razvitih modelov, medtem ko ročna kvalitativna evalvacija razkrije prednosti in slabosti razvitih modelov ter evalvacijskega postopka. 
Analiza razkriva številne izzive in obetavne smeri za nadaljnje izboljšave tako pri razvoju modelov kot pri postopku evalvacije."}],"edm:type":"TEXT","dc:type":[{"@xml:lang":"sl","#text":"znanstveno časopisje"},{"@xml:lang":"en","#text":"journals"},{"@rdf:resource":"http://www.wikidata.org/entity/Q361785"}]},"ore:Aggregation":{"@rdf:about":"http://www.dlib.si/?URN=URN:NBN:SI:doc-I9685A02","edm:aggregatedCHO":{"@rdf:resource":"URN:NBN:SI:doc-I9685A02"},"edm:isShownBy":{"@rdf:resource":"http://www.dlib.si/stream/URN:NBN:SI:doc-I9685A02/e038c2e7-c7ad-4686-9f5f-9df0b59189b5/PDF"},"edm:rights":{"@rdf:resource":"http://creativecommons.org/licenses/by-sa/4.0/"},"edm:provider":"Slovenian National E-content Aggregator","edm:intermediateProvider":{"@xml:lang":"en","#text":"National and University Library of Slovenia"},"edm:dataProvider":{"@xml:lang":"sl","#text":"Zveza društev pedagoških delavcev Slovenije"},"edm:object":{"@rdf:resource":"http://www.dlib.si/streamdb/URN:NBN:SI:doc-I9685A02/maxi/edm"},"edm:isShownAt":{"@rdf:resource":"http://www.dlib.si/details/URN:NBN:SI:doc-I9685A02"}}}}