<?xml version="1.0" encoding="UTF-8"?>
<!--
  Europeana Data Model (EDM) record in RDF/XML for one journal article served from dlib.si.
  Layout: three edm:WebResource entries (HTML, PDF and TEXT streams), one edm:TimeSpan,
  the edm:ProvidedCHO carrying the descriptive metadata, and the ore:Aggregation that
  ties the object to its providers, rights statement and access links.
-->
<rdf:RDF xmlns:dc="http://purl.org/dc/elements/1.1/"
         xmlns:edm="http://www.europeana.eu/schemas/edm/"
         xmlns:wgs84_pos="http://www.w3.org/2003/01/geo/wgs84_pos#"
         xmlns:foaf="http://xmlns.com/foaf/0.1/"
         xmlns:rdaGr2="http://rdvocab.info/ElementsGr2/"
         xmlns:oai="http://www.openarchives.org/OAI/2.0/"
         xmlns:owl="http://www.w3.org/2002/07/owl#"
         xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#"
         xmlns:ore="http://www.openarchives.org/ore/terms/"
         xmlns:skos="http://www.w3.org/2004/02/skos/core#"
         xmlns:dcterms="http://purl.org/dc/terms/">

  <!-- Digital representations of the object; dcterms:extent is the size as given by the source. -->
  <edm:WebResource rdf:about="http://www.dlib.si/stream/URN:NBN:SI:doc-MFAZGQZL/7cd47b22-3c48-4ce7-8916-903b5579a6a2/HTML">
    <dcterms:extent>65 KB</dcterms:extent>
  </edm:WebResource>
  <edm:WebResource rdf:about="http://www.dlib.si/stream/URN:NBN:SI:doc-MFAZGQZL/81101d9f-840a-42a7-99be-7d765e7b7824/PDF">
    <dcterms:extent>1015 KB</dcterms:extent>
  </edm:WebResource>
  <edm:WebResource rdf:about="http://www.dlib.si/stream/URN:NBN:SI:doc-MFAZGQZL/75fd6628-62eb-403e-9989-1f67f3f4a97b/TEXT">
    <dcterms:extent>50 KB</dcterms:extent>
  </edm:WebResource>

  <!-- Time span referenced by dcterms:temporal on the ProvidedCHO below. -->
  <edm:TimeSpan rdf:about="1948-2025">
    <edm:begin xml:lang="en">1948</edm:begin>
    <edm:end xml:lang="en">2025</edm:end>
  </edm:TimeSpan>

  <!-- Descriptive metadata of the article itself. -->
  <edm:ProvidedCHO rdf:about="URN:NBN:SI:doc-MFAZGQZL">
    <dcterms:isPartOf rdf:resource="https://www.dlib.si/details/URN:NBN:SI:spr-QOIKGUTE" />
    <dcterms:issued>2005</dcterms:issued>
    <dc:creator>Lönneker, Birte</dc:creator>
    <dc:format xml:lang="sl">številka:2</dc:format>
    <dc:format xml:lang="sl">letnik:53</dc:format>
    <dc:format xml:lang="sl">str. 193-210</dc:format>
    <!-- Identifiers follow a TYPE:value pattern, hence the doubled "URN:" prefix. -->
    <dc:identifier>ISSN:0350-6894</dc:identifier>
    <dc:identifier>COBISSID:30090594</dc:identifier>
    <dc:identifier>URN:URN:NBN:SI:doc-MFAZGQZL</dc:identifier>
    <dc:language>sl</dc:language>
    <dc:publisher xml:lang="sl">Slavistično društvo Slovenije</dc:publisher>
    <dcterms:isPartOf xml:lang="sl">Slavistična revija</dcterms:isPartOf>
    <dc:subject xml:lang="sl">korpusna lingvistika</dc:subject>
    <dc:subject xml:lang="sl">lematizacija</dc:subject>
    <dc:subject xml:lang="sl">Nova Beseda</dc:subject>
    <dc:subject xml:lang="sl">označevanje</dc:subject>
    <dc:subject xml:lang="en">Slovene</dc:subject>
    <dc:subject xml:lang="sl">slovenščina</dc:subject>
    <dc:subject xml:lang="en">TreeTagger</dc:subject>
    <dcterms:temporal rdf:resource="1948-2025" />
    <dc:title xml:lang="sl">Strojno oblikoslovno označevanje slovenskih besedil: kako daleč smo?</dc:title>
    <dc:description xml:lang="en">The article deals with part-of-speech tagging and lemmatization of Slovene texts. The first section explains how these procedures are performed. The second section presents results of experiments in automated tagging of Slovene texts, using a pre-tagged training corpus of one million words. The TreeTagger, a statistical tagger, was trained for Slovene and achieved a precision of about 85%. It tagged and lemmatized 100 million running words of the Slovene corpus Nova Beseda</dc:description>
    <!-- The line break inside the next value is part of the text; do not re-indent it. -->
    <dc:description xml:lang="sl">Članek obravnava oblikoslovno označevanje in lematizacijo slovenskih besedil. Prvo poglavje razlaga izvedbo teh postopkov. Drugo poglavje predstavi rezultate poskusov strojnega označevanja slovenskih besedil z uporabo milijonskega že označenega učnega korpusa. 
Za slovenščino prilagojen strojni označevalnik TreeTagger je dosegel točnost okoli 85 % in označil ter lematiziral 100 milijonov besed slovenskega korpusa Nova Beseda</dc:description>
    <edm:type>TEXT</edm:type>
    <dc:type xml:lang="sl">znanstveno časopisje</dc:type>
    <dc:type xml:lang="en">journals</dc:type>
    <dc:type rdf:resource="http://www.wikidata.org/entity/Q361785" />
  </edm:ProvidedCHO>

  <!-- Aggregation: links the object to its PDF view, landing page, rights and providers. -->
  <ore:Aggregation rdf:about="http://www.dlib.si/?URN=URN:NBN:SI:doc-MFAZGQZL">
    <edm:aggregatedCHO rdf:resource="URN:NBN:SI:doc-MFAZGQZL" />
    <edm:isShownBy rdf:resource="http://www.dlib.si/stream/URN:NBN:SI:doc-MFAZGQZL/81101d9f-840a-42a7-99be-7d765e7b7824/PDF" />
    <edm:rights rdf:resource="http://creativecommons.org/licenses/by/4.0/" />
    <edm:provider>Slovenian National E-content Aggregator</edm:provider>
    <edm:intermediateProvider xml:lang="en">National and University Library of Slovenia</edm:intermediateProvider>
    <edm:dataProvider xml:lang="sl">Slavistično društvo Slovenije</edm:dataProvider>
    <edm:object rdf:resource="http://www.dlib.si/streamdb/URN:NBN:SI:doc-MFAZGQZL/maxi/edm" />
    <edm:isShownAt rdf:resource="http://www.dlib.si/details/URN:NBN:SI:doc-MFAZGQZL" />
  </ore:Aggregation>
</rdf:RDF>