<?xml version='1.0' encoding='UTF-8'?><?xml-stylesheet href='static/style.xsl' type='text/xsl'?><OAI-PMH xmlns="http://www.openarchives.org/OAI/2.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://www.openarchives.org/OAI/2.0/ http://www.openarchives.org/OAI/2.0/OAI-PMH.xsd"><responseDate>2026-06-30T06:19:28Z</responseDate><request verb="GetRecord" identifier="oai:www.clarin.si:11356/1227" metadataPrefix="oai_dc">http://www.clarin.si/repository/oai/request</request><GetRecord><record><header><identifier>oai:www.clarin.si:11356/1227</identifier><datestamp>2023-03-27T17:01:19Z</datestamp><setSpec>hdl_11356_1023</setSpec><setSpec>hdl_11356_1024</setSpec></header><metadata><oai_dc:dc xmlns:oai_dc="http://www.openarchives.org/OAI/2.0/oai_dc/" xmlns:doc="http://www.lyncode.com/xoai" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:dc="http://purl.org/dc/elements/1.1/" xsi:schemaLocation="http://www.openarchives.org/OAI/2.0/oai_dc/ http://www.openarchives.org/OAI/2.0/oai_dc.xsd">
<dc:title>Corpus extraction tool LIST 1.0</dc:title>
<dc:creator>Krsnik, Luka</dc:creator>
<dc:creator>Arhar Holdt, Špela</dc:creator>
<dc:creator>Čibej, Jaka</dc:creator>
<dc:creator>Dobrovoljc, Kaja</dc:creator>
<dc:creator>Ključevšek, Aleksander</dc:creator>
<dc:creator>Krek, Simon</dc:creator>
<dc:creator>Robnik-Šikonja, Marko</dc:creator>
<dc:subject>corpus linguistics</dc:subject>
<dc:subject>text processing</dc:subject>
<dc:subject>extraction</dc:subject>
<dc:subject>characters</dc:subject>
<dc:subject>word parts</dc:subject>
<dc:subject>words</dc:subject>
<dc:subject>word sets</dc:subject>
<dc:subject>n-grams</dc:subject>
<dc:subject>morphology</dc:subject>
<dc:description>The LIST corpus extraction tool is a Java program for extracting lists from text corpora on the levels of characters, word parts, words, and word sets. It supports VERT and TEI P5 XML formats and outputs .CSV files that can be imported into Microsoft Excel or similar statistical processing software.</dc:description>
<dc:date>2019-03-25</dc:date>
<dc:type>toolService</dc:type>
<dc:identifier>http://hdl.handle.net/11356/1227</dc:identifier>
<dc:language>slv</dc:language>
<dc:language>eng</dc:language>
<dc:relation>http://www.sdjt.si/wp/wp-content/uploads/2018/09/JTDH-2018_Kljucevsek-et-al_Ucinkovit-izracun-frekvencnih-statistik-za-slovenske-jezikovne-korpuse.pdf</dc:relation>
<dc:relation>https://gitea.cjvt.si/lkrsnik/list</dc:relation>
<dc:relation>http://hdl.handle.net/11356/1276</dc:relation>
<dc:rights>The MIT License (MIT)</dc:rights>
<dc:rights>https://opensource.org/licenses/mit-license.php</dc:rights>
<dc:rights>PUB</dc:rights>
<dc:format>application/zip</dc:format>
<dc:format>text/plain; charset=utf-8</dc:format>
<dc:format>downloadable_files_count: 1</dc:format>
<dc:publisher>Centre for Language Resources and Technologies, University of Ljubljana</dc:publisher>
<dc:publisher>Faculty of Computer and Information Science, University of Ljubljana</dc:publisher>
<dc:publisher>Jožef Stefan Institute</dc:publisher>
<dc:source>http://slovnica.ijs.si/</dc:source>
</oai_dc:dc>
</metadata></record></GetRecord></OAI-PMH>