<?xml version='1.0' encoding='UTF-8'?><?xml-stylesheet href='static/style.xsl' type='text/xsl'?><OAI-PMH xmlns="http://www.openarchives.org/OAI/2.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://www.openarchives.org/OAI/2.0/ http://www.openarchives.org/OAI/2.0/OAI-PMH.xsd"><responseDate>2026-05-21T20:35:13Z</responseDate><request verb="GetRecord" identifier="oai:www.clarin.si:11356/1300" metadataPrefix="oai_dc">http://www.clarin.si/repository/oai/request</request><GetRecord><record><header><identifier>oai:www.clarin.si:11356/1300</identifier><datestamp>2024-05-12T16:47:44Z</datestamp><setSpec>hdl_11356_1023</setSpec><setSpec>hdl_11356_1024</setSpec></header><metadata><oai_dc:dc xmlns:oai_dc="http://www.openarchives.org/OAI/2.0/oai_dc/" xmlns:doc="http://www.lyncode.com/xoai" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:dc="http://purl.org/dc/elements/1.1/" xsi:schemaLocation="http://www.openarchives.org/OAI/2.0/oai_dc/ http://www.openarchives.org/OAI/2.0/oai_dc.xsd">
<dc:title>Slovenian parliamentary corpus (1990-2018) siParl 2.0</dc:title>
<dc:creator>Pančur, Andrej</dc:creator>
<dc:creator>Erjavec, Tomaž</dc:creator>
<dc:creator>Ojsteršek, Mihael</dc:creator>
<dc:creator>Šorn, Mojca</dc:creator>
<dc:creator>Blaj Hribar, Neja</dc:creator>
<dc:subject>parliamentary debates</dc:subject>
<dc:subject>Slovenian Parliament</dc:subject>
<dc:subject>TEI</dc:subject>
<dc:subject>Parla-CLARIN</dc:subject>
<dc:subject>universal dependencies</dc:subject>
<dc:description>The siParl corpus contains minutes of the Assembly of the Republic of Slovenia for the 11th legislative period 1990-1992, minutes of the National Assembly of the Republic of Slovenia from the 1st to the 7th legislative period 1992-2018, minutes of the working bodies of the National Assembly of the Republic of Slovenia from the 2nd to the 7th legislative period 1996-2018, and minutes of the Council of the President of the National Assembly from the 2nd to the 7th legislative period 1996-2018. The corpus comprises over 10 thousand sessions, one million speeches or 200 million words. The corpus contains meta-data about the speakers, a typology of sessions etc. and structural, editorial and linguistic annotations. The corpus is encoded according to the Parla-CLARIN schema (https://github.com/clarin-eric/parla-clarin). Each mandate is in one directory, and each session in one file.&#xd;
&#xd;
This item comprises the following datasets: &#xd;
1. source DARIAH-SI Parla-CLARIN encoded corpus; &#xd;
2. linguistically annotated Parla-CLARIN encoded corpus: tokenisation, MSD tagging, lemmatisation, Universal Dependencies features and syntactic parses, named entities;&#xd;
3. linguistically annotated corpus in vertical format used by CWB and Sketch Engine concordancers; this format is simpler and smaller but does not contain all the information from the source TEI;&#xd;
4. linguistically annotated corpus in CONLL-U format as used by Universal Dependencies;&#xd;
5. plain text of the corpus.&#xd;
&#xd;
Note that each dataset also includes TSV meta-data files on sessions (files) and speakers.&#xd;
&#xd;
As opposed to the previous version 1.0, this version corrects many errors, has substantially better meta-data and the linguistic processing has more levels and fewer errors.</dc:description>
<dc:date>2020-04-13</dc:date>
<dc:type>corpus</dc:type>
<dc:identifier>http://hdl.handle.net/11356/1300</dc:identifier>
<dc:language>slv</dc:language>
<dc:relation>http://hdl.handle.net/11356/1236</dc:relation>
<dc:relation>http://hdl.handle.net/11356/1748</dc:relation>
<dc:rights>Creative Commons - Attribution 4.0 International (CC BY 4.0)</dc:rights>
<dc:rights>https://creativecommons.org/licenses/by/4.0/</dc:rights>
<dc:rights>PUB</dc:rights>
<dc:format>application/zip</dc:format>
<dc:format>application/zip</dc:format>
<dc:format>application/zip</dc:format>
<dc:format>application/zip</dc:format>
<dc:format>application/zip</dc:format>
<dc:format>application/zip</dc:format>
<dc:format>text/plain; charset=utf-8</dc:format>
<dc:format>downloadable_files_count: 6</dc:format>
<dc:publisher>Institute of Contemporary History</dc:publisher>
<dc:source>https://github.com/DARIAH-SI/siParl/</dc:source>
</oai_dc:dc>
</metadata></record></GetRecord></OAI-PMH>