<?xml version="1.0" encoding="UTF-8"?>
<TEI xmlns="http://www.tei-c.org/ns/1.0" xml:lang="en">
    <teiHeader>
        <fileDesc>
            <titleStmt>
                <title>Parlameter – a Corpus of Contemporary Slovene Parliamentary
                    Proceedings</title>
                <author>
                    <name>
                        <forename>Darja</forename>
                        <surname>Fišer</surname>
                        <affiliation>Department of Translation, Faculty of Arts, University of
                            Ljubljana</affiliation>
                        <address>
                            <addrLine>Aškerčeva 2</addrLine>
                            <addrLine>SI-1000 Ljubljana</addrLine>
                        </address>
                        <email>Darja.fiser@ff.uni-lj.si</email>
                        <affiliation>Department of Knowledge Technologies, Jožef Stefan
                            Institute</affiliation>
                        <address>
                            <addrLine>Jamova cesta 39</addrLine>
                            <addrLine>SI-1000 Ljubljana</addrLine>
                        </address>
                    </name>
                </author>
                <author>
                    <name>
                        <forename>Nikola</forename>
                        <surname>Ljubešič</surname>
                        <affiliation>Jožef Stefan Institute</affiliation>
                        <address>
                            <addrLine>Jamova cesta 39</addrLine>
                            <addrLine>SI-1000 Ljubljana</addrLine>
                        </address>
                        <email>nikola.ljubesic@ijs.si</email>
                    </name>
                </author>
                <author>
                    <name>
                        <forename>Tomaž</forename>
                        <surname>Erjavec</surname>
                        <affiliation>Department of Knowledge Technologies, Jožef Stefan
                            Institute</affiliation>
                        <address>
                            <addrLine>Jamova cesta 39</addrLine>
                            <addrLine>SI-1000 Ljubljana</addrLine>
                        </address>
                        <email>tomaz.erjavec@ijs.si</email>
                    </name>
                </author>
            </titleStmt>
            <editionStmt>
                <edition><date>2019-04-15</date></edition>
            </editionStmt>
            <publicationStmt>
                <publisher>
                    <orgName xml:lang="sl">Inštitut za novejšo zgodovino</orgName>
                    <orgName xml:lang="en">Institute of Contemporary History</orgName>
                    <address>
                        <addrLine>Kongresni trg 1</addrLine>
                        <addrLine>SI-1000 Ljubljana</addrLine>
                    </address>
                </publisher>
                <pubPlace>http://ojs.inz.si/pnz/article/view/327</pubPlace>
                <date>2019</date>
                <availability status="free">
                    <licence>http://creativecommons.org/licenses/by-nc-nd/4.0/</licence>
                </availability>
            </publicationStmt>
            <seriesStmt>
                <title xml:lang="sl">Prispevki za novejšo zgodovino</title>
                <title xml:lang="en">Contributions to Contemporary History</title>
                <biblScope unit="volume">59</biblScope>
                <biblScope unit="issue">1</biblScope>
                <idno type="ISSN">2463-7807</idno>
            </seriesStmt>
            <sourceDesc>
                <p>No source, born digital.</p>
            </sourceDesc>
        </fileDesc>
        <encodingDesc>
            <projectDesc xml:lang="en">
                <p>Contributions to Contemporary History is one of the central Slovenian scientific
                    historiographic journals, dedicated to publishing articles from the field of
                    contemporary history (the 19th and 20th century).</p>
                <p>The journal is published three times per year in Slovenian and in the following
                    foreign languages: English, German, Serbian, Croatian, Bosnian, Italian, Slovak
                    and Czech. The articles are all published with abstracts in English and
                    Slovenian as well as summaries in English.</p>
            </projectDesc>
            <projectDesc xml:lang="sl">
                <p>Prispevki za novejšo zgodovino je ena osrednjih slovenskih znanstvenih
                    zgodovinopisnih revij, ki objavlja teme s področja novejše zgodovine (19. in 20.
                    stoletje).</p>
                <p>Revija izide trikrat letno v slovenskem jeziku in v naslednjih tujih jezikih:
                    angleščina, nemščina, srbščina, hrvaščina, bosanščina, italijanščina, slovaščina
                    in češčina. Članki izhajajo z izvlečki v angleščini in slovenščini ter povzetki
                    v angleščini.</p>
            </projectDesc>
        </encodingDesc>
        <profileDesc>
            <langUsage>
                <language ident="sl"/>
                <language ident="en"/>
            </langUsage>
            <textClass>
                <keywords xml:lang="en">
                    <term>parliamentary proceedings</term>
                    <term>corpus construction</term>
                    <term>language technology</term>
                    <term>corpus analysis</term>
                </keywords>
                <keywords xml:lang="sl">
                    <term>parlamentarne razprave</term>
                    <term>izdelava korpusa</term>
                    <term>jezikovne tehnologije</term>
                    <term>korpusna analiza</term>
                </keywords>
            </textClass>
        </profileDesc>
        <revisionDesc>
            <listChange>
                <change>
                    <date>2019-06-10</date>
                    <name>Mihael Ojsteršek</name>
                    <desc>Pretvorba iz DOCX v TEI, dodatno kodiranje</desc>
                </change>
            </listChange>
        </revisionDesc>
    </teiHeader>
    <text>
        <front>
            <docAuthor>Darja Fišer<note place="foot" xml:id="ftn1" n="*"><hi
                        rend="footnote_reference"/>
                    <hi rend="bold">Department of Translation, Faculty of Arts, University of
                        Ljubljana, Aškerčeva cesta 2, SI-1000 Ljubljana, Department of Knowledge
                        Technologies, Jožef Stefan Institute, Jamova cesta 39, SI-1000 Ljubljana,
                        </hi><ref target="mailto:darja.fiser@ff.uni-lj.si"><hi rend="bold"
                            >darja.fiser@ff.uni-lj.si</hi></ref></note></docAuthor>
            <docAuthor>Nikola Ljubešič<note place="foot" xml:id="ftn2" n="**"><hi
                        rend="footnote_reference"/>
                    <hi rend="bold">Jožef Stefan Institute,
                        Jamova cesta 39, SI-1000 Ljubljana, </hi><ref
                        target="mailto:nikola.ljubesic@ijs.si"><hi rend="bold"
                            >nikola.ljubesic@ijs.si</hi></ref></note>
            </docAuthor>
            <docAuthor>Tomaž Erjavec<note place="foot" xml:id="ftn3" n="***"><hi
                        rend="footnote_reference"/>
                    <hi rend="bold">Department of Knowledge Technologies, Jožef Stefan Institute,
                        Jamova Cesta 39, SI-1000 Ljubljana, </hi><ref
                        target="mailto:tomaz.erjavec@ijs.si"><hi rend="bold"
                            >tomaz.erjavec@ijs.si</hi></ref></note>
            </docAuthor>
            <docImprint>
                <idno type="cobissType">Cobiss type: 1.01</idno>
                <idno type="UDC">UDC: 003.295: 342.537.6(497.4)"2014/2018"</idno>
            </docImprint>
            <div type="abstract" xml:lang="sl">
                <head>IZVLEČEK</head>
                <head>PARLAMETER – KORPUS RAZPRAV SLOVENSKEGA DRŽAVNEGA ZBORA</head>
                <p>
                    <hi rend="italic">V prispevku predstavimo korpus sodobnih parlamentarnih razprav
                        Parlameter, ki vsebuje razprave 7. mandata slovenskega Državnega zbora
                        (2014-2018). Korpus Parlameter vsebuje bogate metapodatke o govorcih (spol,
                        starost, izobrazba, strankarska pripadnost) in je jezikoslovno označen
                        (lematizacija, tegiranje), kar omogoča številne raziskave s področja
                        digitalne humanistike in družboslovja. V prispevku prikažemo potencial
                        korpusnoanalitičnih tehnik za raziskovanje političnih razprav. Korpusna
                        arhitektura je zasnovana tako, da omogoča širitev korpusa na druga časovna
                        obdobja, prav tako pa tudi vključevanje gradiv drugih parlamentov, začenši s
                        hrvaškim in bosanskim.</hi></p>
                <p>
                    <hi rend="italic">Ključne besede: parlamentarne razprave, izdelava korpusa,
                        jezikovne tehnologije, korpusna analiza</hi></p>
            </div>
            <div type="abstract">
                <head>ABSTRACT</head>
                <p>
                    <hi rend="italic">The paper presents the Parlameter corpus of contemporary
                        Slovene parliamentary proceedings, which covers the VIIth mandate of the
                        Slovene Parliament (2014-2018). The Parlameter corpus offers rich speaker
                        metadata (gender, age, education, party affiliation) and is linguistically
                        annotated (lemmatization, tagging), which boost research in several digital
                        humanities and social sciences disciplines. We demonstrate the potential of
                        the corpus analysis techniques for investigating political debates. The
                        corpus architecture allows for regular extensions of the corpus with
                        additional Slovene data, as well as data from other parliaments, starting
                        with Croatian and Bosnian.</hi></p>
                <p>
                    <hi rend="italic">Keywords: parliamentary proceedings, corpus construction,
                        language technology, corpus analysis</hi></p>
            </div>
        </front>
        <body>
            <div>
                <head>Introduction</head>
                <p>Parliamentary discourse is motivated by a wide range of communicative goals, from
                    position-claiming, persuasion and negotiation to agenda-setting and
                    opinion-building along ideological or party lines. It is characterized by
                    role-based commitments and confrontation and the awareness of a multi-layered
                    audience (<ref target="#Ilie.2017">Ilie 2017</ref>). The unique content,
                    structure and language of records of parliamentary debates are all factors that
                    make them an important object of study in a wide range disciplines in digital
                    humanities and social sciences, such as political science (<ref
                        target="#Dijk.2010">van Dijk 2010</ref>), sociology (<ref
                        target="#Cheng.2015">Cheng 2015</ref>), history (<ref
                        target="#Pančur.Šorn.2016">Pančur and Šorn 2016</ref>), discourse analysis
                        (<ref target="#Hirst.2014">Hirst et al. 2014</ref>), sociolinguistics (<ref
                        target="#Rheault.2016">Rheault et al. 2016</ref>), and multilinguality (<ref
                        target="#Bayley.2014">Bayley 2014</ref>).</p>
                <p>Despite the fact that parliamentary discourse has become an increasingly
                    important research topic in various fields of digital humanities and social
                    sciences in the past 50 years (<ref target="#Chester.1962">Chester and Bowring
                        1962</ref>; <ref target="#Franklin.1993">Franklin and Norton 1993</ref>), it
                    has only recently started to acquire a truly interdisciplinary scope (<ref
                        target="#Bayley.2014">Bayley 2014</ref>). Recent developments enable
                    cross-fertilization of linguistic studies with other disciplines and in-depth
                    exploration of institutional uses of language, interpersonal behaviour patterns,
                    interplay between language-shaped facts, and reality-prompted language
                    ritualization and change (<ref target="#Ihalainen.2016">Ihalainen et al.
                        2016</ref>).</p>
                <p>With an increasingly decisive role of parliaments and their rapidly changing
                    relations with the public, mass media, executive branch and international
                    organizations, further empirical research and development of integrative
                    analytical tools are necessary in order to achieve a better understanding of
                    parliamentary discourse as well as its wider societal impact, in particular with
                    studies that represent diverse parts of society (women, minorities, marginalized
                    groups) and cross-cultural studies (<ref target="#Hughes.2013">Hughes et al.
                        2013</ref>).</p>
            </div>
            <div>
                <head>Parliamentary Corpora</head>
                <p>The most distinguishing characteristic of records of parliamentary debates is
                    that they are essentially transcriptions of spoken language produced in
                    controlled and regulated circumstances. For this reason, they are rich in
                    invaluable (sociodemographic) meta-data. They are also easily available under
                    various Freedom of Information Acts set in place to enable informed
                    participation by the public and to improve effective functioning of democratic
                    systems, making the datasets even more valuable for researchers with
                    heterogeneous backgrounds.</p>
                <p>This has motivated a number of national as well as international initiatives (for
                    an overview, see <ref target="#Fišer.Lenardič.2018">Fišer and Lenardič
                        2018</ref>) to compile, process and analyse parliamentary corpora. They are
                    available for most countries within the CLARIN ERIC research infrastructure for
                    language resources and technology, with the UK’s Hansard Corpus being the
                    largest (1.6 billion tokens) and spanning the longest time period (1803-2005)
                    while corpora from other countries are significantly smaller (most comprise
                    between 10 and 100 million tokens) and cover significantly shorter periods
                    (mostly from the 1970s onwards).</p>
                <p>The Slovene parliamentary corpus SlovParl 2.0 (<ref target="#Pančur.2016">Pančur
                        2016</ref>) contains minutes of the Assembly of the Republic of Slovenia for
                    the legislative period 1990-1992 when Slovenia became an independent country.
                    The corpus comprises over 200 sessions, almost 60,000 speeches and 11 million
                    words. It contains extensive meta-data about the speakers, a typology of
                    sessions and structural and editorial annotations and is uniformly encoded to
                    the Text Encoding Initiative (TEI) Guidelines, a de-facto standard for encoding
                    and annotating textual data in Digital Humanities. It is available under the
                    CC-BY licence in the CLARIN.SI repository of language resources and via the
                    CLARIN.SI concordancers (<ref target="#Pančur.2017">Pančur et al. 2017</ref>).
                    SlovParl is thus an exemplary corpus but contains material from a quite limited,
                    and not very recent time period. This makes the corpus of limited use for the
                    rich body of research on recent parliamentary activities.</p>
                <p>Contemporary Slovenian parliamentary debates are monitored by the analytical tool
                        Parlameter<note place="foot" xml:id="ftn4" n="1">
                        <hi rend="italic">Parlameter</hi>, <ref target="https://parlameter.si/"
                            >https://parlameter.si</ref>.</note> which makes use of linguistic as
                    well as non-linguistic data, such as MPs' attendance and voting results. While
                    this is a very useful tool for journalists and citizen scientists and gives
                    valuable insight into contemporary parliamentary data, its functionality is
                    confined to that of the tool and as such cannot be freely manipulated by
                    scholars according to their specific research needs.</p>
                <p>The goal of the research presented in this paper was to convert the Parlameter
                    database into a freely and openly available linguistically annotated corpus
                    enriched with session and speaker metadata, and to showcase the analyses that
                    can be performed on such corpora via open-source tools for corpus analysis.
                    Section 3 gives the basic information on the corpus structure and size, Section
                    4 presents the analysis of the corpus according to the text and speaker metadata
                    by utilizing some of the best-known corpus analysis techniques, and Section 5
                    gives some conclusions and directions for further research.</p>
                <p>While the focus of the paper is the parliamentary language material which we
                    process with natural language processing and analyse with standard methods from
                    corpus linguistics, the aim of the analysis is to inform media and political
                    studies by transferring the presented methodology into these areas.</p>
            </div>
            <div>
                <head>Corpus Compilation</head>
                <p>The data dump from the Parlameter tool consisted of the minutes of the National
                    Assembly of the Republic of Slovenia from its VII<hi rend="superscript">th</hi>
                    mandate spanning sessions that started from 2014-08-01 to 2018-05-24 (the
                    complete mandated lasted till 2018-06-22). It was received from the Parlameter
                    API (application programming interface) as a series of JSON files, which were
                    first reorganised into a file containing speaker metadata and a file with the
                    transcriptions of the minutes with speaker identifiers. The speaker metadata
                    contains information about the speaker name and surname, and (for some speakers)
                    their sex, date of birth, education, and party affiliation. The complete speaker
                    metadata is available for the members of the parliament and of the government,
                    but not for, e.g., visiting field experts, representatives of governmental
                    agencies, non-governmental organizations or civil initiatives. This is why the
                    analyses in Section 4 are performed based on the instances for which the
                    metadata is available in the corpus.</p>
                <p>The transcriptions contain the ID of the session, name of the session (e.g. “<hi
                        rend="italic">4. izredna seja</hi>” - <hi rend="italic">4</hi><hi
                        rend="italic superscript">th</hi><hi rend="italic"> extraordinary
                        session</hi>), the date when the session started, and its speeches, each one
                    with the ID of the speaker and a number of segments, roughly corresponding to
                    paragraphs. As discussed below, the transcriptions also contain comments by the
                    transcribers.</p>
                <div>
                    <head>Normalisation of Speaker Data</head>
                    <p>The speaker data was normalised by removing extraneous spaces and removing
                        honorifics (sometimes the name was preceded by, e.g., “<hi rend="italic"
                            >Gospod</hi>” - <hi rend="italic">Mr.</hi>). Furthermore, in Slovene it
                        is relatively easy to infer the sex from the given name, so we also added
                        sex information to the speakers missing it.</p>
                </div>
                <div>
                    <head>Normalisation of Transcriptions</head>
                    <p>The JSON dump also contained empty speeches, as well as a significant amount
                        of duplicated speeches. These were removed, as well as extraneous spaces in
                        the text of the transcriptions.</p>
                    <p>Second, apart from the speeches, the minutes also contained 65,965 comments
                        on verbal and non-verbal behaviour of the speaker or the members of
                        parliament, and there are two types of such remarks. The first are written
                        between slashes and are mostly comments on audible incidents, e.g., <hi
                            rend="italic">/nerazumljivo/ (incomprehensible), /oglašanje iz dvorane/
                            (comments from the hall), /znak za konec razprave/ (sign for the end of
                            the discussion)</hi>. The second type of comments are written between
                        brackets and mainly denote voting results, e.g., <hi rend="italic">(nihče),
                            /nobody/, (10 članov) /10 members/, (proti 44) /44 against/</hi>. Both
                        types of comments have been removed from the transcriptions for the current
                        version of the corpus, as they are not part of the transcription proper and
                        would significantly complicate further processing. Furthermore, the content
                        of the comments is not uniform, with the same information written in various
                        ways (e.g. <hi rend="italic">/smeh/ - laughter, /smeh iz dvorane/ - laughter
                            from the hall, /smeh v dvorani/ - laughter in the hall</hi>), meaning
                        that the values would have to be unified before being converted to
                        appropriate corpus elements.</p>
                </div>
                <div>
                    <head>Linguistic Annotation</head>
                    <p>In the second stage, the text of the transcriptions was automatically
                        annotated with linguistic information. In particular, the text was
                        tokenised, i.e. split into words, punctuation marks and spaces, and
                        segmented into sentences, which was performed by the ReLDI tokeniser
                        (Ljubešić et al. 2016). Second, the words were part-of-speech tagged and
                        lemmatised, i.e. each word was assigned its context-dependent
                        morphosyntactic description and non-marked form, e.g., the words in “<hi
                            rend="italic">V naši sredini</hi>” - <hi rend="italic">In our midst</hi>
                        are assigned the MSDs “<hi rend="italic">Sl Ps1fslp Ncfsl</hi>” meaning
                        preposition in the locative case; the possessive pronoun in the first person
                        feminine singular locative with a plural owner number; and the feminine
                        common noun in the singular locative, while the lemmas are “<hi
                            rend="italic">v naš sredina</hi>”. The tagging and lemmatisation was
                        performed with the ReLDI tagger (<ref target="#Ljubešić.Erjavec.2016"
                            >Ljubešić and Erjavec 2016</ref>) using its model for Slovene. Finally,
                        the transcriptions were also tagged for named entities, i.e., names
                        identified in the corpus were marked and categorised into five classes,
                        those for persons, locations, organisations, for adjectives derived from a
                        person’s name (e.g. “<hi rend="italic">Cerarjev</hi>” - <hi rend="italic"
                            >Cerar’s</hi>), and a miscellaneous category. The named entity
                        annotation was performed with Janes-NER (<ref target="#Fišer.Ljubešić.2018"
                            >Fišer et al. 2018</ref>).</p>
                </div>
                <div>
                    <head>Corpus Encoding</head>
                    <p>The corpus is encoded in XML, according to the Text Encoding Initiative
                        Guidelines (<ref target="#TEIConsortium.">TEI Consortium 2017</ref>). The
                        complete corpus is stored as one TEI document, which contains its TEI header
                        with the metadata for the corpus, and its text body, containing the
                        transcriptions, one division for each starting date of the sessions; each
                        division is stored as a separate file, giving one root file for the corpus
                        and 525 files for the divisions.</p>
                    <p>The TEI header contains extensive metadata for the corpus as a whole, e.g.,
                        its authors and funders, the source description, the list and numbers of
                        elements used in the corpus, as well as the list of speakers and their
                        metadata. Most metadata is given both in Slovene and English.</p>
                    <p>As illustrated in Figure 1, the TEI text body date divisions contain a
                        division for each session, and then the utterances for each speaker, each
                        one containing one or more segments, which then contain the annotated
                        transcription.</p>

                    <figure>
                        <head>Figure 1: The TEI encoding of the corpus.</head>
                        <eg xml:space="preserve"><![CDATA[
<div xmlns="http://www.tei-c.org/ns/1.0" type="date">
  <docDate when="2014-08-26">26.08.2014–</docDate>
  <head>Mandat VII, 26.08.2014–</head>
  <div type="session">
    <head>2. redna seja</head>
    <docDate when="2014-08-26">26.08.2014–</docDate>
    <u xml:id="u529092" who="#spk11">
      <seg xml:id="u529092.seg1">
        <s xml:id="u529092.seg1.1">
          <w lemma="lepo" ana="mte:Rgp">Lepo</w><c> </c>
          <w lemma="pozdravljen" ana="mte:Appmpn">pozdravljeni</w>
          <pc ana="mte:Z">.</pc><c> </c>
        </s>
        <s xml:id="u529092.seg1.2">
          <w lemma="pričenjati" ana="mte:Vmpr1p">Pričenjamo</w><c> </c>
          <w lemma="2." ana="mte:Mdo">2.</w><c> </c>
          <w lemma="seja" ana="mte:Ncfsa">sejo</w><c> </c>
          <w lemma="kolegij" ana="mte:Ncmsg">Kolegija</w><c> </c>
          <w lemma="predsednik" ana="mte:Ncmsg">predsednika</w><c> </c>
          <name type="org">
            <w lemma="državen" ana="mte:Agpmsg">Državnega</w><c> </c>
            <w lemma="zbor" ana="mte:Ncmsg">zbora</w>
          </name>
          <pc ana="mte:Z">.</pc>
        </s>
]]></eg>
                    </figure>
                </div>
                <div>
                    <head>Corpus Size</head>
                    <p>Some basic statistics regarding the corpus are given in Table 1. In total,
                        the Parlameter corpus contains 371 sessions (as distinguished by their
                        title) which spanned over 525 days, i.e., 1.4 days per session on average.
                        If we count distinct sessions that started on a given day, the corpus
                        contains 1,338 such sessions. The VII<hi rend="superscript">th</hi> mandate
                        of the parliament heard 1,981 speakers who gave 133,287 speeches which
                        contain almost 35 million words, i.e., 67 speeches per speaker and 260 words
                        per speech on average. Due to a number of factors, such as different roles
                        of the speakers in the parliament, the distribution is, of course, far from
                        uniform, e.g., there is one speaker that gave 14,616 speeches, while 711
                        speakers gave only one speech.</p>
                    <table rend="table-scroll">
                        <head>Table 1: Basic statistic of the Parlameter corpus.</head>
                        <row>
                            <cell>Tokens</cell>
                            <cell style="text-align:right;">40,987,516</cell>
                        </row>
                        <row>
                            <cell>Words</cell>
                            <cell style="text-align:right;">34,882,499</cell>
                        </row>
                        <row>
                            <cell>Sentences</cell>
                            <cell style="text-align:right;">1,833,147</cell>
                        </row>
                        <row>
                            <cell>Utterances</cell>
                            <cell style="text-align:right;">133,287</cell>
                        </row>
                        <row>
                            <cell>Speakers</cell>
                            <cell style="text-align:right;">1,981</cell>
                        </row>
                        <row>
                            <cell>Sessions on date</cell>
                            <cell style="text-align:right;">1,338</cell>
                        </row>
                        <row>
                            <cell>Dates</cell>
                            <cell style="text-align:right;">525</cell>
                        </row>
                        <row>
                            <cell>Sessions</cell>
                            <cell style="text-align:right;">371</cell>
                        </row>
                    </table>
                </div>
                <div>
                    <head>Availability of the Corpus</head>
                    <p>The Parlameter corpus is available through CLARIN.SI. CLARIN is the European
                        research infrastructure for language resources and technologies, which makes
                        digital language resources available to scholars, researchers, students and
                        citizen-scientists from all disciplines, especially in the humanities and
                        social sciences, through single sign-on access. CLARIN offers long-term
                        solutions and technology services for deploying, connecting, analysing and
                        sustaining digital language data and tools. CLARIN is organised as a network
                        of national centres, with CLARIN.SI covering Slovenia. CLARIN.SI<note
                            place="foot" xml:id="ftn5" n="2">
                            <hi rend="italic">CLARIN Slovenia</hi>, <ref
                                target="http://www.clarin.si/info/about/"
                                >http://www.clarin.si/info/about/</ref>.</note> offers, inter alia,
                        two concordancers for on-line corpus exploration, and a repository of
                        language resources and tools, intended for their long-term archiving
                        together with support for different types of licences and an unambiguous way
                        for others to cite these resources, using Handle persistent identifiers. The
                        landing page of each resource also gives a cross-reference to the
                        concordancers for the particular corpus, and vice-versa. The repository also
                        exposes its metadata, which is being harvested by a number of other
                        services.</p>
                    <p>The Parlameter corpus is available through both CLARIN.SI concordancers, as
                        well as for download from its repository, both as a TEI document and in the
                        simpler vertical file format, under the liberal Creative Commons -
                        Attribution-ShareAlike (CC BY-SA 4.0) licence (<ref target="#Dobranić.2019"
                            >Dobranić et al. 2019</ref>). In this way we hope to raise interest
                        among other researchers to explore the corpus and make use of it in their
                        research.</p>
                </div>
            </div>
            <div>
                <head>Corpus Analysis</head>
                <p>By using the CLARIN.SI NoSketch Engine concordancer,<note place="foot"
                        xml:id="ftn6" n="3">
                        <hi rend="italic">NoSketch Engine @ CLARIN.SI</hi>, <ref
                            target="https://www.clarin.si/noske/"
                        >https://www.clarin.si/noske/</ref>.</note> we demonstrate the potential of
                    the basic corpus analysis techniques (<ref target="#Fišer.2013">Gorjanc and
                        Fišer 2013</ref>) for politology, history and other related humanities and
                    social sciences disciplines that base their research on large volumes of
                    language data. <hi rend="italic">Concordances</hi> are lists of all examples of
                    the search word or phrase from a corpus which are shown in the context they were
                    used in and are equipped with the available metadata. <hi rend="italic"
                        >Wordlists</hi> are comprehensive summarizations of the language inventory
                    in the corpus, organized by frequency or alphabetically. <hi rend="italic"
                        >Collocations</hi> are partly or fully fixed multi-word expressions which
                    have become established through usage. <hi rend="italic">Keywords</hi> are words
                    which appear in the focus corpus more frequently than they would in the general
                    language. Combined with the available text and speaker metadata, such as date,
                    speaker gender or political affiliation, they provide a powerful analytical tool
                    for discovering the commonalities and specificities of the linguistic footprint
                    and trends by different types of speakers in the parliament as will be shown in
                    the rest of this section.</p>
                <div>
                    <head>Production Volume and Vocabulary Size</head>
                    <p>As already presented in Table 1, the corpus contains nearly 41 million tokens
                        or 35 million words. noSketch Engine also offers the lexicon size of the
                        corpus, as given in Table 2, which shows that the corpus contains
                        approximately 263,000 different word forms (so, inflected words, e.g., <hi
                            rend="italic">Slovenije</hi>) and over 104,000 different lemmas (so,
                        base forms of words, e.g.,<hi rend="italic">Slovenija</hi>), and 1,080
                        different morphosyntactic tags (e.g.,<hi rend="italic">Verb main present
                            second plural</hi>). However, it should be noted that both lemmas and
                        the tags are automatically assigned, so they also contain some annotation
                        errors: the accuracy of morphosyntactic tags is around 94%, the accuracy of
                        lemmas is above 99%.</p>
                    <table rend="table-scroll">
                        <head>Table 2: Lexicon sizes of the Parlameter corpus.</head>
                        <row>
                            <cell>Unique words</cell>
                            <cell style="text-align:right;">263,007</cell>
                        </row>
                        <row>
                            <cell>Unique lemmas</cell>
                            <cell style="text-align:right;">104,247</cell>
                        </row>
                        <row>
                            <cell>Unique tags</cell>
                            <cell style="text-align:right;">1,080</cell>
                        </row>
                    </table>
                    <p>While the corpus contains parliamentary debates from the period 2014-2018 (see Table 3),
                        62% of the material was recorded in 2015 and 2016. Given the parliamentary
                        term, which lasted from 1 August 2014 to 14 April 2018, it is interesting to
                        observe an 8% smaller production in 2017 compared to the year before since
                        the last year of the term would be expectedly the busiest in order to wrap
                        up the workplan and set the ground for a new election cycle.</p>
                    <table rend="table-scroll">
                        <head>Table 3: Distribution of text quantity by year in Parlameter.</head>
                        <row role="label">
                            <cell>Year</cell>
                            <cell>No. of tokens</cell>
                            <cell>% of tokens</cell>
                            <cell>Rel. freq.</cell>
                        </row>
                        <row>
                            <cell style="text-align:right;">2014</cell>
                            <cell style="text-align:right;">3,759,110</cell>
                            <cell style="text-align:right;">9%</cell>
                            <cell style="text-align:right;">91,714</cell>
                        </row>
                        <row>
                            <cell style="text-align:right;">2015</cell>
                            <cell style="text-align:right;">12,441,754</cell>
                            <cell style="text-align:right;">30%</cell>
                            <cell style="text-align:right;">303,550</cell>
                        </row>
                        <row>
                            <cell style="text-align:right;">2016</cell>
                            <cell style="text-align:right;">13,270,257</cell>
                            <cell style="text-align:right;">32%</cell>
                            <cell style="text-align:right;">323,763</cell>
                        </row>
                        <row>
                            <cell style="text-align:right;">2017</cell>
                            <cell style="text-align:right;">9,944,401</cell>
                            <cell style="text-align:right;">24%</cell>
                            <cell style="text-align:right;">242,620</cell>
                        </row>
                        <row>
                            <cell style="text-align:right;">2018</cell>
                            <cell style="text-align:right;">1,571,994</cell>
                            <cell style="text-align:right;">4%</cell>
                            <cell style="text-align:right;">38,353</cell>
                        </row>
                        <row>
                            <cell>Total</cell>
                            <cell style="text-align:right;">40,987,516</cell>
                            <cell style="text-align:right;">100%</cell>
                            <cell style="text-align:right;">1,000,000</cell>
                        </row>
                    </table>
                </div>
                <div>
                    <head>Morphosyntactic Specificities of the Language in ParlaMeter</head>
                    <p>We performed a basic analysis of the morphosyntactic annotations of the
                        corpus in form of the most significant differences in their frequencies
                        between the Gigafida reference corpus of Slovene<note place="foot"
                            xml:id="ftn7" n="4">For this comparison we used the deduplicated version
                            of Gigafida 2.0. At the time of writing, this corpus was newly made and
                            does not yet have a reference publication. It is, however, freely
                            available for searching and analysis at <ref
                                target="https://www.clarin.si/noske/"
                                >https://www.clarin.si/noske/</ref>.</note> and the Parlameter
                        corpus, which are given in Table 4.<note place="foot" xml:id="ftn8" n="5"
                            >The morphosyntactic tags are given here in their expanded form to aid
                            understanding. The reference to these morphosyntactic descriptions is
                            given in <ref target="http://nl.ijs.si/ME/V6/msd/html/msd-sl.html"
                                >http://nl.ijs.si/ME/V6/msd/html/msd-sl.html</ref>.</note></p>
                    <table rend="table-scroll">
                        <head>Table 4: Most salient differences in morphosyntactic descriptions
                            between Gigafida 2.0 and Parlameter.</head>
                        <row role="label">
                            <cell style="text-align:center;">Gigafida</cell>
                            <cell style="text-align:center;">Parlameter</cell>
                        </row>
                        <row>
                            <cell>Residual web</cell>
                            <cell>Pronoun personal first singular nominative</cell>
                        </row>
                        <row>
                            <cell>Numeral roman cardinal</cell>
                            <cell>Verb main present second plural</cell>
                        </row>
                        <row>
                            <cell>Adjective possessive positive masculine singular
                                instrumental</cell>
                            <cell>Pronoun personal second masculine plural nominative</cell>
                        </row>
                        <row>
                            <cell>Auxiliary infinitive</cell>
                            <cell>Pronoun possessive first feminine singular genitive
                                singular</cell>
                        </row>
                        <row>
                            <cell>Adjective possessive positive masculine plural genitive</cell>
                            <cell>Verb main present first plural -Negative</cell>
                        </row>
                        <row>
                            <cell>Adjective possessive positive masculine singular locative</cell>
                            <cell>Verb main present second plural -Negative</cell>
                        </row>
                        <row>
                            <cell>Adjective possessive positive neuter singular locative</cell>
                            <cell>Pronoun demonstrative neuter plural accusative</cell>
                        </row>
                        <row>
                            <cell>Pronoun possessive third masculine singular accusative dual</cell>
                            <cell>Pronoun personal first singular accusative</cell>
                        </row>
                        <row>
                            <cell>Adjective possessive positive masculine singular nominative
                                -Definiteness</cell>
                            <cell>Verb main present first singular</cell>
                        </row>
                        <row>
                            <cell>Pronoun possessive third feminine plural locative singular
                                masculine</cell>
                            <cell>Verb main present first singular</cell>
                        </row>
                        <row>
                            <cell>Adjective possessive positive masculine plural nominative</cell>
                            <cell>Pronoun demonstrative masculine singular dative</cell>
                        </row>
                        <row>
                            <cell>Noun proper feminine plural dative</cell>
                            <cell>Pronoun indefinite feminine singular genitive</cell>
                        </row>
                        <row>
                            <cell>Numeral letter ordinal neuter plural genitive</cell>
                            <cell>Pronoun indefinite masculine singular accusative</cell>
                        </row>
                        <row>
                            <cell>Pronoun personal first dual accusative</cell>
                            <cell>Verb auxiliary present second plural -Negative</cell>
                        </row>
                        <row>
                            <cell>Pronoun personal first dual dative</cell>
                            <cell>Verb auxiliary future first singular -Negative</cell>
                        </row>
                        <row>
                            <cell>Noun proper neuter singular instrumental</cell>
                            <cell>Pronoun personal first masculine plural nominative</cell>
                        </row>
                        <row>
                            <cell>Adjective possessive positive feminine singular locative</cell>
                            <cell>Verb auxiliary present second plural +Negative</cell>
                        </row>
                        <row>
                            <cell>Pronoun personal second singular accusative bound</cell>
                            <cell>Verb main present first plural</cell>
                        </row>
                        <row>
                            <cell>Pronoun personal third masculine dual dative +Clitic</cell>
                            <cell>Pronoun indefinite feminine singular accusative</cell>
                        </row>
                        <row>
                            <cell>Adjective possessive positive masculine plural locative</cell>
                            <cell>Pronoun demonstrative feminine plural accusative</cell>
                        </row>
                    </table>
                    <p>The results show that the parliamentary speeches, as expected, contain more
                        present tense verb forms, especially in the first and second person singular
                        or plural (e.g., <hi rend="italic">imamo - we have, pozdravljam - I greet,
                            zaupate- you trust</hi>), as well as personal and demonstrative
                        pronouns, the former most prominently as the first person singular personal
                        pronoun (<hi rend="italic">jaz - I</hi>).</p>
                    <p>On the other hand, the parliamentary proceedings do not contain URLs or Roman
                        numerals. More interestingly, they also contain significantly fewer
                        possessive adjectives (e.g. <hi rend="italic">torkovim - Tuesday’s</hi>) and
                        pronouns (<hi rend="italic">njun - theirs</hi><hi rend="italic subscript"
                            >[dual]</hi>), proper names, numerals, personal pronouns in the dual
                        number (<hi rend="italic">naju - us two</hi>), or in second person singular
                        accusative (<hi rend="italic">nate - to you</hi>) than general Slovene.</p>
                </div>
                <div>
                    <head>Language and Gender in Parlameter</head>
                    <p>As Table 5 shows, gender is recorded for all but one speaker in the corpus.<note place="foot"
                            xml:id="ftn9" n="6">This missing information is due to errors in input
                            metadata records, which will be improved in the next version of the
                            corpus.</note> In total, 1,965 speakers are represented, 62% of which
                        are male and 38% female. Interestingly, the contribution from the speakers
                        is not proportionate to the distribution according to their gender, with the
                        male speakers contributing 71% of the tokens in the corpus and the female
                        speakers 29%. On the speech level the difference is even more pronounced as
                        the male speakers delivered 73% of the speeches while female speakers only
                        27%, indicating that, on average, the speeches given by female speakers were
                        somewhat longer than those by male speakers.</p>
                    <table rend="table-scroll">
                        <head>Table 5: Distribution of speakers and text production by gender in
                            Parlameter.</head>
                        <row role="label">
                            <cell>Gender</cell>
                            <cell style="text-align:center;">No. of speakers</cell>
                            <cell style="text-align:center;">% of speakers</cell>
                            <cell style="text-align:center;">No. of tokens</cell>
                            <cell style="text-align:center;">% of tokens</cell>
                        </row>
                        <row>
                            <cell>Female</cell>
                            <cell style="text-align:right;">747</cell>
                            <cell style="text-align:right;">38%</cell>
                            <cell style="text-align:right;">29,147,871</cell>
                            <cell style="text-align:right;">71%</cell>
                        </row>
                        <row>
                            <cell>Male</cell>
                            <cell style="text-align:right;">1217</cell>
                            <cell style="text-align:right;">62%</cell>
                            <cell style="text-align:right;">11,838,913</cell>
                            <cell style="text-align:right;">29%</cell>
                        </row>
                        <row>
                            <cell>Unknown</cell>
                            <cell style="text-align:right;">1</cell>
                            <cell style="text-align:right;">0%</cell>
                            <cell style="text-align:right;">732</cell>
                            <cell style="text-align:right;">0%</cell>
                        </row>
                        <row>
                            <cell>Total</cell>
                            <cell style="text-align:right;">1965</cell>
                            <cell style="text-align:right;">100%</cell>
                            <cell style="text-align:right;">40,987,516</cell>
                            <cell style="text-align:right;">100%</cell>
                        </row>
                    </table>
                    <p>Table 6, which lists top-ranking 10 female and male speakers and their
                        production in terms of tokens, shows that the most prolific male speakers
                        produced nearly twice as much material as their female counterparts.
                        Overall, all top 10 speakers except one (Miha Kordiš, male, the Levica
                        party) have a leading role in one or more parliamentary or governmental
                        bodies, including 2 ministers, both of which are female, 2 opposition deputy
                        group chairs, who are both male, and the Chair of the National Assembly who
                        is also male. Based on their roles in the parliament or the government,
                        top-ranking speakers represent issues on culture, corruption, judiciary,
                        finances, agriculture, foreign policy, education and infrastructure. In
                        terms of political orientation, the largest opposition party SDS is best
                        represented with 5 top-ranking male and 3 female speakers, including chair
                        and vice-chair of their deputy group. Among the top-ranking female speakers,
                        the entire political spectrum is represented while male speakers from the SD
                        and DeSUS parties do not make the list, and the SMC party is only
                        represented by the Chair of the National Assembly whose role is most likely
                        predominantly procedural, not to promote the party agenda.</p>
                    <table rend="table-scroll">
                        <head>Table 6: Top-ranking 10 female and male speakers and their text
                            production in Parlameter.</head>
                        <row role="label">
                            <cell style="text-align:center;">Female</cell>
                            <cell style="text-align:center;">Party affiliation // Role</cell>
                            <cell style="text-align:center;">Tok. <lb/> %</cell>
                            <cell>Male</cell>
                            <cell>Party affiliation // Role</cell>
                            <cell style="text-align:center;">Tok. <lb/> %</cell>
                        </row>
                        <row>
                            <cell>Anja B. Žibert</cell>
                            <cell>SDS // Chair of the Culture Committee</cell>
                            <cell style="text-align:right;">698,883 <lb/> 6%</cell>
                            <cell>Jožef Horvat</cell>
                            <cell>NSI // Chair of the Foreign Policy Committee; Chair of the Deputy
                                Group NSI</cell>
                            <cell style="text-align:right;">1,141,778 <lb/> 4%</cell>
                        </row>
                        <row>
                            <cell>Jelka Godec</cell>
                            <cell>SDS // Chair of the Inquiry Commission on the Misuse Practices in
                                Healthcare </cell>
                            <cell style="text-align:right;">530,029 <lb/> 4%</cell>
                            <cell>Jani Möderndorfer</cell>
                            <cell>ZAAB // Chair of the Inquiry Commission on bank money laundering;
                                Vice-chair of the Election Committee</cell>
                            <cell style="text-align:right;">1,062,546 <lb/> 4%</cell>
                        </row>
                        <row>
                            <cell>Iva Dimic</cell>
                            <cell>NSI // Vice-chair of the Judiciary Committee</cell>
                            <cell style="text-align:right;">509,101 <lb/> 4%</cell>
                            <cell>Franc Trček</cell>
                            <cell>Levica // Vice-chair of the Infrastructure Committee; Vice-chair
                                of the Inquiry Commission on bank money laundering</cell>
                            <cell style="text-align:right;">1,060,399 <lb/> 4%</cell>
                        </row>
                        <row>
                            <cell>Alenka Bratušek</cell>
                            <cell>ZAAB // Vice-chair of the Public Finances Committee; Vice-chair of
                                the Deupty Group ZAAB</cell>
                            <cell style="text-align:right;">483,171 <lb/> 4%</cell>
                            <cell>Milan Brglez</cell>
                            <cell>SMC // Chair of the National Assembly; Chair of the Constitution
                                Committee</cell>
                            <cell style="text-align:right;">948,334 <lb/> 3%</cell>
                        </row>
                        <row>
                            <cell>Violeta Tomić</cell>
                            <cell>Levica // Vice-chair of the Agriculture Committee</cell>
                            <cell style="text-align:right;">446,460 <lb/> 4%</cell>
                            <cell>Vinko Gorenak</cell>
                            <cell>SDS // Vice-chair of the Deputy Group SDS</cell>
                            <cell style="text-align:right;">788,678 <lb/> 3%</cell>
                        </row>
                        <row>
                            <cell>Eva Irgl</cell>
                            <cell>SDS // Chair of the petition committee</cell>
                            <cell style="text-align:right;">439,042 <lb/> 4%</cell>
                            <cell>Franc Breznik</cell>
                            <cell>SDS // Vice-chair of the Election Committee</cell>
                            <cell style="text-align:right;">763,437 <lb/> 3%</cell>
                        </row>
                        <row>
                            <cell>Urška Ban</cell>
                            <cell>SMC // Chair of the Finances and Monetary Policy Committee</cell>
                            <cell style="text-align:right;">382,425 <lb/> 3%</cell>
                            <cell>Jože Tanko</cell>
                            <cell>SDS // Chair of the Deputy Group SDS</cell>
                            <cell style="text-align:right;">752,130 <lb/> 3%</cell>
                        </row>
                        <row>
                            <cell>Mateja V. Erman</cell>
                            <cell>Minister of Finance</cell>
                            <cell style="text-align:right;">381,604 <lb/> 3%</cell>
                            <cell>Andrej Šircelj</cell>
                            <cell>SDS // Chair of the Public Finances Committee</cell>
                            <cell style="text-align:right;">721,135 <lb/> 2%</cell>
                        </row>
                        <row>
                            <cell>Bojana Muršič</cell>
                            <cell>SD // Vice-chair of the National Assembly, Vice-chair of the
                                Education Committee</cell>
                            <cell style="text-align:right;">366,547 <lb/> 3%</cell>
                            <cell>Tomaž Lisec</cell>
                            <cell>SDS // Chair of the Agriculture Committee</cell>
                            <cell style="text-align:right;">707,666 <lb/> 2%</cell>
                        </row>
                        <row>
                            <cell>Julijana B. Mlakar</cell>
                            <cell>DeSUS // Minister of Culture; Vice-chair of the Foreign Policy
                                Committee</cell>
                            <cell style="text-align:right;">308,355 <lb/> 3%</cell>
                            <cell>Miha Kordiš</cell>
                            <cell>Levica</cell>
                            <cell style="text-align:right;">676,717 <lb/> 2%</cell>
                        </row>
                    </table>
                    <p>In order to compare the topics discussed by female and male speakers in the
                        Slovene parliament, we analysed their 100 top-ranking key lemmas, where we
                        used the corpus of all female speakers as the target corpus against the
                        reference corpus of all male speakers in the Parlameter corpus, and vice
                        versa, so the two lists display the distinguishing features of each of the
                        groups. By observing their contexts via concordances, we manually classified
                        them into one of the 13 topics represented by the ministries in the
                        Slovenian government:</p>
                    <list type="unordered">
                        <item><hi rend="italic">agriculture, forestry and food</hi></item>
                        <item><hi rend="italic">culture</hi></item>
                        <item><hi rend="italic">defence</hi></item>
                        <item><hi rend="italic">economy and technology</hi></item>
                        <item><hi rend="italic">education, science and sport</hi></item>
                        <item><hi rend="italic">environment and spatial planning</hi></item>
                        <item><hi rend="italic">finance</hi></item>
                        <item><hi rend="italic">health</hi></item>
                        <item><hi rend="italic">foreign affairs</hi></item>
                        <item><hi rend="italic">infrastructure</hi></item>
                        <item><hi rend="italic">interior</hi></item>
                        <item><hi rend="italic">justice</hi></item>
                        <item><hi rend="italic">labour, family and social affairs</hi></item>
                        <item><hi rend="italic">public administration</hi></item>
                    </list>
                    <p>In addition, we introduced 4 additional categories for words that could not
                        be classified into any of the topics above:</p>
                    <list type="unordered">
                        <item><hi rend="italic">interaction/procedural</hi> for keywords which
                            referred to other people attending the session (e.g., references to
                            names of other speakers, <hi rend="italic">predsednik - chairman</hi>)
                            or expressed procedural matters during the session (e.g., <hi
                                rend="italic">prisotni - present, dobrodošli - welcome</hi>)</item>
                        <item><hi rend="italic">style</hi> for keywords which were either distinctly
                            colloquial or distinctly formal and were frequently used only by a
                            single or very few speakers in order to achieve a special effect (e.g.,
                                <hi rend="italic">penez</hi>, a very informal expression for money,
                                <hi rend="italic">šiht</hi>, a very informal expression for
                            job)</item>
                        <item><hi rend="italic">ideology</hi> for keywords which were used to
                            ideologically label an individual speaker or a group of speakers (e.g.,
                                <hi rend="italic">levičarski - leftist, kapitalizem -
                                capitalism</hi>)</item>
                        <item><hi rend="italic">multiple</hi> for keywords which were used in
                            several topics (e.g., <hi rend="italic">zgodnji - early, fantastičen -
                                fantastic</hi>).</item>
                    </list>
                    <p>As can be seen from Table 7, the most frequent topics among the female
                        speakers are <hi rend="italic">health</hi> (35) and <hi rend="italic"
                            >labour, family and social affairs</hi> (33), which are followed by <hi
                            rend="italic">public administration</hi> (13) and <hi rend="italic"
                            >education, science and sport</hi> (8). Most of the 100 top-ranking
                        keywords uttered by male speakers, on the other hand, could not be
                        classified into a single topic because they were used either to achieve a
                            <hi rend="italic">stylistic effect</hi> (24), were general words that
                        were used in <hi rend="italic">multiple topics</hi>, such as descriptive
                        adjectives or legal terms (22), or <hi rend="italic">ideological
                            expressions</hi> (6), all of which indicate a more discursive, debating
                        style of the male speakers, but could also stem from the fact that the
                        leading roles in that term were predominantly held by male members of
                            parliament.<note place="foot" xml:id="ftn10" n="7">This problem could be
                            avoided by removing outliers regarding production in the dataset before
                            performing the analyses. But our goal here was to present the complete
                            corpus and demonstrate the basic corpus analysis techniques.</note>
                        Despite being much more infrequent than in the female part of the corpus
                        overall, the most frequently represented specific topics by male speakers
                        are <hi rend="italic">infrastructure</hi> (9), <hi rend="italic"
                            >interior</hi> (6), <hi rend="italic">agriculture, forestry and
                            food</hi> (5), and <hi rend="italic">defence</hi> (5), suggesting a
                        significant difference in the roles and interests of male and female
                        speakers in the Slovene parliament.</p>
                    <table rend="table-scroll">
                        <head>Table 7: Topics of 100 top-ranking keywords of female and male
                            speakers in Parlameter.</head>
                        <row role="label">
                            <cell>Topics – female</cell>
                            <cell style="text-align:right;">Freq.</cell>
                            <cell style="text-align:right;">Topics - male</cell>
                            <cell style="text-align:right;">Freq.</cell>
                        </row>
                        <row>
                            <cell>health</cell>
                            <cell style="text-align:right;">35</cell>
                            <cell style="text-align:right;">style</cell>
                            <cell style="text-align:right;">24</cell>
                        </row>
                        <row>
                            <cell>labour, family &amp; social affairs</cell>
                            <cell style="text-align:right;">33</cell>
                            <cell style="text-align:right;">multiple</cell>
                            <cell style="text-align:right;">22</cell>
                        </row>
                        <row>
                            <cell>public administration</cell>
                            <cell style="text-align:right;">13</cell>
                            <cell style="text-align:right;">infrastructure</cell>
                            <cell style="text-align:right;">9</cell>
                        </row>
                        <row>
                            <cell>education, science &amp; sport</cell>
                            <cell style="text-align:right;">8</cell>
                            <cell style="text-align:right;">interior</cell>
                            <cell style="text-align:right;">6</cell>
                        </row>
                        <row>
                            <cell>interaction/procedural</cell>
                            <cell style="text-align:right;">3</cell>
                            <cell style="text-align:right;">ideology</cell>
                            <cell style="text-align:right;">6</cell>
                        </row>
                        <row>
                            <cell>multiple</cell>
                            <cell style="text-align:right;">3</cell>
                            <cell style="text-align:right;">interaction/procedural</cell>
                            <cell style="text-align:right;">5</cell>
                        </row>
                        <row>
                            <cell>environment &amp; spatial planning</cell>
                            <cell style="text-align:right;">1</cell>
                            <cell style="text-align:right;">agriculture, forestry &amp; food</cell>
                            <cell style="text-align:right;">5</cell>
                        </row>
                        <row>
                            <cell>agriculture, forestry &amp; food</cell>
                            <cell style="text-align:right;">1</cell>
                            <cell style="text-align:right;">defense</cell>
                            <cell style="text-align:right;">5</cell>
                        </row>
                        <row>
                            <cell>culture</cell>
                            <cell style="text-align:right;">1</cell>
                            <cell style="text-align:right;">foreign affairs</cell>
                            <cell style="text-align:right;">4</cell>
                        </row>
                        <row>
                            <cell>finance</cell>
                            <cell style="text-align:right;">1</cell>
                            <cell style="text-align:right;">finance</cell>
                            <cell style="text-align:right;">4</cell>
                        </row>
                        <row>
                            <cell>economy &amp; technology</cell>
                            <cell style="text-align:right;">1</cell>
                            <cell style="text-align:right;">justice</cell>
                            <cell style="text-align:right;">3</cell>
                        </row>
                        <row>
                            <cell>Total</cell>
                            <cell style="text-align:right;">100</cell>
                            <cell style="text-align:right;">Total</cell>
                            <cell style="text-align:right;">100</cell>
                        </row>
                    </table>
                    <p>Illustrative examples of the 10 top-ranking female- and male-specific
                        keywords with a manually assigned topic are listed in Tables 8 and 9.</p>
                    <table rend="table-scroll">
                        <head>Table 8: Most frequent keywords, topics and word type among female
                            speakers in Parlameter. N stands for nouns, Adj for adjectives, and NP
                            for proper nouns (names).</head>
                        <row role="label">
                            <cell>Lemma – English translation</cell>
                            <cell>Topic</cell>
                            <cell>PoS</cell>
                            <cell>Freq.</cell>
                            <cell>Freq_ref</cell>
                            <cell>Score</cell>
                        </row>
                        <row>
                            <cell>rejništvo – fostercare</cell>
                            <cell>labour, family &amp; social affairs</cell>
                            <cell>N</cell>
                            <cell style="text-align:right;">264</cell>
                            <cell style="text-align:right;">59</cell>
                            <cell>7.7</cell>
                        </row>
                        <row>
                            <cell>mark – mark</cell>
                            <cell>health</cell>
                            <cell>PN</cell>
                            <cell style="text-align:right;">155</cell>
                            <cell style="text-align:right;">29</cell>
                            <cell>7.1</cell>
                        </row>
                        <row>
                            <cell>enostarševski – single-parent</cell>
                            <cell>labour, family &amp; social affairs</cell>
                            <cell>Adj</cell>
                            <cell style="text-align:right;">167</cell>
                            <cell style="text-align:right;">38</cell>
                            <cell>6.6</cell>
                        </row>
                        <row>
                            <cell>roditeljski – parent</cell>
                            <cell>labour, family &amp; social affairs</cell>
                            <cell>Adj</cell>
                            <cell style="text-align:right;">169</cell>
                            <cell style="text-align:right;">39</cell>
                            <cell>6.5</cell>
                        </row>
                        <row>
                            <cell>medical – medical</cell>
                            <cell>health</cell>
                            <cell>PN</cell>
                            <cell style="text-align:right;">128</cell>
                            <cell style="text-align:right;">26</cell>
                            <cell>6.2</cell>
                        </row>
                        <row>
                            <cell>plazma – plasma</cell>
                            <cell>health</cell>
                            <cell>N</cell>
                            <cell style="text-align:right;">82</cell>
                            <cell style="text-align:right;">9</cell>
                            <cell>6.1</cell>
                        </row>
                        <row>
                            <cell>pacientov – patient’s</cell>
                            <cell>health</cell>
                            <cell>Adj</cell>
                            <cell style="text-align:right;">282</cell>
                            <cell style="text-align:right;">97</cell>
                            <cell>5.7</cell>
                        </row>
                        <row>
                            <cell>zaznamba – notice</cell>
                            <cell>public administration</cell>
                            <cell>N</cell>
                            <cell style="text-align:right;">155</cell>
                            <cell style="text-align:right;">43</cell>
                            <cell>5.7</cell>
                        </row>
                        <row>
                            <cell>žilen – stent</cell>
                            <cell>health</cell>
                            <cell>Adj</cell>
                            <cell style="text-align:right;">518</cell>
                            <cell style="text-align:right;">213</cell>
                            <cell>5.4</cell>
                        </row>
                        <row>
                            <cell>duševen – mental</cell>
                            <cell>health</cell>
                            <cell>Adj</cell>
                            <cell style="text-align:right;">393</cell>
                            <cell style="text-align:right;">156</cell>
                            <cell>5.4</cell>
                        </row>
                        <row>
                            <cell>nasilnež – violent person</cell>
                            <cell>labour, family &amp; social affairs</cell>
                            <cell>N</cell>
                            <cell style="text-align:right;">98</cell>
                            <cell style="text-align:right;">21</cell>
                            <cell>5.4</cell>
                        </row>
                    </table>
                    <table rend="table-scroll">
                        <head>Table 9: Most frequent keywords, topics and word type among male
                            speakers in Parlameter.</head>
                        <row role="label">
                            <cell>lemma – English translation</cell>
                            <cell>category</cell>
                            <cell>PoS</cell>
                            <cell>Freq_ref</cell>
                            <cell>Score</cell>
                        </row>
                        <row>
                            <cell>penez – inf. money</cell>
                            <cell>finance</cell>
                            <cell>N</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell>13.2</cell>
                        </row>
                        <row>
                            <cell>navsezadnje – nevertheless</cell>
                            <cell>multiple</cell>
                            <cell>Adv</cell>
                            <cell style="text-align:right;">90</cell>
                            <cell>8.4</cell>
                        </row>
                        <row>
                            <cell>kubik – cubic</cell>
                            <cell>agriculture, forestry &amp; food</cell>
                            <cell>N</cell>
                            <cell style="text-align:right;">10</cell>
                            <cell>7.8</cell>
                        </row>
                        <row>
                            <cell>islam – Islam</cell>
                            <cell>interior</cell>
                            <cell>N</cell>
                            <cell style="text-align:right;">6</cell>
                            <cell>6.4</cell>
                        </row>
                        <row>
                            <cell>levičarski – leftist</cell>
                            <cell>ideology</cell>
                            <cell>Adj</cell>
                            <cell style="text-align:right;">2</cell>
                            <cell>6.2</cell>
                        </row>
                        <row>
                            <cell>navzoč – present</cell>
                            <cell>interaction/procedural</cell>
                            <cell>Adj</cell>
                            <cell style="text-align:right;">211</cell>
                            <cell>6.0</cell>
                        </row>
                        <row>
                            <cell>avtošola – driving school</cell>
                            <cell>infrastructure</cell>
                            <cell>N</cell>
                            <cell style="text-align:right;">1</cell>
                            <cell>5.8</cell>
                        </row>
                        <row>
                            <cell>socialist – socialist</cell>
                            <cell>ideology</cell>
                            <cell>N</cell>
                            <cell style="text-align:right;">25</cell>
                            <cell>5.5</cell>
                        </row>
                        <row>
                            <cell>svojevrsten – peculiar</cell>
                            <cell>multiple</cell>
                            <cell>Adj</cell>
                            <cell style="text-align:right;">16</cell>
                            <cell>5.4</cell>
                        </row>
                        <row>
                            <cell>e-klopa – e-bench</cell>
                            <cell>interaction/procedural</cell>
                            <cell>N</cell>
                            <cell style="text-align:right;">1</cell>
                            <cell>5.3</cell>
                        </row>
                        <row>
                            <cell>prečenje – crossing</cell>
                            <cell>style</cell>
                            <cell>N</cell>
                            <cell style="text-align:right;">3</cell>
                            <cell>5.2</cell>
                        </row>
                    </table>
                    <p>That the nature and style of male speeches is quite different from the female
                        ones can also be seen from the analysis of the morphosyntactic types of 100
                        highest-ranking keywords for male and female speakers. While nouns are the
                        most frequent category and are used equally frequently by both male and
                        female speakers (44%), many more adjectives were found among the female
                        top-ranking keywords (33% vs. 16%), while the male keywords had more adverbs
                        (11% vs. 4%) and verbs (9% vs. 2%), which again could be related to the
                        roles of the speakers in the parliament. However, given the results of our
                        preliminary work on this dataset (<ref target="#Ljubešić.2018">Ljubešić et al.
                            2018</ref>), during which we removed the speakers that produced most of the linguistic
                        material from the analysis, we see similar trends both in the
                        gender-dependent keyword and morphosyntactic analysis, and are therefore
                        rather in favour of accepting the observed differences as impact of gender
                        and not role.</p>
                </div>
                <div>
                    <head>Language and Party Affiliation in Parlameter</head>
                    <p>Affiliation is recorded for only 113 speakers out of the 1982, however, these
                        are responsible for 79% of the tokens in the corpus. Affiliation is
                        considered as either deputy group membership or a role in the government,
                        where it must be noted that in this version of the corpus the metadata
                        reflect the situation at the beginning of the term and does not keep track
                        of party membership transfers or resignations of ministers or members of
                        parliament. Also, when elected members of parliament were later appointed as
                        ministers, the metadata record only their party affiliation and records as
                        ministers only those who were appointed without being first elected to the
                        parliament. To facilitate more fine-grained and accurate use of the corpus
                        in political science or contemporary history, we plan to refine the metadata
                        for the next release of the corpus, adding also the MP’s membership in the
                        working bodies of the National Assembly, etc. Also, the metadata in the
                        current version of the corpus do not flag the independent members of
                        parliament who do not belong to any of the parliamentary parties and operate
                        in the Independents deputy group, which is why they are not included in our
                        analysis.</p>
                    <p>As Table 10 shows, the most prolific deputy group is the largest opposition
                        party Slovenian Democratic Party (SDS), whose 20 members contributed nearly
                        10 million tokens or 30% of the corpus. SDS is followed by the main
                        governing party, Party of Modern Centre (SMC), whose 42 members contributed
                        7 million tokens or 22% of the corpus. It is interesting to note that in
                        terms of the volume contributed to the corpus on one side and the number of
                        speakers on the other, that this party was the least productive among the
                        main parties, with a ratio of the percentage of tokens to the percentage of
                        speakers (i.e., the relative token to speaker ratio) of 0.54, which means
                        that this party generated a little bit more than a half of the material that
                        would have been expected given their number of speakers and the overall
                        activity of all the speakers. The Left (Levica) and New Slovenia (NSi) rank
                        third and fourth, despite the fact that they had only 6 members each in the
                        parliament, making them the most productive parties with a relative token to
                        speaker ratio of 1.83 and 1.66. The Democratic Party of Pensioners of
                        Slovenia had as many as 12 elected MPs but contributed 1 million tokens less
                        than the two previous parties, which makes them the second least productive
                        party with a relative token to speaker ratio of 0.67.</p>
                    <table rend="table-scroll">
                        <head>Table 10: Distribution of speakers and text production by party
                            affiliation in ParlaMeter with speakers with unknown affiliation
                                removed.<note place="foot" xml:id="ftn11" n="8">The number of
                                speakers per party is calculated from the ParlaMeter dump and
                                deviates slightly from the official member number due to different
                                handling of speakers with multiple roles.</note></head>
                        <row role="label">
                            <cell>Affiliation</cell>
                            <cell>No. of speakers</cell>
                            <cell>% of speakers</cell>
                            <cell>No. of tokens</cell>
                            <cell>% of tokens</cell>
                        </row>
                        <row>
                            <cell>Slovenian Democratic Party Deputy Group (SDS)</cell>
                            <cell style="text-align:right;">20</cell>
                            <cell style="text-align:right;">20%</cell>
                            <cell style="text-align:right;">9.516.651</cell>
                            <cell style="text-align:right;">30%</cell>
                        </row>
                        <row>
                            <cell>Party of Modern Centre Deputy Group (SMC)</cell>
                            <cell style="text-align:right;">42</cell>
                            <cell style="text-align:right;">41%</cell>
                            <cell style="text-align:right;">7.162.719</cell>
                            <cell style="text-align:right;">22%</cell>
                        </row>
                        <row>
                            <cell>The Left Deputy Group (Levica)</cell>
                            <cell style="text-align:right;">6</cell>
                            <cell style="text-align:right;">6%</cell>
                            <cell style="text-align:right;">3.438.194</cell>
                            <cell style="text-align:right;">11%</cell>
                        </row>
                        <row>
                            <cell>New Slovenia – Christian Democrats Deputy Group (NSI)</cell>
                            <cell style="text-align:right;">6</cell>
                            <cell style="text-align:right;">6%</cell>
                            <cell style="text-align:right;">3.370.131</cell>
                            <cell style="text-align:right;">10%</cell>
                        </row>
                        <row>
                            <cell>Social Democrats Deputy Group (SD)</cell>
                            <cell style="text-align:right;">9</cell>
                            <cell style="text-align:right;">9%</cell>
                            <cell style="text-align:right;">2.533.019</cell>
                            <cell style="text-align:right;">8%</cell>
                        </row>
                        <row>
                            <cell>Democratic Party of Pensioners of Slovenia Deputy Group
                                (DeSUS)</cell>
                            <cell style="text-align:right;">12</cell>
                            <cell style="text-align:right;">12%</cell>
                            <cell style="text-align:right;">2.435.884</cell>
                            <cell style="text-align:right;">8%</cell>
                        </row>
                        <row>
                            <cell>Party of Alenka Bratušek Deputy Group (SAB)</cell>
                            <cell style="text-align:right;">4</cell>
                            <cell style="text-align:right;">4%</cell>
                            <cell style="text-align:right;">1.876.294</cell>
                            <cell style="text-align:right;">6%</cell>
                        </row>
                        <row>
                            <cell>Italian and Hugarian National Minorities Deputy Group
                                (IMNS)</cell>
                            <cell style="text-align:right;">2</cell>
                            <cell style="text-align:right;">2%</cell>
                            <cell style="text-align:right;">117.709</cell>
                            <cell style="text-align:right;">0%</cell>
                        </row>
                        <row>
                            <cell>Government</cell>
                            <cell style="text-align:right;">1</cell>
                            <cell style="text-align:right;">1%</cell>
                            <cell style="text-align:right;">1.765.374</cell>
                            <cell style="text-align:right;">5%</cell>
                        </row>
                        <row>
                            <cell>Total</cell>
                            <cell style="text-align:right;">102</cell>
                            <cell style="text-align:right;">100%</cell>
                            <cell style="text-align:right;">32.215.975</cell>
                            <cell style="text-align:right;">100%</cell>
                        </row>
                    </table>
                    <p>Next, we performed a manual analysis of the 100 top-ranking keywords of each
                        political party against the rest of the corpus (see Table 12). These analyses display the
                        distinct properties of one party that are not shared by other parties. Using
                        the concordances, we classified the keywords into the same categories as in
                        Section 4.1, the results of which are summarized in Table 11.</p>
                    <table rend="table-scroll">
                        <head>Table 11: Topics of 100 top-ranking keywords of party members in
                            Parlameter.</head>
                        <row role="label">
                            <cell>Topics</cell>
                            <cell rend="width:100">SMC</cell>
                            <cell rend="width:100">DeSUS</cell>
                            <cell rend="width:100">SD</cell>
                            <cell rend="width:100">SDS</cell>
                            <cell rend="width:100">NSi</cell>
                            <cell rend="width:100">Levica</cell>
                            <cell rend="width:100">SAB</cell>
                        </row>
                        <row>
                            <cell>agriculture, forestry &amp; food</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;"><hi rend="bold">34</hi></cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;"><hi rend="bold">27</hi></cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">0</cell>
                        </row>
                        <row>
                            <cell>culture</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">3</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">1</cell>
                            <cell style="text-align:right;">0</cell>
                        </row>
                        <row>
                            <cell>defense</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;"><hi rend="bold">21</hi></cell>
                            <cell style="text-align:right;">5</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">1</cell>
                        </row>
                        <row>
                            <cell>economy &amp; technology</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">5</cell>
                            <cell style="text-align:right;">1</cell>
                            <cell style="text-align:right;"><hi rend="bold">11</hi></cell>
                            <cell style="text-align:right;"><hi rend="bold">13</hi></cell>
                            <cell style="text-align:right;">1</cell>
                        </row>
                        <row>
                            <cell>education, science &amp; sport</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">4</cell>
                        </row>
                        <row>
                            <cell>environment &amp; spatial planning</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">3</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">6</cell>
                            <cell style="text-align:right;">1</cell>
                            <cell style="text-align:right;">0</cell>
                        </row>
                        <row>
                            <cell>finance</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">2</cell>
                            <cell style="text-align:right;">2</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">6</cell>
                            <cell style="text-align:right;">1</cell>
                            <cell style="text-align:right;">1</cell>
                        </row>
                        <row>
                            <cell>foreign affairs</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">5</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">2</cell>
                            <cell style="text-align:right;">4</cell>
                            <cell style="text-align:right;">3</cell>
                            <cell style="text-align:right;">0</cell>
                        </row>
                        <row>
                            <cell>health</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">3</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">8</cell>
                            <cell style="text-align:right;">1</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">5</cell>
                        </row>
                        <row>
                            <cell>ideology </cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;"><hi rend="bold">15</hi></cell>
                            <cell style="text-align:right;">3</cell>
                            <cell style="text-align:right;">9</cell>
                            <cell style="text-align:right;">0</cell>
                        </row>
                        <row>
                            <cell>infrastructure</cell>
                            <cell style="text-align:right;">1</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">2</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">7</cell>
                            <cell style="text-align:right;">1</cell>
                            <cell style="text-align:right;">1</cell>
                        </row>
                        <row>
                            <cell>interaction/procedural </cell>
                            <cell style="text-align:right;"><hi rend="bold">99</hi></cell>
                            <cell style="text-align:right;"><hi rend="bold">61</hi></cell>
                            <cell style="text-align:right;">14</cell>
                            <cell style="text-align:right;"><hi rend="bold">17</hi></cell>
                            <cell style="text-align:right;">10</cell>
                            <cell style="text-align:right;">4</cell>
                            <cell style="text-align:right;">14</cell>
                        </row>
                        <row>
                            <cell>interior</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">3</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">3</cell>
                            <cell style="text-align:right;">5</cell>
                        </row>
                        <row>
                            <cell>justice</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">1</cell>
                            <cell style="text-align:right;">1</cell>
                            <cell style="text-align:right;">8</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">0</cell>
                        </row>
                        <row>
                            <cell>labour, family &amp; social affairs</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;"><hi rend="bold">13</hi></cell>
                            <cell style="text-align:right;">3</cell>
                            <cell style="text-align:right;">1</cell>
                            <cell style="text-align:right;">4</cell>
                            <cell style="text-align:right;">13</cell>
                            <cell style="text-align:right;">3</cell>
                        </row>
                        <row>
                            <cell>multiple</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">2</cell>
                            <cell style="text-align:right;">6</cell>
                            <cell style="text-align:right;">13</cell>
                            <cell style="text-align:right;">8</cell>
                            <cell style="text-align:right;">17</cell>
                            <cell style="text-align:right;">29</cell>
                        </row>
                        <row>
                            <cell>public administration</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">2</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">5</cell>
                            <cell style="text-align:right;">2</cell>
                            <cell style="text-align:right;">1</cell>
                            <cell style="text-align:right;">7</cell>
                        </row>
                        <row>
                            <cell>style </cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">8</cell>
                            <cell style="text-align:right;">9</cell>
                            <cell style="text-align:right;"><hi rend="bold">22</hi></cell>
                            <cell style="text-align:right;">11</cell>
                            <cell style="text-align:right;"><hi rend="bold">33</hi></cell>
                            <cell style="text-align:right;"><hi rend="bold">29</hi></cell>
                        </row>
                        <row>
                            <cell>Total</cell>
                            <cell style="text-align:right;">100</cell>
                            <cell style="text-align:right;">100</cell>
                            <cell style="text-align:right;">100</cell>
                            <cell style="text-align:right;">100</cell>
                            <cell style="text-align:right;">100</cell>
                            <cell style="text-align:right;">100</cell>
                            <cell style="text-align:right;">100</cell>
                        </row>
                    </table>
                    <p>Unsurprisingly, due to the role of the main governing party SMC, practically
                        all their top-ranking keywords are interactional elements with the other
                        speakers or have a procedural nature (e.g., <hi rend="italic">navzoč –
                            present, glasovanje – voting, amandma – amendment</hi>). That DeSUS is a
                        single-issue party can be seen from their keywords, which, apart from a
                        surprisingly high proportion of interactive keywords, belong almost
                        exclusively to the semantic field of retirement and pension (e.g., <hi
                            rend="italic">regres – holiday pay, valorizirati – to revalue, gmoten –
                            material</hi>). Interestingly, even the topics of foreign affairs and
                        culture are nearly completely absent from their keyword list, despite the
                        fact that these ministers came from their party, suggesting that these
                        topics are more or less evenly shared with other parties. SD, the third
                        coalition party, clearly display their priority areas of agriculture,
                        forestry and food (e.g., <hi rend="italic">teran – Teran wine, fermentiran –
                            fermented, kmetovati – to farm</hi>) and defence (e.g., <hi
                            rend="italic">vojakinja – female soldier, neeksplodiran – unexploded,
                            strelivo – ammunition</hi>), which can be traced back to their
                        ministers.</p>
                    <p>The largest opposition party SDS stands out from the rest by the amount of
                        ideological keywords identified among the top-ranking keywords (e.g. <hi
                            rend="italic">tranzicijski – transitional, totalitarizem – totalitarism,
                            lustracija – lustration</hi>). NSi and Levica, the opposition parties
                        with the same number of MPs but from the opposite ends of the political
                        spectrum, both address the widest variety of issues (their keywords were
                        classified into 13 out of 18 topics). The topics with nearly equal number of
                        completely opposite keywords are economy and technology (e.g. <hi
                            rend="italic">soupravljanje – co-management</hi> for Levica vs.<hi
                            rend="italic"> espejevec – private entrepreneur</hi> for NSi). While NSi
                        mostly talks about the local issues related to their constituencies (e.g.
                            <hi rend="italic">samooskrba – self-sufficiency, posekan – cut down,
                            obdelovati - farm</hi>), Levica stands out by signature stylistic
                        devices which range from very informal (e.g. <hi rend="italic">šlamastika –
                            pickle, gazda – informal for master, nabijati – to bang on</hi>) to
                        highly elevated registers (e.g. <hi rend="italic">nemara – perhaps, onkraj –
                            beyond, ducat – dozen</hi>) and displays the largest proportion of
                        ideological vocabulary next to SDS (e.g. <hi rend="italic">tovarišica –
                            camerade, revizionizem – revisionism, imperializem – imperialism</hi>).
                        SAB seems to stand out by a predominantly (local)
                        administrative/procedural/governance vocabulary (e.g. <hi rend="italic"
                            >proporcionalen – proportional, odpoklic – recall, dvokrožen –
                            double-ballot</hi>) as well as a discursive, informal style of
                        distinctly negative sentiment, which is characteristic of one of their
                        members Vinko Möderndorfer (e.g. <hi rend="italic">rešpektiram - honour,
                            kozlarija - nonsense, zmazek - disaster</hi>).</p>
                    <table rend="table-scroll">
                        <head>Table 12: 100 top-ranking keywords per political party, taking into
                            account lowercased lemmas, computed against the rest of the Parlameter
                            corpus and sorted according to their keyness score.</head>
                        <row>
                            <cell>SMC</cell>
                            <cell>navzoč, e-klopa, udis, roberto, prekinjen, podprogram, prehajati,
                                lipicer, kustec, katerim, grebenšek, h, battelli, epi, stanujoč,
                                obveščati, krajnc, zaključevati, predajati, pričenjati, sodin,
                                porotnica, simona, franc, glasovati, obrazložitev, moderen, kolegij,
                                tanko, postopkovno, potisek, končevati, nuklearen, brezpredmeten,
                                ep, jernej, dneven, počkaj, glasovnica, mandatno-volilen, vojko,
                                jožef, trček, bojan, neusklajen, tilen, prelog, ustavnorevizijski,
                                odločanje, arko, nadomeščati, he, branislav, matej, jože,
                                glasovanje, prvopodpisan, e-klop, glas, dopolnjen, porotnik,
                                terminski, vložen, simono, franca, pogačnik, erman, ugotavljati,
                                klanjšček, smc, stebernak, nepovezan, jana, žibert, bien, matjaž,
                                šircelj, fajt, postopkoven, lilijana, skrajšan, monetaren,
                                prekinjati, poslovniški, matičen, bah, mag., marinka, šergan, lenča,
                                vraničar, , izvolitev, karlovšek, razpravljavec, predstavnica,
                                razširitev, anita, amandma, nadomeščanje, zame</cell>
                        </row>
                        <row>
                            <cell>DeSUS</cell>
                            <cell>meglič, črnak, pripadajoč, desus, pogačar, dasiravno, vukov,
                                valenca, požun, inferioren, upajoč, mӧderndorfer, pregrešiti,
                                divjak, valorizacija, korva, rezime, kkr, kuzmanič, marijan,
                                upokojen, vuk, mehčati, pojbič, košnik, bližnjevzhoden,
                                zaposlovalen, punkcija, žmavc, milojka, zaporedno, celarc,
                                konzularen, xv., marija, kolar, bačič, erika, grošelj, rubelj,
                                minski, lukić, rudarski, zadržanost, mirjam, godec, valorizirati,
                                sng, tašner, kušar, brinovšek, invalid, zamrznitev, tedaj,
                                dvoživkarstvo, nina, pirnat, dekleva, merše, federacija, nada,
                                klanjšček, protiukrep, jelka, ogrizek, gmoten, kisikov, ivo, majcen,
                                izvoliti, iva, dimic., modifikacija, ljubič, žan, upokojenec,
                                prikrajšanje, prečitati, šimenko, jasna, izplačevanje, zipro,
                                korpič, antonija, premožen, sapa, voljč, suzana, dimic, vesni,
                                lukič, zdravko, irena, teja, sluga, regres, ruše, janja, razparava,
                                trivialen</cell>
                        </row>
                        <row>
                            <cell>SD</cell>
                            <cell>izčistiti, genetsko, izčiščen, vezava, surov, demokrat, vojakinja,
                                gorsko-hribovski, travinje, potočan, vadišče, razprodati, hip,
                                služenje, hišniški, faktorski, pripadnica, stiskanje, zmogljivost,
                                omd-, kočevski, anhovo, vrtojba, peterica, mineralen, maji, krušen,
                                kmetica, ciolos, vklop, deti, socialdemokratski, formacijski, teran,
                                selnica, kloniran, urszr, obramben, salonit, radeče, mlekarna,
                                neperspektiven, marjana, popolnjevanje, omd, odzivanje, vrtnina,
                                vselej, zorganizirati, vikariat, eutm, pokolp, govedo, rogaška,
                                klirinški, razprodaja, surovina, ksenija, vinko, izčiščevati,
                                konzumen, refundirati, pripadnik, neeksplodiran, social, uokviriti,
                                žito, kfor, prebroditi, konvergenca, grajski, brecelj, hogan,
                                administriranje, trader, kočevsko, h4, primož, korenjak, bržkone,
                                kmetovati, obrtništvo, vojska, strelivo, poveljevanje, snežnik,
                                plasiran, gorsko, refundacija, hribovski, proizvodnja, subvencijski,
                                dacian, missing, kmetija, opazovati, voditeljstvo, kramar,
                                fermentiran, viher</cell>
                        </row>
                        <row>
                            <cell>SDS</cell>
                            <cell>islam, fišer, mark, svinjarija, levičarski, odnosno, medical, kb,
                                demokratski, odnosen, lenart, zemljarič, kučan, zalar, bordojski,
                                kb1909, morišče, zločin, iznenada, velikanski, tomos, kangler,
                                patria, multikulti, masleša, prvorazreden, škrlec, udba, stožice,
                                tranzicijski, šef, praprotnik, moralno-etičen, ilegalno, zločinski,
                                bomben, peticija, porsche, srebrenica, cener, umor, totalitaren,
                                pokrasti, totalno, genocid, drugorazreden, tamle, erdogan, judikat,
                                vega, ribičič, privilegiranec, komunističen, razorožitev,
                                varnostnoobveščevalen, žilen, opornica, indičen, škandal, ornik,
                                lustracija, poljanski, posavje, počenjati, furlan, pobiti, sevnica,
                                ubog, janković, krkovič, npu, deček, opran, bojda, blamaža, lopov,
                                toplak, kerševan, slikati, bmw, veselo, amen, totalen, komunizem,
                                totalitarizem, obsoditi, preiskati, bedarija, udbovski, pomorjen,
                                turnšek, vladavina, zlagati, šoping, vpiti, ukc, avion, klemenčič,
                                koruptiven, neumnost</cell>
                        </row>
                        <row>
                            <cell>NSI</cell>
                            <cell>komunalno, socialno-tržen, marn, božičnica, zidanica, egalitaren,
                                krščanski, espejevec, fantastičen, ekstrapolacija, planšarija,
                                medparlamentaren, kamnik, demografija, kapica, bundestag,
                                podonavski, bajuk, samoprispevek, vinogradnik, razlastiti, vipavski,
                                prijateljstvo, kanalizacija, aksiom, pomurje, bogataš, ferenc,
                                parcelacija, optimirati, oljčnik, komenda, polnost, vrtalec, ozp,
                                pomurski, ikt, simulirati, dimniški, parlamentarec, podčrtovati,
                                artikulirati, obžalovati, omizje, cerknica, polčas, ginijev,
                                zbirno-reciklažen, brutalno, prekladanje, širokogruden,
                                absorpcijski, šinko, dolenjsko, lestev, vodovod, rodnost, traktor,
                                notranjska, opn, posekan, vinograd, zaraščati, odvajanje, loža,
                                kristjan, davno, regresen, lovrenčič, firefox, parcela, akrapovič,
                                obdelovati, obratovalnica, zpn, terezija, mihael, odlašati,
                                peskovci, vamp, notranjski, ovs, copatek, veselica, upniški,
                                penzija, hala, digitalen, goljuf, identifikacijski, mohar,
                                postoriti, goveji, prirasti, splačati, samooskrba, prazniti,
                                odstaven, todorić, pozor</cell>
                        </row>
                        <row>
                            <cell>Levica</cell>
                            <cell>penez, tuliti, vračljivost, ubesedovati, onkraj, bajta,
                                neoliberalen, prečiti, nemara, ducat, socialist, delavski,
                                imperialističen, zvrniti, desnica, navsezadnje, blazen, sociolog,
                                šiht, soupravljanje, zategovanje, mandarin, kapitalizem, strokovec,
                                šlamastika, blazno, kapitalističen, tovarišica, ubesedovanje,
                                revizionizem, prekarnost, vzdržan, gazda, profit, sodržavljanka,
                                izkoriščevalski, represija, protisocialen, nabijati, prekaren,
                                metafora, soodločanje, periferen, agregaten, cinkarna, rezilen,
                                mezda, amandmiranje, demokratizacija, ips, efektivno, natov, levica,
                                belokranjec, bučka, zaposlovalec, izhajajoč, reven, požegnati,
                                profiten, marof, ics, minimalec, podrejati, imperializem,
                                kapitalist, silno, prekarizacija, odpustek, sodržavljan,
                                noveliranje, versus, zvo, bolgarski, zastraševanje, informatičen,
                                metaforično, režati, razreden, ciničen, striči, ropotati,
                                korporacija, rasizem, redistributiven, pregrevanje, trade, rez, omv,
                                prekeren, deregulacija, štacuna, grosist, znoreti, penzion,
                                oligopolen, jahati, fevdalizacija, sočasno, prečenje</cell>
                        </row>
                        <row>
                            <cell>SAB</cell>
                            <cell>svojevrsten, večnost, mvk, pooblaščati, that's, diskvalifikacija,
                                prekleto, bla, resnica, fakt, naglas, odpoklic, zavezništvo, minis,
                                četrten, trapast, istrabenz, zasebništvo, zamah, dvokrožen,
                                ramšakov, diskvalificirati, športnica, drk, štos, cetera, ups,
                                nedostojno, redarski, strojan, nijz, proporcionalen, ma, evtanazija,
                                zanič, bloudkov, etc, mv, vsakič, naturalizacija, zamera, nor,
                                listnica, smešiti, dispečiranje, diskusija, strašansko, nefer,
                                diskutirati, regres, sprevržen, r., zavrtanik, večen, hiv,
                                nekorektno, ubežati, imperativen, presedan, prastrah, dinozaver,
                                halo, ekstremističen, rimskokatoliški, mvk-, namenoma, zmazek,
                                gedrih, somalijski, zamahniti, nonstop, kostanjevec, policaj,
                                domišljati, prohibicija, znakoven, paradoks, barantati, et, hecen,
                                močvirnik, avans, nametati, preprosto, prepričevati, podžupan,
                                traparija, kričati, ekstra, non-stop, telovadba, stefanovič,
                                el-zoheiry, ničkolikokrat, kozlarija, prvenstvo, boh, domišljija,
                                rešpektiram</cell>
                        </row>
                    </table>
                </div>
                <div>
                    <head>The Zeitgeist of ParlaMeter</head>
                    <p>Finally, we observe the zeitgeist of the Parlameter corpus by comparing it
                        with its older and smaller cousin, the SlovParl corpus, which contains
                        material from the period of Slovenia’s independence (1990-1992). First, we
                        created keyword lists with each of the two corpora acting as a focus and a
                        reference corpus (see Table 14). We then manually classified 100 top-ranking keywords into
                        the same categories as in Section 4.1, with the following additional
                        categories:</p>
                    <list type="unordered">
                        <item>abbreviations (<hi rend="italic">etc., Mr.</hi>), which were in use in
                            the SlovParl but are no longer the convention in the ParlaMeter
                            transcriptions of the parliamentary sessions</item>
                        <item>IT vocabulary (<hi rend="italic">internet, web</hi>), which at the
                            time of SlovParl was not yet widespread.</item>
                    </list>
                    <p>If we disregard the differences in the mentions of the active politicians in
                        the two periods, which are the most frequent category, most of the
                        top-ranking keywords in both corpora belong to procedural and legal issues,
                        which are clearly different in a newly established state and a state
                        integrated in the EU (see Table 13). Apart from that, many more
                        topics are identified in the Parlameter corpus, such as economy and
                        technology, foreign affairs and health, which again is not surprising as a
                        well-established state will need to take care of a full spectrum of
                        issues.</p>
                    <table rend="table-scroll">
                        <head>Table 13: Topics of the 100 top-ranking keywords in Parlameter and
                            SlovParl.</head>
                        <row role="label">
                            <cell>Topic</cell>
                            <cell>ParlaMeter</cell>
                            <cell>SlovParl</cell>
                        </row>
                        <row>
                            <cell>abbreviation</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">3</cell>
                        </row>
                        <row>
                            <cell>defence</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">1</cell>
                        </row>
                        <row>
                            <cell>economy &amp; technology</cell>
                            <cell style="text-align:right;">6</cell>
                            <cell style="text-align:right;">2</cell>
                        </row>
                        <row>
                            <cell>education</cell>
                            <cell style="text-align:right;">1</cell>
                            <cell style="text-align:right;">0</cell>
                        </row>
                        <row>
                            <cell>environment &amp; spatial planning</cell>
                            <cell style="text-align:right;">2</cell>
                            <cell style="text-align:right;">0</cell>
                        </row>
                        <row>
                            <cell>finance</cell>
                            <cell style="text-align:right;">12</cell>
                            <cell style="text-align:right;">7</cell>
                        </row>
                        <row>
                            <cell>foreign affairs</cell>
                            <cell style="text-align:right;">4</cell>
                            <cell style="text-align:right;">0</cell>
                        </row>
                        <row>
                            <cell>health</cell>
                            <cell style="text-align:right;">4</cell>
                            <cell style="text-align:right;">0</cell>
                        </row>
                        <row>
                            <cell>multiple</cell>
                            <cell style="text-align:right;">0</cell>
                            <cell style="text-align:right;">1</cell>
                        </row>
                        <row>
                            <cell>informal vocabulary</cell>
                            <cell style="text-align:right;">2</cell>
                            <cell style="text-align:right;">0</cell>
                        </row>
                        <row>
                            <cell>infrastructure</cell>
                            <cell style="text-align:right;">1</cell>
                            <cell style="text-align:right;">0</cell>
                        </row>
                        <row>
                            <cell>interior</cell>
                            <cell style="text-align:right;">2</cell>
                            <cell style="text-align:right;">0</cell>
                        </row>
                        <row>
                            <cell>it vocabulary</cell>
                            <cell style="text-align:right;">2</cell>
                            <cell style="text-align:right;">0</cell>
                        </row>
                        <row>
                            <cell>justice</cell>
                            <cell style="text-align:right;">1</cell>
                            <cell style="text-align:right;">0</cell>
                        </row>
                        <row>
                            <cell>labour, family &amp; social affairs</cell>
                            <cell style="text-align:right;">3</cell>
                            <cell style="text-align:right;">0</cell>
                        </row>
                        <row>
                            <cell>legal/procedural</cell>
                            <cell style="text-align:right;">14</cell>
                            <cell style="text-align:right;">21</cell>
                        </row>
                        <row>
                            <cell>politician/party</cell>
                            <cell style="text-align:right;">46</cell>
                            <cell style="text-align:right;">65</cell>
                        </row>
                        <row>
                            <cell>Total</cell>
                            <cell style="text-align:right;">100</cell>
                            <cell style="text-align:right;">100</cell>
                        </row>
                    </table>
                    <table rend="table-scroll">
                        <head>Table 14: 100 top-ranking keywords in Parlameter contrasted against
                            SlovParl and vice versa.</head>
                        <row>
                            <cell>ParlaMeter</cell>
                            <cell>evro, eu, desus, smc, cerar, sdh, dutb, möderndorfer, trček,
                                bratušek, sds, gorenak, spleten, mandatno-volilen, deležnik,
                                koalicijski, kordiš, anja, matej, direktiva, postopkovno, kpk,
                                okoljski, kohezijski, javnofinančen, tonin, bdp, veber, naročanje,
                                korupcija, bah, jani, levica, nlb, unija, tanko, migrantski,
                                povprečnina, vatovec, čakalen, pojbič, migrant, varuhinja, prikl,
                                žnidar, šircelj, varuh, zujf, teš, violeta, tomić, mahnič, ddv,
                                digitalen, han, istospolen, lisec, telekom, vrtovec, dars, žibert,
                                novela, globa, zorčič, vajeništvo, godec, trošarina, čuš, okrožen,
                                internet, prvopodpisan, schengenski, matić, trajnosten, gašperšič,
                                jurša, podneben, dz, lipica, lah, podizvajalec, žan, uredba,
                                blagajna, okej, verbič, ferluga, dobovšek, mramor, računski,
                                vraničar, zakonik, ljudmila, nevladen, postopkoven, preiskovalen,
                                direktorat, hanžek, muršič, irgl</cell>
                        </row>
                        <row>
                            <cell>SlovParl</cell>
                            <cell>delegat, oz., glavič, družbenopolitičen, gros, dinar, republiški,
                                usklajevalen, din, skupščinski, starman, zakonjšek, alinea,
                                vzdržati, potrč, vzdržan, kolešnik, izvršen, lukač, sklepčnost,
                                pintar, npr., navzočnost, buser, arzenšek, feltrin, atelšek,
                                liberalno-demokratski, smole, razpravljalec, školč, zvezen,
                                schwarzbartl, delegatski, tomšič, zagožen, železarna, jakič, gošnik,
                                skupščina, polajnar, tomažič, muren, štefančič, lastninjenje,
                                deviza, zlobec, šter, demos, dretnik, kreditno-monetaren, sdp,
                                čimprej, nabornik, devizen, marka, delegatka, sekretariat, bekeš,
                                deželak, klavora, peterle, črnej, halb, kreft, šonc, lokar,
                                gradišar, šeligo, juri, perko, sfrj, voljč, požarnik, semolič,
                                volilec, kramarič, bučar, plebiscit, dvornik, tomše, grašič, tolar,
                                starc, pregelj, podobnik, pozsonec, balažic, g., moge, medzborovski,
                                jaša, razdevšek, rojec, šetinc, urbančič, lavtižar-bebler, vivod,
                                anka, šešok</cell>
                        </row>
                    </table>
                    <p>To illustrate differences in the zeitgeist of both corpora, we extracted the
                        strongest collocations of the following 3 expressions, which are frequent in
                        both corpora, taking into account the collocation candidates that appear at
                        least 5 times immediately next (left or right) to the headword, and analysed
                        the first 50 collocation candidates:</p>
                    <list type="unordered">
                        <item>adjective <hi rend="italic">južen – southern</hi>,</item>
                        <item>noun <hi rend="italic">kriza – crisis</hi>, and</item>
                        <item>verb <hi rend="italic">sprožiti – trigger</hi>.</item>
                    </list>
                    <table rend="table-scroll">
                        <head>Table 15: Comparison of collocations of <hi rend="italic">južen</hi>,
                                <hi rend="italic">kriza</hi> and <hi rend="italic">sprožiti</hi> in
                            SlovParl and ParlaMeter. Topics or morphosyntactic categories are
                            indicated in square brackets, and new collocations in Parlameter are
                            highlighted in bold.</head>
                        <row>
                            <cell/>
                            <cell role="label">SlovParl</cell>
                            <cell role="label">ParlaMeter</cell>
                        </row>
                        <row>
                            <cell>južen</cell>
                            <cell><p>178 (14.03 per million)</p><list type="unordered">
                                    <item>[GEOGRAPHY]: koreja, primorska, amerika</item>
                                    <item>[CONCRETE]: meja, železnica </item>
                                    <item>[METAPHORICAL]: trg, del, stran, republika</item>
                                </list></cell>
                            <cell><p>910 (22.20 per million)</p><list type="unordered">
                                    <item>[GEOGRAPHY]:<hi rend="bold"> afrika</hi>, koreja, <hi
                                            rend="bold">sredozemlje</hi>, amerika, <hi rend="bold"
                                            >tirolska</hi>, <hi rend="bold">sudan</hi>, <hi
                                            rend="bold">tirolec</hi>, <hi rend="bold">koroška</hi>,
                                            <hi rend="bold">italija</hi>, <hi rend="bold"
                                            >evropa</hi>, <hi rend="bold">nemčija</hi>, <hi
                                            rend="bold">slovenija</hi></item>
                                    <item>[CONCRETE]: meja, <hi rend="bold">obvoznica</hi>, <hi
                                            rend="bold">tok, sadje, odsek, </hi>železnica, <hi
                                            rend="bold">ulica</hi></item>
                                    <item>[METAPHORICAL]:<hi rend="bold"> sosedstvo, soseda, sosed,
                                            soseščina</hi>, del, trg, <hi rend="bold">projekt,
                                            stran, država, republika</hi></item>
                                </list></cell>
                        </row>
                        <row>
                            <cell>sprožiti</cell>
                            <cell><p>548 (43.19 per million)</p><list type="unordered">
                                    <item>[CONCRETE]: spor, postopek, proces, interpelacijo,
                                        arbitražo</item>
                                    <item>[METAPHORICAL]: reakcijo, polemiko, akcijo, mehanizem,
                                        pobudo, vprašanje, diskusijo, zahtevo, spremembo, razpravo,
                                        zadevo</item>
                                </list></cell>
                            <cell><p>1,569 (38.28 per million)</p><list type="unordered">
                                    <item>[CONCRETE]: postopek, spor, <hi rend="bold"
                                        >preiskavo</hi>, <hi rend="bold">alarm</hi>, process<hi
                                            rend="bold">, ovadbo, tožbo</hi>, <hi rend="bold"
                                            >stečaj</hi>, <hi rend="bold">prijavo</hi>, <hi
                                            rend="bold">revizijo</hi></item>
                                    <item>[METAPHORICAL]:<hi rend="bold"> plaz</hi>, mehanizem,
                                        polemiko, reakcijo, <hi rend="bold">kepo</hi>, pobudo,
                                        akcijo, <hi rend="bold">iniciativo</hi>, <hi rend="bold"
                                            >aktivnost</hi>, <hi rend="bold">debato</hi>, <hi
                                            rend="bold">kampanjo</hi></item>
                                </list></cell>
                        </row>
                        <row>
                            <cell>kriza</cell>
                            <cell><p>1,114 (87.79 per million)</p><list type="unordered">
                                    <item>[GEOGRAPHY]: jugoslovanska, zalivska kriza</item>
                                    <item>[POLITICS]: vladna, gospodarska, parlamentarna, ekonomska,
                                        ustavna, politična kriza</item>
                                    <item>[METAPHORICAL]: duševna, socialna, razvojna, družbena
                                        kriza</item>
                                    <item>[MODIFIERS]: huda, moralna, globoka, katastrofalna,
                                        velika, težka kriza</item>
                                    <item>[NOUNS]: reševanje, razrešitev, rešitev, razplet,
                                        razreševanje krize</item>
                                    <item>[VERBS]: prebroditi, poglabljati, razrešiti, povzročiti,
                                        rešiti, začeti krizo</item>
                                </list></cell>
                            <cell><p>8,062 (196.69 per million)</p><list type="unordered">
                                    <item>[GEOGRAPHY]: ukrajinska, grška, svetovna, globalna
                                        kriza</item>
                                    <item>[POLITICS]:<hi rend="bold"> migrantska, begunska</hi>,
                                        gospodarska, finančna, <hi rend="bold">migracijska</hi>, <hi
                                            rend="bold">humanitarna</hi>, ekonomska, <hi rend="bold"
                                            >dolžniška</hi>, bančna, politična, <hi rend="bold"
                                            >begunsko-migrantska</hi>, <hi rend="bold">mlečna</hi>,
                                            <hi rend="bold">javnofinančna</hi>, <hi rend="bold"
                                            >varnostna</hi>, kapitalistična kriza</item>
                                    <item>[METAPHORICAL]: <hi rend="bold">socialna</hi> kriza</item>
                                    <item>[MODIFIERS]: huda, <hi rend="bold">kompleksna</hi>,
                                        globoka, velika kriza</item>
                                    <item>[NOUNS]: <hi rend="bold">začetek</hi>, breme, <hi
                                            rend="bold">izbruh</hi>, <hi rend="bold">nastop</hi>,
                                            <hi rend="bold">posledica</hi>, <hi rend="bold"
                                            >nastanek</hi>, reševanje, <hi rend="bold">obdobje</hi>
                                        krize</item>
                                    <item>[VERBS]: kriza <hi rend="bold">nastopi</hi>, <hi
                                            rend="bold">nastane</hi>, <hi rend="bold">pokaže</hi>,
                                            <hi rend="bold">udari</hi> // povzročiti, reševati,
                                        poglabljati krizo</item>
                                </list></cell>
                        </row>
                    </table>
                    <p>As can be seen from Table 15, the biggest difference in relative frequency
                        between the two corpora is observed for the noun <hi rend="italic"
                            >crisis</hi>, which is more than twice as frequent in Parlameter
                        compared to SlovParl, despite the fact that the early 1990s were marked by a
                        long and bloody war in the Balkans as well as severe economic hardship
                        related to change of the economic and political system. Parlameter contains
                        the largest number of new collocation candidates that indicate issues that
                        were not present in the period of SlovParl, such as <hi rend="italic"
                            >migrant/refugee/humanitarian/security crisis</hi>. On the other hand,
                        the secession period was marked by <hi rend="italic"
                            >constitutional/parliamentary crisis</hi>, which are not observed in the
                        late 2010s. Interestingly, SlovParl contains more metaphorical collocations
                        which are not prominent in the Parlameter corpus, such as <hi rend="italic"
                            >mental/social/welfare/moral crisis</hi>. Collocations containing
                        geographical terms indicate the key political, military and social hotspots
                        from that period: <hi rend="italic">Yugoslav/Gulf crisis</hi> in early
                        1990s, and <hi rend="italic">Ukraine/Greek crisis</hi> in late 2010s. An
                        analysis of key verbal collocates with the noun crisis reveals another
                        interesting observation, which is that in SlovParl, all the verbs are about
                        solving the crisis (<hi rend="italic">to solve/resolve/untangle the
                            crisis</hi>), whereas in Parlameter, politicians mostly use verbs that
                        discuss the beginnings or deepening of the crisis (<hi rend="italic">crisis
                            sets in/appears/starts/hits</hi>, <hi rend="italic">to trigger/deepen
                            the crisis</hi>).</p>
                    <p>The verb <hi rend="italic">trigger</hi> is the only one of the three examples
                        that has a higher relative frequency in SlovParl but despite the greater
                        relative frequency, Parlameter contains more collocation candidates, both in
                        the direct and the metaphorical sense, such as <hi rend="italic">trigger an
                            investigation/indictment/lawsuit</hi>, or <hi rend="italic">trigger an
                            audit/bankruptcy</hi>.</p>
                    <p>It is interesting to note that the adjective <hi rend="italic">southern</hi>
                        is more frequently used and has more collocations in general in ParlaMeter
                        despite the fact that in the secession period, links to the rest of former
                        Yugoslavia were probably stronger and there were probably more open issues,
                        signalling that certain topics were probably not discussed on purpose until
                        the issues were resolved and the relations were established again.
                        Especially interesting are all the neighbour-related collocations, which
                        only appear in the Parlameter corpus, 30 years after Slovenia left
                        Yugoslavia: <hi rend="italic">southern neighbour / neighbours /
                            neighbourhood / market / fruit, </hi>despite the fact that
                        geographically speaking, the former Yugoslav republics, spread south-east,
                        not south of Slovenia. The one major unsettled issue is the border with
                        Croatia that has even been subject of international arbitration during the
                        parliamentary term included in the Parlameter corpus, which is reflected in
                        the top-ranking strong collocation <hi rend="italic">južna meja/southern
                            border</hi>.</p>
                </div>
            </div>
            <div>
                <head>Conclusions</head>
                <p>In this paper we presented the Parlameter corpus of contemporary Slovene
                    parliamentary proceedings. We analysed the linguistic production of the speakers
                    according to the morphosyntactic annotation of the corpus and the speaker
                    metadata.</p>
                <p>We have shown that despite the fact that the material included in the corpus
                    spans the period 2014-2018, the bulk of the material was recorded in the first
                    two full years of the parliament. When contrasted against general Slovene,
                    parliamentary speeches contain more present tense forms and personal and
                    demonstrative pronouns. A comparison of male and female speakers shows that
                    while male speakers take the floor more often than their female colleagues, it
                    is the female speakers who make longer contributions. Female speakers mostly
                    address the topics of <hi rend="italic">health</hi>, <hi rend="italic">labour,
                        family and social affairs</hi>, <hi rend="italic">public
                    administration</hi>, and <hi rend="italic">education, science and sport</hi>,
                    while most of the keywords from male speakers do not belong to specific topics,
                    which indicate a more discursive, debating style of the male speakers. When
                    comparing speeches according to party lines, the most prolific deputy group is
                    the largest opposition party Slovenian Democratic Party (SDS) while the ruling
                    Party of Modern Centre (SMC) is the least prolific one. The most productive
                    parties with a relative token to speaker ratio are the smallest parties in this
                    parliamentary term, the Left (Levica) and New Slovenia (NSi). The largest
                    opposition party SDS stands out from the rest by the large amount of ideological
                    keywords while Levica stands out by signature stylistic devices which range from
                    very informal to highly elevated. NSi and Levica, the opposition parties with
                    the same number of MPs but from the opposite ends of the political spectrum,
                    both address the widest variety of issues. With keywords belonging almost
                    exclusively to the semantic field of retirement and pension, DeSUS lies on the
                    other end of the spectrum as a single-issue party. A comparison with the
                    SlovParl corpus of parliamentary debates from the period of Slovenia’s
                    independence, many more topics are identified in Parlameter, which
                    understandable as a well-established state will need to take care of a full
                    spectrum of issues whereas a new state will mostly be dealing with procedural
                    issues and the new legislature. In the future we plan to enrich the corpus with
                    additional session records of previous and the most recent parliamentary terms
                    as well as with additional metadata available through the Parlameter system,
                    such as voting data and accepted legislation, which are also valuable for
                    addressing a number of research questions in various research communities. In
                    parallel, we also plan to develop comparable corpora from other parliaments,
                    starting with Croatian and Bosnian.</p>
            </div>
            <div>
                <head>Acknowledgments</head>
                <p>The work described in this paper was funded by the Slovenian Research Agency
                    within the national basic research project “Resources, methods, and tools for
                    the understanding, identification, and classification of various forms of
                    socially unacceptable discourse in the information society” (J7-8280, 2017-2019)
                    and the Slovenian research infrastructure for language resources and technology
                    CLARIN.SI.</p>
            </div>
        </body>
        <back>
            <div type="bibliography">
                <head>Sources and Literature</head>
                <div>
                    <head>Literature:</head>
                    <listBibl>
                        <bibl xml:id="Bayley.2014">Bayley, Paul. 2014. “Introduction: The whys and
                            wherefores of analyzing parliamentary discourse.” In <hi rend="italic"
                                >Cross-Cultural Perspectives on Parliamentary Discourse</hi>, edited
                            by Paul Bayley, 1–44. Amsterdam, Philadelphia: John Benjamins
                            Publishing.</bibl>
                        <bibl xml:id="Cheng.2015">Cheng, Jennifer E. 2015. “Islamophobia,
                            Muslimophobia or racism? Parliamentary discourses on Islam and Muslims
                            in debates on the minaret ban in Switzerland.” <hi rend="italic"
                                >Discourse &amp; Society</hi> 26 (5): 562–86.</bibl>
                        <bibl xml:id="Chester.1962">Chester, Daniel Norman, and Nona Bowring. 1962.
                                <hi rend="italic">Questions in Parliament.</hi> Oxford: Clarendon
                            Press.</bibl>
                        <bibl xml:id="Dijk.2010">van Dijk, Teun A. 2010. “Political identities in
                            parliamentary debates.” In <hi rend="italic">European Parliaments under
                                Scrutiny: Discourse strategies and interaction practices</hi>,
                            edited by Cornelia Ilie, 29–56. Amsterdam, Philadelphia: John Benjamins
                            Publishing. </bibl>
                        <bibl xml:id="Fišer.Lenardič.2018">Fišer, Darja, and Jakob Lenardič. 2018.
                            “Parliamentary Corpora in the CLARIN infrastructure.” In <hi
                                rend="italic">Selected papers from the CLARIN Annual Conference
                                2017</hi>, edited by Maciej Piasecki, 75–85. Accessed February 27,
                            2019. <ref target="http://www.ep.liu.se/ecp/147/007/ecp17147007.pdf"><hi
                                    rend="Internet_Link"><seg style="font-size:10pt"
                                        >http://www.ep.liu.se/ecp/147/007/ecp17147007.pdf</seg></hi></ref>.</bibl>
                        <bibl xml:id="Fišer.2013">Fišer, Darja, and Vojko Gorjanc. 2013. <hi
                                rend="italic">Korpusna analiza</hi>. Ljubljana: Znanstvena založba
                            Filozofske Fakultete.</bibl>
                        <bibl xml:id="Fišer.Ljubešić.2018">Fišer, Darja, Nikola Ljubešić, and Tomaž
                            Erjavec. 2018. “The Janes project: language resources and tools for
                            Slovene user generated content.” <hi rend="italic">Language Resources
                                and Evaluation</hi>. In press. <ref
                                target="https://doi.org/10.1007/s10579-018-9425-z"><hi
                                    rend="Internet_Link"><seg style="font-size:10pt"
                                        >https://doi.org/10.1007/s10579-018-9425-z</seg></hi></ref>.</bibl>
                        <bibl xml:id="Franklin.1993">Franklin, Mark N., and Philip Norton. 1993. <hi
                                rend="italic">Parliamentary Questions: For the Study of Parliament
                                Group</hi>. Oxford: Oxford University Press.</bibl>
                        <bibl xml:id="Hirst.2014">Hirst, Graeme, Vanessa Wei Feng, Christopher
                            Cochrane, and Nona Naderi. 2014. “Argumentation, Ideology, and Issue
                            Framing in Parliamentary Discourse.” In <hi rend="italic">ArgNLP</hi>.
                            Accessed 27 February 2019. <ref
                                target="ftp://www.cs.toronto.edu/pub/gh/Hirst-etal-Bertinoro-2014.pdf"
                                    ><hi rend="Internet_Link"><seg style="font-size:10pt"
                                        >ftp://www.cs.toronto.edu/pub/gh/Hirst-etal-Bertinoro-2014.pdf</seg></hi></ref>.</bibl>
                        <bibl xml:id="Hughes.2013">Hughes, Lorna M., Paul S. Ell, Gareth A.G.
                            Knight, and Milena Dobreva. 2013. “Assessing and measuring impact of a
                            digital collection in the humanities: An analysis of the SPHERE
                            (Stormont Parliamentary Hansards: Embedded in Research and Education)
                            Project.” <hi rend="italic">Digital Scholarship in the Humanities
                            </hi>30 (2): 183–98.</bibl>
                        <bibl xml:id="Ihalainen.2016">Ihalainen, Pasi, Cornelia Ilie, and Kari
                            Palonen. 2016. <hi rend="italic">Parliament and Parliamentarism: A
                                Comparative History of a European Concept.</hi> Oxford, New York:
                            Berghahn Books.</bibl>
                        <bibl xml:id="Ilie.2017">Ilie, Cornelia. 2017. “Parliamentary Debates.” In
                                <hi rend="italic">The Routledge Handbook of Language and
                                Politics</hi>, edited by Ruth Wodak and Bernhard Forchtner.
                            Routledge.</bibl>
                        <bibl xml:id="Ljubešić.Erjavec.2016">Ljubešić, Nikola, and Tomaž Erjavec.
                            2016. “Corpus vs. Lexicon Supervision in Morphosyntactic Tagging: The
                            Case of Slovene.” In <hi rend="italic">Proceedings of the Tenth
                                International Conference on Language Resources and Evaluation (LREC
                                2016)</hi>, edited by Nicoletta Calzolari, Khalid Choukri, Thierry
                            Declerck, Sara Goggi, Marko Grobelnik, Bente Maegaard, Joseph Mariani,
                            Helene Mazo, Asuncion Moreno, Jan Odijk, and Stelios Piperidis, 1527–31.
                            Accessed February 27, 2019.<ref
                                target="http://www.lrec-conf.org/proceedings/lrec2016/pdf/811_Paper.pdf"
                                    ><hi rend="Internet_Link"><seg style="font-size:10pt"
                                        >http://www.lrec-conf.org/proceedings/lrec2016/pdf/811_Paper.pdf</seg></hi></ref><hi
                                rend="Internet_Link"><seg style="font-size:10pt">.</seg></hi>
                        </bibl>
                        <bibl xml:id="Ljubešić.Erjavec.Fišer.2016">Ljubešić, Nikola, Tomaž Erjavec,
                            Darja Fišer, Tanja Samardžić, Maja Miličević, Filip Klubička, and Filip
                            Petkovski. 2016. “Easily Accessible Language Technologies for Slovene,
                            Croatian and Serbian.” In <hi rend="italic">Proceedings of the
                                Conference on Language Technologies and Digital Humanities
                            2016</hi>, edited by Tomaž Erjavec and Darja Fišer, 120–24. Accessed
                            February 27, 2019. <ref
                                target="http://www.sdjt.si/wp/wp-content/uploads/2016/09/JTDH-2016_Ljubesic-et-al_Easily-Accessible-Language-Technologies.pdf"
                                    ><hi rend="Internet_Link"><seg style="font-size:10pt"
                                        >http://www.sdjt.si/wp/wp-content/uploads/2016/09/JTDH-2016_Ljubesic-et-al_Easily-Accessible-Language-Technologies.pdf</seg></hi></ref>.</bibl>
                        <bibl xml:id="Ljubešić.2018">Ljubešić, Nikola, Darja Fišer, Tomaž Erjavec, and Filip Dobranić. 2018.
                            “The Parlameter corpus of contemporary Slovene parliamentary proceedings.” In 
                            <hi rend="italic">Proceedings of the Conference on Language Technologies and Digital Humanities 2018</hi>,
                            edited by Darja Fišer and Andrej Pančur, 162–167. Accessed June 12, 2019. 
                            <ref target="http://www.sdjt.si/wp/wp-content/uploads/2018/09/JTDH-2018_Ljubesic-et-al_The-Parlameter-corpus-of-contemporary-Slovene-parliamentary-proceedings.pdf">http://www.sdjt.si/wp/wp-content/uploads/2018/09/JTDH-2018_Ljubesic-et-al_The-Parlameter-corpus-of-contemporary-Slovene-parliamentary-proceedings.pdf</ref>.</bibl>
                        <bibl xml:id="Pančur.Šorn.2016">Pančur, Andrej, and Mojca Šorn. 2016. “Smart
                            Big Data: Use of Slovenian Parliamentary Papers in Digital History.” <hi
                                rend="italic">Prispevki za novejšo zgodovino</hi> 56 (3): 130–46. </bibl>
                        <bibl xml:id="Pančur.2016">Pančur, Andrej. 2016. “Označevanje zbirke
                            zapisnikov sej slovenskega parlamenta s smernicami TEI.” In <hi
                                rend="italic">Proceedings of the Conference on Language Technologies
                                and Digital Humanities 2016</hi>, edited by Tomaž Erjavec and Darja
                            Fišer, 142–48. Accessed February 27, 2019. <ref
                                target="http://www.sdjt.si/wp/wp-content/uploads/2016/09/JTDH-2016_Pancur_Oznacevanje-zbirke-zapisnikov-sej-slovenskega-parlamenta.pdf"
                                    ><hi rend="Internet_Link"><seg style="font-size:10pt"
                                        >http://www.sdjt.si/wp/wp-content/uploads/2016/09/JTDH-2016_Pancur_Oznacevanje-zbirke-zapisnikov-sej-slovenskega-parlamenta.pdf</seg></hi></ref>.</bibl>
                        <bibl xml:id="Rheault.2016">Rheault, Ludovic, Kaspar Beelen, Christopher
                            Cochrane, and Graeme Hirst. 2016. “Measuring Emotion in Parliamentary
                            Debates with Automated Textual Analysis.” <hi rend="italic">PLoS
                                ONE</hi> 11 (12): 1–18. </bibl>
                        <bibl xml:id="TEIConsortium.">TEI Consortium, 2017. Guidelines for
                            Electronic Text Encoding and Interchange. Accessed February 27, 2019.
                                <ref
                                target="http://www.tei-c.org/release/doc/tei-p5-doc/en/html/index.html"
                                    ><hi rend="Internet_Link"><seg style="font-size:10pt"
                                        >http://www.tei-c.org/release/doc/tei-p5-doc/en/html/index.html</seg></hi></ref><hi
                                rend="Internet_Link"><seg style="font-size:10pt">.</seg></hi></bibl>
                    </listBibl>
                </div>
                <div>
                    <head>Sources:</head>
                    <listBibl>
                        <bibl xml:id="Dobranić.2019">Dobranić, Filip, Nikola Ljubešić, and Tomaž,
                            Erjavec. 2019. <hi rend="italic">Slovenian parliamentary corpus
                                ParlaMeter-sl 1.0</hi>, Slovenian language resource repository
                            CLARIN.SI. <ref target="http://hdl.handle.net/11356/1208"><hi
                                    rend="Internet_Link"><seg style="font-size:10pt"
                                        >http://hdl.handle.net/11356/1208</seg></hi></ref>.</bibl>
                        <bibl xml:id="Pančur.2017">Pančur, Andrej, Mojca Šorn, and Tomaž Erjavec.
                            2017. <hi rend="italic">Slovenian parliamentary corpus SlovParl
                            2.0</hi>, Slovenian language resource repository CLARIN.SI. <ref
                                target="http://hdl.handle.net/11356/1167"><hi rend="Internet_Link"
                                        ><seg style="font-size:10pt"
                                        >http://hdl.handle.net/11356/1167</seg></hi></ref>. </bibl>
                    </listBibl>
                </div>
            </div>
            <div type="summary">
                <docAuthor>Darja Fišer, Nikola Ljubešič, Tomaž Erjavec</docAuthor>
                <head style="text-transform: uppercase;">Parlameter – a corpus of contemporary Slovene parliamentary proceedings</head>
                <head rend="subheader">SUMMARY</head>
                <p>The unique content, structure and language, as well as the availability of
                    records of parliamentary debates are all factors that make them an important
                    object of study in a wide range disciplines in digital humanities and social
                    sciences. This has motivated a number of national as well as international
                    initiatives to compile, process and analyse parliamentary corpora. This paper
                    presents the Parlameter corpus of contemporary Slovene parliamentary
                    proceedings, which covers the VIIth mandate of the Slovene Parliament
                    (2014-2018). The Parlameter corpus offers rich speaker metadata (gender, age,
                    education, party affiliation) and is linguistically annotated (lemmatization,
                    tagging, named entity recognition).</p>
                <p>The Parlameter corpus contains 371 sessions and 1,981 speakers who gave 133,287
                    speeches which contain almost 35 million words. In the paper we demonstrate the
                    potential of the corpus analysis techniques for investigating political debates
                    by analysing the linguistic production of the speakers according to the
                    morphosyntactic annotation of the corpus and the speaker metadata. When
                    contrasted against general Slovene, parliamentary speeches contain more present
                    tense forms and personal and demonstrative pronouns. While male speakers take
                    the floor more often than their female colleagues, the female speakers’
                    contributions tend to be longer. Female speakers mostly address the topics of
                    health, labour, family and social affairs, public administration, and education,
                    science and sport, while most of the keywords from male speakers do not belong
                    to specific topics, which indicate a more discursive, debating style of the male
                    speakers. The most prolific deputy group overall is the largest opposition party
                    Slovenian Democratic Party (SDS) while the then ruling Party of Modern Centre
                    (SMC) is the least prolific. The most productive parties with a relative token
                    to speaker ratio are the smallest parties in that parliamentary term, the Left
                    (Levica) and New Slovenia (NSi). The largest opposition party SDS stands out
                    from the rest by the large amount of ideological keywords while Levica stands
                    out by signature stylistic devices which range from very informal to highly
                    elevated. NSi and Levica, the opposition parties with the same number of MPs but
                    from the opposite ends of the political spectrum, both address the widest
                    variety of issues. With keywords belonging almost exclusively to the semantic
                    field of retirement and pension, DeSUS lies on the other end of the spectrum as
                    a single-issue party. A comparison with the SlovParl corpus of parliamentary
                    debates from the period of Slovenia’s independence, many more topics are
                    identified in Parlameter, which understandable as a well-established state will
                    need to take care of a full spectrum of issues whereas a new state will mostly
                    be dealing with procedural issues and the new legislature.</p>
                <p>The Parlameter corpus is available through both CLARIN.SI concordancers, as well
                    as for download from its repository, both as a TEI document and in the simpler
                    vertical file format, under the liberal Creative Commons -
                    Attribution-ShareAlike (CC BY-SA 4.0) licence. The corpus architecture allows
                    for regular extensions of the corpus with additional Slovene data, as well as
                    data from other parliaments, starting with Croatian and Bosnian.</p>
            </div>
            <div type="summary" xml:lang="sl">
                <docAuthor>Darja Fišer, Nikola Ljubešič, Tomaž Erjavec</docAuthor>
                <head>PARLAMETER – KORPUS RAZPRAV SLOVENSKEGA DRŽAVNEGA ZBORA</head>
                <head rend="subheader">POVZETEK</head>
                <p>Edinstvena vsebina, struktura in jezik, pa tudi dostopnost prepisov
                    parlamentarnih razprav so dejavniki, zaradi katerih so le-ti pomemben predmet
                    raziskav v številnih znanstvenih disciplinah digitalne humanistike in
                    družboslovja. To je motiviralo številne nacionalne in mednarodne iniciative za
                    izgradnjo, označevanje in analizo parlamentarnih korpusov. V tem prispevku
                    predstavimo korpus sodobnih parlamentarnih razprav Parlameter, ki vsebuje
                    razprave 7. mandata slovenskega Državnega zbora (2014-2018). Korpus Parlameter
                    vsebuje bogate metapodatke o govorcih (spol, starost, izobrazba, strankarska
                    pripadnost) in je jezikoslovno označen (lematizacija, tegiranje, imenske
                    entitete).</p>
                <p>Korpus Parlameter vsebuje 371 razprav in 1.981 govorcev, ki so prispevali 133.287
                    govorov oziroma 35 milijonov besed. V prispevku prikažemo potencial
                    korpusnoanalitičnih tehnik za raziskovanje političnih razprav z analizo
                    jezikovne produkcije govorcev glede na morfosintaktične oznake in metapodatke o
                    govorcih. Primerjava s splošno slovenščino pokaže, da v parlamentarnih govorih
                    izstopajo sedanjiške oblike ter osebni in kazalni zaimki. Čeprav moški govorci
                    spregovorijo večkrat, so govori žensk daljši. Ženske večinoma razpravljajo o
                    temah, kot so zdravje, delo, družina in sociala, javna uprava ter izobraževanje,
                    znanost in šoprt, večina ključnih besed v moških govorih pa ni vezanih na
                    določeno tematiko, kar nakazuje bolj diskurziven, razpravljalski slog moških
                    govorcev. V celoti gledano je najbolj produktivna strankarska skupina največja
                    opozicijska stranka SDS, medtem ko je vladajoča stranka SMC v korpusu zastopana
                    z najmanj izrečenimi besedami. Najvišji relativni delež števila pojavnic na
                    govorca imata najmanjši parlamentarni stranki tega sklica Levica in NSi.
                    Največja opozicijska stranka SDS izstopa po izrazito velikem obsegu ideološko
                    obarvanih ključnih besed, Levica pa po specifičnih slogovnih figurah, ki so tako
                    zelo neformalne kot zelo povzdignjene. NSi in Levica, opozicijski stranki z
                    enakim številom poslancev a s povsem različnih polov političnega spektra, obe
                    naslavljajta največje število tematik. Po drugi strani pa s ključnimi besedami,
                    ki skoraj v celoti spadajo v pomensko polje upokojevanja in pokojnin, pa je
                    povsem obratno pri stranki DeSUS, ki s tem utrjuje svoj status problemske
                    stranke. Primerjava s korpusom SlovParl iz obdobja slovenske osamosvojitve kaže,
                    da je v korpusu Parlameter obravnavanih veliko več tem kot v korpusu SlovParl,
                    kar je razumljivo, saj se mora uveljavljena država ukvarjati s celotnim spektrom
                    problematik, medtem ko se novo ustanovljena država posveča predvsem
                    priceduralnim vprašanjem in sprejemanju nove zakonodaje.</p>
                <p>Korpus Parlameter je dostopen preko obeh konkordančnikov v okviru raziskovalne
                    infrastructure CLARIN.SI, prav tako pa ga je mogoče prenesti z repozitorija v
                    format TEI, pa tudi v preprostejšem vertikalnem formatu pod licenco Creative
                    Commons - Attribution-ShareAlike (CC BY-SA 4.0). Korpusna arhitektura je
                    zasnovana tako, da omogoča širitev korpusa na druga časovna obdobja, prav tako
                    pa tudi vključevanje gradiv drugih parlamentov, začenši s hrvaškim in
                    bosanskim.</p>
            </div>
        </back>
    </text>
</TEI>
