Dataset Open Access

INEL Kalmyk Corpus

Baranova, Vlada


MARC21 XML Export

<?xml version='1.0' encoding='UTF-8'?>
<record xmlns="http://www.loc.gov/MARC21/slim">
  <!-- Record leader: a fixed-length string of 24 character positions.
       Blank positions are written as real space characters. The "#" sign is only the
       way MARC documentation prints a blank, and the MARC21 slim schema pattern for
       the leader does not accept it, so the three "#" placeholders were replaced by spaces.
       NOTE(review): position 9 is left blank as in the original export; a UTF-8 record
       would normally be expected to carry "a" there. Confirm with the exporting system. -->
  <leader>00000nmm  2200000uu 4500</leader>
  <!-- Access and provenance fields.
       542 $l carries the access status ("open").
       909 (ind1 "C", ind2 "O") carries the record's OAI identifier in $o and three "user-*"
       values in $p; the same three values appear again in the 980 fields
       (presumably community or set names; confirm).
       773 links this record to DOI 10.25592/uhhfdm.17675 with the relation "isVersionOf";
       $n names the identifier scheme ("doi"). -->
  <datafield tag="542" ind1=" " ind2=" ">
    <subfield code="l">open</subfield>
  </datafield>
  <datafield tag="909" ind1="C" ind2="O">
    <subfield code="o">oai:fdr.uni-hamburg.de:17676</subfield>
    <subfield code="p">user-inel</subfield>
    <subfield code="p">user-adwhh</subfield>
    <subfield code="p">user-uhh</subfield>
  </datafield>
  <datafield tag="773" ind1=" " ind2=" ">
    <subfield code="a">10.25592/uhhfdm.17675</subfield>
    <subfield code="i">isVersionOf</subfield>
    <subfield code="n">doi</subfield>
  </datafield>
  <!-- 005: timestamp-like value (reads as 2025-07-22 10:59:13.0; confirm the format).
       NOTE(review): this controlfield sits between datafields. The MARC21 slim schema
       appears to expect all controlfields before the first datafield; confirm before
       relying on schema validation of this export. -->
  <controlfield tag="005">20250722105913.0</controlfield>
  <!-- 540: licence of the dataset, as URL ($u) and as display name ($a). -->
  <datafield tag="540" ind1=" " ind2=" ">
    <subfield code="u">https://creativecommons.org/licenses/by-nc-sa/4.0/legalcode</subfield>
    <subfield code="a">Creative Commons Attribution Non Commercial Share Alike 4.0 International</subfield>
  </datafield>
  <!-- 260 $c: the same date that the description in field 520 gives as the publication date. -->
  <datafield tag="260" ind1=" " ind2=" ">
    <subfield code="c">2025-07-17</subfield>
  </datafield>
  <!-- 041 $a: language code of the corpus material ("xal"; presumably the ISO 639 code for Kalmyk, confirm). -->
  <datafield tag="041" ind1=" " ind2=" ">
    <subfield code="a">xal</subfield>
  </datafield>
  <!-- Free-text keywords: one 653 datafield per term, each holding a single $a subfield.
       Both indicators are blank on every entry. -->
  <datafield tag="653" ind1=" " ind2=" ">
    <subfield code="a">endangered language</subfield>
  </datafield>
  <datafield tag="653" ind1=" " ind2=" ">
    <subfield code="a">indigenous language</subfield>
  </datafield>
  <datafield tag="653" ind1=" " ind2=" ">
    <subfield code="a">language contact</subfield>
  </datafield>
  <datafield tag="653" ind1=" " ind2=" ">
    <subfield code="a">language documentation</subfield>
  </datafield>
  <datafield tag="653" ind1=" " ind2=" ">
    <subfield code="a">INEL</subfield>
  </datafield>
  <datafield tag="653" ind1=" " ind2=" ">
    <subfield code="a">folklore</subfield>
  </datafield>
  <datafield tag="653" ind1=" " ind2=" ">
    <subfield code="a">narrative</subfield>
  </datafield>
  <datafield tag="653" ind1=" " ind2=" ">
    <subfield code="a">monologue</subfield>
  </datafield>
  <datafield tag="653" ind1=" " ind2=" ">
    <subfield code="a">morphological glossing</subfield>
  </datafield>
  <datafield tag="653" ind1=" " ind2=" ">
    <subfield code="a">English translation</subfield>
  </datafield>
  <datafield tag="653" ind1=" " ind2=" ">
    <subfield code="a">Russian translation</subfield>
  </datafield>
  <datafield tag="653" ind1=" " ind2=" ">
    <subfield code="a">EXMARaLDA</subfield>
  </datafield>
  <datafield tag="653" ind1=" " ind2=" ">
    <subfield code="a">ELAN</subfield>
  </datafield>
  <datafield tag="653" ind1=" " ind2=" ">
    <subfield code="a">XML</subfield>
  </datafield>
  <datafield tag="653" ind1=" " ind2=" ">
    <subfield code="a">ISO/TEI</subfield>
  </datafield>
  <datafield tag="653" ind1=" " ind2=" ">
    <subfield code="a">Mongolic languages</subfield>
  </datafield>
  <datafield tag="653" ind1=" " ind2=" ">
    <subfield code="a">annotated corpus</subfield>
  </datafield>
  <!-- 245 $a: title of the record. -->
  <datafield tag="245" ind1=" " ind2=" ">
    <subfield code="a">INEL Kalmyk Corpus</subfield>
  </datafield>
  <!-- 856 (ind1 "4"): one datafield per attached file.
       $s is a number (presumably the file size in bytes; confirm),
       $u is the download URL, and $z is a checksum string with an "md5:" prefix. -->
  <datafield tag="856" ind1="4" ind2=" ">
    <subfield code="s">758388</subfield>
    <subfield code="u">https://www.fdr.uni-hamburg.de/record/17676/files/kalmyk-1.0-documentation.pdf</subfield>
    <subfield code="z">md5:944f208fd72cd8658f479d33bc98fcd6</subfield>
  </datafield>
  <datafield tag="856" ind1="4" ind2=" ">
    <subfield code="s">8667672</subfield>
    <subfield code="u">https://www.fdr.uni-hamburg.de/record/17676/files/kalmyk-1.0-lite.zip</subfield>
    <subfield code="z">md5:9ae0dfd2e3bf56af4206eacc9e9326f3</subfield>
  </datafield>
  <datafield tag="856" ind1="4" ind2=" ">
    <subfield code="s">377964899</subfield>
    <subfield code="u">https://www.fdr.uni-hamburg.de/record/17676/files/kalmyk-1.0-mp3.zip</subfield>
    <subfield code="z">md5:e3fbf20d950fd90e65b52f316dafd704</subfield>
  </datafield>
  <datafield tag="856" ind1="4" ind2=" ">
    <subfield code="s">1835703820</subfield>
    <subfield code="u">https://www.fdr.uni-hamburg.de/record/17676/files/kalmyk-1.0-standard.zip</subfield>
    <subfield code="z">md5:45d29e3248b62b4549e464b207c91afe</subfield>
  </datafield>
  <!-- Licence term used as a subject entry; $2 names the vocabulary the term is taken from.
       The term must identify the same licence as field 540 of this record
       (Creative Commons Attribution Non Commercial Share Alike 4.0). The earlier value
       "cc-by" named a different, more permissive licence and contradicted field 540.
       NOTE(review): confirm the exact identifier spelling against the vocabulary named in $2. -->
  <datafield tag="650" ind1="1" ind2="7">
    <subfield code="a">cc-by-nc-sa</subfield>
    <subfield code="2">opendefinition.org</subfield>
  </datafield>
  <datafield tag="520" ind1=" " ind2=" ">
    <subfield code="a">&lt;p&gt;&lt;strong&gt;Corpus citation&lt;/strong&gt;&lt;/p&gt;

&lt;p&gt;&lt;em&gt;Baranova, Vlada&lt;/em&gt;. 2025. INEL Kalmyk Corpus. Version 1.0. Publication date 2025-07-17.&amp;nbsp;&lt;a href="https://hdl.handle.net/11022/0000-0007-FFB1-2"&gt;https://hdl.handle.net/11022/0000-0007-FFB1-2&lt;/a&gt;. Archived at Universit&amp;auml;t Hamburg. In: &lt;em&gt;The INEL Corpora of Indigenous Northern Eurasian Languages&lt;/em&gt;.&amp;nbsp;&lt;a href="https://hdl.handle.net/11022/0000-0007-F45A-1"&gt;https://hdl.handle.net/11022/0000-0007-F45A-1&lt;/a&gt;.&lt;/p&gt;

&lt;p&gt;&lt;strong&gt;Corpus Description&lt;/strong&gt;&lt;/p&gt;

&lt;p&gt;The INEL Kalmyk Corpus has been created within the long-term INEL project (&amp;quot;Grammatical Descriptions, Corpora and Language Technology for Indigenous Northern Eurasian Languages&amp;quot;), 2016&amp;ndash;2033.&lt;/p&gt;

&lt;p&gt;The corpus consists of transcribed audio recordings collected in the Republic of Kalmykia between 2007 and 2018 in the Ketchenerovsky District (Derbet and Torgut dialects).&lt;/p&gt;

&lt;p&gt;All texts in the corpus are provided with interlinear morpheme-by-morpheme glosses and translation into English and Russian. All texts for which the audio recordings were accessible are time-aligned with them.&amp;nbsp;&lt;/p&gt;

&lt;p&gt;&lt;strong&gt;Corpus Size&lt;/strong&gt;&lt;/p&gt;

&lt;p&gt;The corpus contains &lt;strong&gt;55 &lt;/strong&gt;texts, &lt;strong&gt;2,076 &lt;/strong&gt;sentences, and &lt;strong&gt;19,742&amp;nbsp;&lt;/strong&gt;tokens. The total duration of the audio recordings is &lt;strong&gt;4 &lt;/strong&gt;hours and &lt;strong&gt;23 &lt;/strong&gt;minutes.&lt;/p&gt;

&lt;p&gt;&lt;strong&gt;Funding&lt;/strong&gt;&lt;/p&gt;

&lt;p&gt;The corpus has been produced in the context of the joint research funding of the German Federal Government and Federal States in the Academies&amp;rsquo; Programme, with funding from the Federal Ministry of Education and Research and the Free and Hanseatic City of Hamburg. The Academies&amp;rsquo; Programme is coordinated by the Union of the German Academies of Sciences and Humanities.&lt;/p&gt;

&lt;p&gt;&lt;strong&gt;Contributions / Acknowledgements&lt;/strong&gt;&lt;/p&gt;

&lt;p&gt;Native speakers generously shared their knowledge of Kalmyk, making the creation of this corpus possible. Zamira Xejchieva and Galina Cabdy`rova assisted with oral transcription and the Russian translation of the audio materials.&lt;/p&gt;

&lt;p&gt;Part of the materials were recorded during joint expeditions of St. Petersburg University and the Institute for Linguistic Studies of the Russian Academy of Sciences in 2007&amp;ndash;2008, under the direction of Elena Perekhvalskaya and Sergey Say.&lt;/p&gt;

&lt;p&gt;This corpus primarily follows the transcription system and partially adopts the glossing conventions developed by a research team led by Sergey Say, with input from other expedition participants.&lt;/p&gt;

&lt;p&gt;&lt;strong&gt;Searching the corpus&lt;/strong&gt;&lt;/p&gt;

&lt;p&gt;The corpus can be downloaded from the ZFDM Repository using the links provided below and browsed or searched locally using the&amp;nbsp;&lt;a href="https://exmaralda.org/"&gt;EXMARaLDA&lt;/a&gt;&amp;nbsp;software or, alternatively,&amp;nbsp;&lt;a href="https://archive.mpi.nl/tla/elan"&gt;ELAN&lt;/a&gt;.&lt;/p&gt;

&lt;p&gt;Online search with the Tsakorpus platform is available at&amp;nbsp;&lt;a href="https://inel.corpora.uni-hamburg.de/KalmykCorpus/search"&gt;https://inel.corpora.uni-hamburg.de/KalmykCorpus/search&lt;/a&gt;.&lt;/p&gt;

&lt;p&gt;Remote search with EXMARaLDA is also possible without downloading all the files (see&amp;nbsp;&lt;a href="https://inel.corpora.uni-hamburg.de/portal/help/en/index.php"&gt;https://inel.corpora.uni-hamburg.de/portal/help/en/index.php&lt;/a&gt;).&lt;/p&gt;

&lt;p&gt;See the user documentation&amp;nbsp;(section 3) for details on transcription, annotation tiers and annotation tags.&lt;br&gt;
Find further information and links on the Kalmyk Corpus page at the INEL Resources portal:&amp;nbsp;&lt;a href="https://inel.corpora.uni-hamburg.de/portal/corpora/kalmyk/"&gt;https://inel.corpora.uni-hamburg.de/portal/corpora/kalmyk/&lt;/a&gt;.&lt;/p&gt;</subfield>
  </datafield>
  <!-- 980 $a values: "dataset" (presumably the resource type; confirm) followed by the
       same three "user-*" names that field 909 lists in its $p subfields. -->
  <datafield tag="980" ind1=" " ind2=" ">
    <subfield code="a">dataset</subfield>
  </datafield>
  <datafield tag="980" ind1=" " ind2=" ">
    <subfield code="a">user-adwhh</subfield>
  </datafield>
  <datafield tag="980" ind1=" " ind2=" ">
    <subfield code="a">user-inel</subfield>
  </datafield>
  <datafield tag="980" ind1=" " ind2=" ">
    <subfield code="a">user-uhh</subfield>
  </datafield>
  <!-- 700: further contributors, one datafield per person.
       $a is the name in "Surname, Given name" form, $u the affiliation, and $4 a
       three-letter role code ("dtm", "edt"; presumably MARC relator codes, confirm). -->
  <datafield tag="700" ind1=" " ind2=" ">
    <subfield code="a">Lazarenko, Elena</subfield>
    <subfield code="u">Universität Hamburg</subfield>
    <subfield code="4">dtm</subfield>
  </datafield>
  <datafield tag="700" ind1=" " ind2=" ">
    <subfield code="a">Riaposov, Aleksandr</subfield>
    <subfield code="u">Universität Hamburg</subfield>
    <subfield code="4">dtm</subfield>
  </datafield>
  <datafield tag="700" ind1=" " ind2=" ">
    <subfield code="a">Arkhipov, Alexandre</subfield>
    <subfield code="u">Universität Hamburg</subfield>
    <subfield code="4">edt</subfield>
  </datafield>
  <!-- 024: identifiers of this record; $2 names the scheme ("doi", "handle").
       The handle value is the one linked in the corpus citation inside field 520,
       and $q marks it as "alternateidentifier". -->
  <datafield tag="024" ind1=" " ind2=" ">
    <subfield code="a">10.25592/uhhfdm.17676</subfield>
    <subfield code="2">doi</subfield>
  </datafield>
  <datafield tag="024" ind1=" " ind2=" ">
    <subfield code="a">11022/0000-0007-FFB1-2</subfield>
    <subfield code="2">handle</subfield>
    <subfield code="q">alternateidentifier</subfield>
  </datafield>
  <!-- 100: main author. $u is the affiliation; $0 holds an identifier with an "(orcid)" prefix. -->
  <datafield tag="100" ind1=" " ind2=" ">
    <subfield code="a">Baranova, Vlada</subfield>
    <subfield code="u">Universität Hamburg</subfield>
    <subfield code="0">(orcid)0000-0003-1642-4003</subfield>
  </datafield>
  <!-- 001: record number; the same number ends the OAI identifier in 909 $o and the DOI in 024 $a.
       NOTE(review): this controlfield follows the datafields. The MARC21 slim schema appears
       to expect controlfields before the first datafield; confirm before schema validation. -->
  <controlfield tag="001">17676</controlfield>
</record>

Cite record as