Conference paper Open Access

Dataset for Temporal Analysis of English-French Cognates

Frossard, Esteban; Coustaty, Mickael; Doucet, Antoine; Jatowt, Adam; Hengchen, Simon


MARC21 XML Export

<?xml version='1.0' encoding='UTF-8'?>
<!--
  MARCXML ("slim" namespace) bibliographic record for the conference paper
  "Dataset for Temporal Analysis of English-French Cognates".
  Field names used in the comments below follow the MARC 21 bibliographic
  format. Tags 909 and 980 are in the locally defined 9XX range, so their
  meaning is set by the exporting repository rather than by the standard;
  the descriptions given for them are read off the values and should be
  confirmed against the exporter.
  NOTE(review): the two controlfield elements (001, 005) appear after several
  datafield elements. Strict MARCXML schema validation may expect the order
  leader, controlfields, datafields. Confirm before feeding this record to a
  validating consumer.
-->
<record xmlns="http://www.loc.gov/MARC21/slim">
  <!-- Leader. The "#" characters presumably stand in for blank positions; confirm with the exporter. -->
  <leader>00000nam##2200000uu#4500</leader>
  <!-- 041: language code of the item. -->
  <datafield tag="041" ind1=" " ind2=" ">
    <subfield code="a">eng</subfield>
  </datafield>
  <!-- 653: uncontrolled index terms (keywords), one term per field. -->
  <datafield tag="653" ind1=" " ind2=" ">
    <subfield code="a">Crosslingual semantic change</subfield>
  </datafield>
  <datafield tag="653" ind1=" " ind2=" ">
    <subfield code="a">cognates</subfield>
  </datafield>
  <datafield tag="653" ind1=" " ind2=" ">
    <subfield code="a">temporal analysis</subfield>
  </datafield>
  <datafield tag="653" ind1=" " ind2=" ">
    <subfield code="a">semantic analysis</subfield>
  </datafield>
  <!-- 005: date and time of latest transaction, written as yyyymmddhhmmss.f. -->
  <controlfield tag="005">20200313172458.0</controlfield>
  <!-- 001: control number. The same number appears in the file URL, the OAI identifier and the DOI further down. -->
  <controlfield tag="001">3693651</controlfield>
  <!-- 711: meeting name. $a conference name, $g acronym and year, $d dates, $c place. -->
  <datafield tag="711" ind1=" " ind2=" ">
    <subfield code="d">13th-15th May 2020</subfield>
    <subfield code="g">LREC 2020</subfield>
    <subfield code="a">12th Edition Language Resources and Evaluation Conference.</subfield>
    <subfield code="c">Marseilles, France</subfield>
  </datafield>
  <!-- 700: additional authors. $a personal name, $u affiliation, $0 ORCID identifier with an "(orcid)" prefix. -->
  <datafield tag="700" ind1=" " ind2=" ">
    <subfield code="u">University of La Rochelle, L3i Laboratory,</subfield>
    <subfield code="0">(orcid)0000-0002-0123-439X</subfield>
    <subfield code="a">Coustaty, Mickael</subfield>
  </datafield>
  <datafield tag="700" ind1=" " ind2=" ">
    <subfield code="u">University of La Rochelle, L3i Laboratory,</subfield>
    <subfield code="0">(orcid)0000-0001-6160-3356</subfield>
    <subfield code="a">Doucet, Antoine</subfield>
  </datafield>
  <datafield tag="700" ind1=" " ind2=" ">
    <subfield code="u">Kyoto University</subfield>
    <subfield code="0">(orcid)0000-0001-7235-0665</subfield>
    <subfield code="a">Jatowt, Adam</subfield>
  </datafield>
  <datafield tag="700" ind1=" " ind2=" ">
    <subfield code="u">University of Helsinki</subfield>
    <subfield code="0">(orcid)0000-0002-8453-7221</subfield>
    <subfield code="a">Hengchen, Simon</subfield>
  </datafield>
  <!-- 856: electronic location of the PDF. $u URL, $z md5 checksum, $s file size (presumably in bytes; confirm). -->
  <datafield tag="856" ind1="4" ind2=" ">
    <subfield code="s">649627</subfield>
    <subfield code="z">md5:dfa800d83f8db46c2e7a75944c723980</subfield>
    <subfield code="u">https://zenodo.org/record/3693651/files/LREC_Temporal_Study.pdf</subfield>
  </datafield>
  <!-- 542: copyright status information; $l carries the access status "open". -->
  <datafield tag="542" ind1=" " ind2=" ">
    <subfield code="l">open</subfield>
  </datafield>
  <!-- 856: second electronic location, a link to the conference website ($y is the link text). -->
  <datafield tag="856" ind1="4" ind2=" ">
    <subfield code="y">Conference website</subfield>
    <subfield code="u">https://lrec2020.lrec-conf.org/en/</subfield>
  </datafield>
  <!-- 260: publication information; only the date ($c) is given. -->
  <datafield tag="260" ind1=" " ind2=" ">
    <subfield code="c">2020-05-13</subfield>
  </datafield>
  <!-- 909 C O: local field. $o holds an OAI identifier; the $p values look like OAI set names (confirm). -->
  <datafield tag="909" ind1="C" ind2="O">
    <subfield code="p">openaire</subfield>
    <subfield code="p">user-newseye</subfield>
    <subfield code="o">oai:zenodo.org:3693651</subfield>
  </datafield>
  <!-- 100: main entry, the first author. Same subfield layout as the 700 fields. -->
  <datafield tag="100" ind1=" " ind2=" ">
    <subfield code="u">University of La Rochelle, L3i Laboratory,</subfield>
    <subfield code="0">(orcid)0000-0003-4621-244X</subfield>
    <subfield code="a">Frossard, Esteban</subfield>
  </datafield>
  <!-- 245: title statement. -->
  <datafield tag="245" ind1=" " ind2=" ">
    <subfield code="a">Dataset for Temporal Analysis of English-French Cognates</subfield>
  </datafield>
  <!-- 980: local field. The value matches the "user-newseye" entry in field 909; presumably a community or collection tag (confirm). -->
  <datafield tag="980" ind1=" " ind2=" ">
    <subfield code="a">user-newseye</subfield>
  </datafield>
  <!-- 536: funding information, one field per grant. $c grant number, $a project title. -->
  <datafield tag="536" ind1=" " ind2=" ">
    <subfield code="c">770299</subfield>
    <subfield code="a">NewsEye: A Digital Investigator for Historical Newspapers</subfield>
  </datafield>
  <datafield tag="536" ind1=" " ind2=" ">
    <subfield code="c">825153</subfield>
    <subfield code="a">Cross-Lingual Embeddings for Less-Represented Languages in European News Media</subfield>
  </datafield>
  <!-- 540: terms governing use. $a licence name, $u URL of the licence text. -->
  <datafield tag="540" ind1=" " ind2=" ">
    <subfield code="u">https://creativecommons.org/licenses/by/4.0/legalcode</subfield>
    <subfield code="a">Creative Commons Attribution 4.0 International</subfield>
  </datafield>
  <!-- 650: subject entry used here for the licence identifier; $2 names the source vocabulary. -->
  <datafield tag="650" ind1="1" ind2="7">
    <subfield code="a">cc-by</subfield>
    <subfield code="2">opendefinition.org</subfield>
  </datafield>
  <!--
    520: summary (abstract). The text is HTML that has been entity-escaped for
    XML: after XML parsing the value starts with a literal "<p>" tag and
    contains the HTML entity for a non-breaking space, so a consumer that wants
    plain text has to strip or render that HTML as a second step.
  -->
  <datafield tag="520" ind1=" " ind2=" ">
    <subfield code="a">&lt;p&gt;Languages change over time and, thanks to abundance of digital corpora, their evolutionary analysis using computational techniques has recently gained much research attention. In this paper, we focus on creating a database to investigate the similarity in evolution&amp;nbsp;between different languages. We look in particular into the similarities and differences between the use of corresponding words across time in English and French, two languages from different linguistic families yet with shared syntax and close contact. To analyze this evolution, we select a set of cognates in both languages and study their temporal changes and correlations. We propose a new database for computational approaches of synchronized diachronic investigation of language pairs, and subsequent novel findings stemming from the cognates temporal comparison of the two chosen languages. To the best of our knowledge, the present study is the first in the literature to use computational approaches and large data to make a cross-language temporal analysis.&lt;/p&gt;</subfield>
  </datafield>
  <!-- 773: related item. $i relation type, $n identifier scheme, $a identifier (a DOI whose number is one below this record's DOI). -->
  <datafield tag="773" ind1=" " ind2=" ">
    <subfield code="n">doi</subfield>
    <subfield code="i">isVersionOf</subfield>
    <subfield code="a">10.5281/zenodo.3693650</subfield>
  </datafield>
  <!-- 024: other standard identifier, the DOI of this record; $2 names the scheme. -->
  <datafield tag="024" ind1=" " ind2=" ">
    <subfield code="a">10.5281/zenodo.3693651</subfield>
    <subfield code="2">doi</subfield>
  </datafield>
  <!-- 980: local field, second occurrence. $a resource type, $b subtype. -->
  <datafield tag="980" ind1=" " ind2=" ">
    <subfield code="a">publication</subfield>
    <subfield code="b">conferencepaper</subfield>
  </datafield>
</record>
117 views
59 downloads
Statistic | All versions | This version
Views | 117 | 117
Downloads | 59 | 58
Data volume | 38.3 MB | 37.7 MB
Unique views | 104 | 104
Unique downloads | 57 | 56

Share

Cite as