Project deliverable Open Access

Lynx D2.6 Report on Lynx acquired corpora

Ēriks Ajausks; Christian Sageder; Andis Lagzdiņš; Víctor Rodríguez-Doncel


MARC21 XML Export

<?xml version='1.0' encoding='UTF-8'?>
<record xmlns="http://www.loc.gov/MARC21/slim">
  <leader>00000nam##2200000uu#4500</leader>
  <datafield tag="041" ind1=" " ind2=" ">
    <subfield code="a">eng</subfield>
  </datafield>
  <datafield tag="653" ind1=" " ind2=" ">
    <subfield code="a">Lynx legal corpora, Lynx translation corpora</subfield>
  </datafield>
  <controlfield tag="005">20200302060019.0</controlfield>
  <controlfield tag="001">3692591</controlfield>
  <datafield tag="700" ind1=" " ind2=" ">
    <subfield code="u">openlaws</subfield>
    <subfield code="a">Christian Sageder</subfield>
  </datafield>
  <datafield tag="700" ind1=" " ind2=" ">
    <subfield code="u">TILDE</subfield>
    <subfield code="a">Andis Lagzdiņš</subfield>
  </datafield>
  <datafield tag="700" ind1=" " ind2=" ">
    <subfield code="u">Universidad Politécnica de Madrid</subfield>
    <subfield code="a">Víctor Rodríguez-Doncel</subfield>
  </datafield>
  <datafield tag="700" ind1=" " ind2=" ">
    <subfield code="u">TILDE</subfield>
    <subfield code="4">oth</subfield>
    <subfield code="a">Roberts Rozis</subfield>
  </datafield>
  <datafield tag="700" ind1=" " ind2=" ">
    <subfield code="u">TILDE</subfield>
    <subfield code="4">oth</subfield>
    <subfield code="a">Rinalds Vīksna</subfield>
  </datafield>
  <datafield tag="700" ind1=" " ind2=" ">
    <subfield code="u">TILDE</subfield>
    <subfield code="4">oth</subfield>
    <subfield code="a">Matīss Rikters</subfield>
  </datafield>
  <datafield tag="856" ind1="4" ind2=" ">
    <subfield code="s">822654</subfield>
    <subfield code="z">md5:996eee54ce1714b1699660ea1a235813</subfield>
    <subfield code="u">https://zenodo.org/record/3692591/files/D2.6_Report_on_Lynx acquired corpora_Final.pdf</subfield>
  </datafield>
  <datafield tag="542" ind1=" " ind2=" ">
    <subfield code="l">open</subfield>
  </datafield>
  <datafield tag="260" ind1=" " ind2=" ">
    <subfield code="c">2020-02-29</subfield>
  </datafield>
  <datafield tag="909" ind1="C" ind2="O">
    <subfield code="p">openaire</subfield>
    <subfield code="p">user-lynx</subfield>
    <subfield code="o">oai:zenodo.org:3692591</subfield>
  </datafield>
  <datafield tag="100" ind1=" " ind2=" ">
    <subfield code="u">TILDE</subfield>
    <subfield code="a">Ēriks Ajausks</subfield>
  </datafield>
  <datafield tag="245" ind1=" " ind2=" ">
    <subfield code="a">Lynx D2.6 Report on Lynx acquired corpora</subfield>
  </datafield>
  <datafield tag="980" ind1=" " ind2=" ">
    <subfield code="a">user-lynx</subfield>
  </datafield>
  <datafield tag="536" ind1=" " ind2=" ">
    <subfield code="c">780602</subfield>
    <subfield code="a">Building the Legal Knowledge Graph for Smart Compliance Services in Multilingual Europe</subfield>
  </datafield>
  <datafield tag="540" ind1=" " ind2=" ">
    <subfield code="u">http://creativecommons.org/licenses/by/4.0/legalcode</subfield>
    <subfield code="a">Creative Commons Attribution 4.0 International</subfield>
  </datafield>
  <datafield tag="650" ind1="1" ind2="7">
    <subfield code="a">cc-by</subfield>
    <subfield code="2">opendefinition.org</subfield>
  </datafield>
  <datafield tag="520" ind1=" " ind2=" ">
    <subfield code="a">&lt;p&gt;This deliverable summarizes the final work on acquired corpora (as part of WP2) within the context of the Lynx project. The aim of this task is to provide a description of the corpora collection methods, and the resulting collected corpora by Lynx partners around the different use cases. There are three business cases for each corpus. The first case is related to Compliance Assurance Services for Contracts, the second is related to Compliance Assurance Services in Oil &amp;amp; Gas and Energy, and the third Business Case is about Compliance Assurance Services in Labor Law. This document serves as reference material for the corpora collected to cover the needs of the three business cases, and for the first steps in the method followed to index those corpora. Furthermore, the document describes the corpora preparation workflow to be used in the training of Neural MT engines for specific languages and domains. Finally, this document reports on the term extraction process on the compiled corpora.&lt;/p&gt;</subfield>
  </datafield>
  <datafield tag="773" ind1=" " ind2=" ">
    <subfield code="n">doi</subfield>
    <subfield code="i">isVersionOf</subfield>
    <subfield code="a">10.5281/zenodo.3692590</subfield>
  </datafield>
  <datafield tag="024" ind1=" " ind2=" ">
    <subfield code="a">10.5281/zenodo.3692591</subfield>
    <subfield code="2">doi</subfield>
  </datafield>
  <datafield tag="980" ind1=" " ind2=" ">
    <subfield code="a">publication</subfield>
    <subfield code="b">deliverable</subfield>
  </datafield>
</record>
24 views
21 downloads
Statistic: All versions / This version
Views: 24 / 24
Downloads: 21 / 21
Data volume: 17.3 MB / 17.3 MB
Unique views: 23 / 23
Unique downloads: 18 / 18

Share

Cite as