Conference paper Open Access

The IWSLT 2019 KIT Speech Translation System

Pham, Ngoc-Quan; Nguyen, Thai-Son; Ha, Thanh-Le; Hussain, Juan; Schneider, Felix; Niehues, Jan; Stüker, Sebastian; Waibel, Alexander


MARC21 XML Export

<?xml version='1.0' encoding='UTF-8'?>
<record xmlns="http://www.loc.gov/MARC21/slim">
  <leader>00000nam##2200000uu#4500</leader>
  <datafield tag="041" ind1=" " ind2=" ">
    <subfield code="a">eng</subfield>
  </datafield>
  <controlfield tag="005">20200120170502.0</controlfield>
  <controlfield tag="001">3525564</controlfield>
  <datafield tag="700" ind1=" " ind2=" ">
    <subfield code="u">Institute for Anthropomatics and Robotics, KIT - Karlsruhe Institute of Technology, Germany</subfield>
    <subfield code="a">Nguyen, Thai-Son</subfield>
  </datafield>
  <datafield tag="700" ind1=" " ind2=" ">
    <subfield code="u">Institute for Anthropomatics and Robotics, KIT - Karlsruhe Institute of Technology, Germany</subfield>
    <subfield code="a">Ha, Thanh-Le</subfield>
  </datafield>
  <datafield tag="700" ind1=" " ind2=" ">
    <subfield code="u">Institute for Anthropomatics and Robotics, KIT - Karlsruhe Institute of Technology, Germany</subfield>
    <subfield code="a">Hussain, Juan</subfield>
  </datafield>
  <datafield tag="700" ind1=" " ind2=" ">
    <subfield code="u">Institute for Anthropomatics and Robotics, KIT - Karlsruhe Institute of Technology, Germany</subfield>
    <subfield code="a">Schneider, Felix</subfield>
  </datafield>
  <datafield tag="700" ind1=" " ind2=" ">
    <subfield code="u">Department of Data Science, University of Maastricht, Netherlands</subfield>
    <subfield code="a">Niehues, Jan</subfield>
  </datafield>
  <datafield tag="700" ind1=" " ind2=" ">
    <subfield code="u">Institute for Anthropomatics and Robotics, KIT - Karlsruhe Institute of Technology, Germany</subfield>
    <subfield code="a">Stüker, Sebastian</subfield>
  </datafield>
  <datafield tag="700" ind1=" " ind2=" ">
    <subfield code="u">Language Technologies Institute, Carnegie Mellon University &amp; Institute for Anthropomatics and Robotics, KIT - Karlsruhe Institute of Technology, Germany</subfield>
    <subfield code="a">Waibel, Alexander</subfield>
  </datafield>
  <datafield tag="856" ind1="4" ind2=" ">
    <subfield code="s">233710</subfield>
    <subfield code="z">md5:c328ea0a9f886839abd3b19cac97b40b</subfield>
    <subfield code="u">https://zenodo.org/record/3525564/files/IWSLT2019_paper_40.pdf</subfield>
  </datafield>
  <datafield tag="542" ind1=" " ind2=" ">
    <subfield code="l">open</subfield>
  </datafield>
  <datafield tag="260" ind1=" " ind2=" ">
    <subfield code="c">2019-11-02</subfield>
  </datafield>
  <datafield tag="909" ind1="C" ind2="O">
    <subfield code="p">openaire</subfield>
    <subfield code="p">user-iwslt2019</subfield>
    <subfield code="o">oai:zenodo.org:3525564</subfield>
  </datafield>
  <datafield tag="100" ind1=" " ind2=" ">
    <subfield code="u">Institute for Anthropomatics and Robotics, KIT - Karlsruhe Institute of Technology, Germany</subfield>
    <subfield code="a">Pham, Ngoc-Quan</subfield>
  </datafield>
  <datafield tag="245" ind1=" " ind2=" ">
    <subfield code="a">The IWSLT 2019 KIT Speech Translation System</subfield>
  </datafield>
  <datafield tag="980" ind1=" " ind2=" ">
    <subfield code="a">user-iwslt2019</subfield>
  </datafield>
  <datafield tag="540" ind1=" " ind2=" ">
    <subfield code="u">https://creativecommons.org/licenses/by/4.0/legalcode</subfield>
    <subfield code="a">Creative Commons Attribution 4.0 International</subfield>
  </datafield>
  <datafield tag="650" ind1="1" ind2="7">
    <subfield code="a">cc-by</subfield>
    <subfield code="2">opendefinition.org</subfield>
  </datafield>
  <datafield tag="520" ind1=" " ind2=" ">
    <subfield code="a">&lt;p&gt;This paper describes KIT&amp;rsquo;s submission to the IWSLT 2019 Speech Translation task on two sub-tasks corresponding to two different datasets. We investigate different end-to-end architectures for the speech recognition module, including our new transformer-based architectures. Overall, our modules in the pipeline are based on the transformer architecture which has recently achieved great results in various fields. In our systems, using transformer is also advantageous compared to traditional hybrid systems in terms of simplicity while still having competent results.&lt;/p&gt;</subfield>
  </datafield>
  <datafield tag="773" ind1=" " ind2=" ">
    <subfield code="n">doi</subfield>
    <subfield code="i">isVersionOf</subfield>
    <subfield code="a">10.5281/zenodo.3525563</subfield>
  </datafield>
  <datafield tag="024" ind1=" " ind2=" ">
    <subfield code="a">10.5281/zenodo.3525564</subfield>
    <subfield code="2">doi</subfield>
  </datafield>
  <datafield tag="980" ind1=" " ind2=" ">
    <subfield code="a">publication</subfield>
    <subfield code="b">conferencepaper</subfield>
  </datafield>
</record>
405
436
views
downloads
All versions This version
Views 405 405
Downloads 436 436
Data volume 101.9 MB 101.9 MB
Unique views 359 359
Unique downloads 392 392

Share

Cite as