There is a newer version of this record available.

Dataset Open Access

Jingju a cappella singing dataset part1

Rong Gong; Rafael Caro Repetto; Yile Yang; Xavier Serra


MARC21 XML Export

<?xml version='1.0' encoding='UTF-8'?>
<record xmlns="http://www.loc.gov/MARC21/slim">
  <leader>00000nmm##2200000uu#4500</leader>
  <datafield tag="653" ind1=" " ind2=" ">
    <subfield code="a">Beijing opera</subfield>
  </datafield>
  <datafield tag="653" ind1=" " ind2=" ">
    <subfield code="a">annotation</subfield>
  </datafield>
  <datafield tag="653" ind1=" " ind2=" ">
    <subfield code="a">phoneme</subfield>
  </datafield>
  <datafield tag="653" ind1=" " ind2=" ">
    <subfield code="a">syllable</subfield>
  </datafield>
  <datafield tag="653" ind1=" " ind2=" ">
    <subfield code="a">phrase</subfield>
  </datafield>
  <datafield tag="653" ind1=" " ind2=" ">
    <subfield code="a">singing voice</subfield>
  </datafield>
  <datafield tag="653" ind1=" " ind2=" ">
    <subfield code="a">praat</subfield>
  </datafield>
  <datafield tag="653" ind1=" " ind2=" ">
    <subfield code="a">textgrid</subfield>
  </datafield>
  <datafield tag="653" ind1=" " ind2=" ">
    <subfield code="a">wave audio</subfield>
  </datafield>
  <datafield tag="653" ind1=" " ind2=" ">
    <subfield code="a">jingju</subfield>
  </datafield>
  <datafield tag="653" ind1=" " ind2=" ">
    <subfield code="a">MTG</subfield>
  </datafield>
  <datafield tag="653" ind1=" " ind2=" ">
    <subfield code="a">C4DM</subfield>
  </datafield>
  <datafield tag="653" ind1=" " ind2=" ">
    <subfield code="a">a cappella</subfield>
  </datafield>
  <controlfield tag="005">20200124192604.0</controlfield>
  <controlfield tag="001">1244720</controlfield>
  <datafield tag="700" ind1=" " ind2=" ">
    <subfield code="u">Music Technology Group - Universitat Pompeu Fabra</subfield>
    <subfield code="a">Rafael Caro Repetto</subfield>
  </datafield>
  <datafield tag="700" ind1=" " ind2=" ">
    <subfield code="u">Music Technology Group - Universitat Pompeu Fabra</subfield>
    <subfield code="a">Yile Yang</subfield>
  </datafield>
  <datafield tag="700" ind1=" " ind2=" ">
    <subfield code="u">Music Technology Group - Universitat Pompeu Fabra</subfield>
    <subfield code="0">(orcid)0000-0003-1395-2345</subfield>
    <subfield code="a">Xavier Serra</subfield>
  </datafield>
  <datafield tag="856" ind1="4" ind2=" ">
    <subfield code="s">217942</subfield>
    <subfield code="z">md5:dfb3bfc0322ff3144f713bcaef39d534</subfield>
    <subfield code="u">https://zenodo.org/record/1244720/files/annotation_txt.zip</subfield>
  </datafield>
  <datafield tag="856" ind1="4" ind2=" ">
    <subfield code="s">4817</subfield>
    <subfield code="z">md5:ffaa9c074e556e1be45f3e6231cdcdd9</subfield>
    <subfield code="u">https://zenodo.org/record/1244720/files/catalogue - dan.csv</subfield>
  </datafield>
  <datafield tag="856" ind1="4" ind2=" ">
    <subfield code="s">3397</subfield>
    <subfield code="z">md5:768fa00ce1f8880ae5480fae103ecc06</subfield>
    <subfield code="u">https://zenodo.org/record/1244720/files/catalogue - laosheng.csv</subfield>
  </datafield>
  <datafield tag="856" ind1="4" ind2=" ">
    <subfield code="s">17485</subfield>
    <subfield code="z">md5:1e4c9b2a9a584d13736196fff6e41951</subfield>
    <subfield code="u">https://zenodo.org/record/1244720/files/pycode.zip</subfield>
  </datafield>
  <datafield tag="856" ind1="4" ind2=" ">
    <subfield code="s">2017</subfield>
    <subfield code="z">md5:f1113d4c03b379a6a23d85e2c215d54b</subfield>
    <subfield code="u">https://zenodo.org/record/1244720/files/readme.txt</subfield>
  </datafield>
  <datafield tag="856" ind1="4" ind2=" ">
    <subfield code="s">1241608</subfield>
    <subfield code="z">md5:8088161679f519d13f96dc1be9f53bdd</subfield>
    <subfield code="u">https://zenodo.org/record/1244720/files/textgrid.zip</subfield>
  </datafield>
  <datafield tag="856" ind1="4" ind2=" ">
    <subfield code="s">686516146</subfield>
    <subfield code="z">md5:4506a948480ff4d46d487148e7528f82</subfield>
    <subfield code="u">https://zenodo.org/record/1244720/files/wav_mono.zip</subfield>
  </datafield>
  <datafield tag="856" ind1="4" ind2=" ">
    <subfield code="s">868953391</subfield>
    <subfield code="z">md5:4722abda831c20b169a62b2754b15bea</subfield>
    <subfield code="u">https://zenodo.org/record/1244720/files/wav.zip</subfield>
  </datafield>
  <datafield tag="542" ind1=" " ind2=" ">
    <subfield code="l">open</subfield>
  </datafield>
  <datafield tag="260" ind1=" " ind2=" ">
    <subfield code="c">2018-05-10</subfield>
  </datafield>
  <datafield tag="909" ind1="C" ind2="O">
    <subfield code="p">openaire_data</subfield>
    <subfield code="p">user-mdm-dtic-upf</subfield>
    <subfield code="p">user-mir</subfield>
    <subfield code="p">user-mtgupf</subfield>
    <subfield code="o">oai:zenodo.org:1244720</subfield>
  </datafield>
  <datafield tag="100" ind1=" " ind2=" ">
    <subfield code="u">Music Technology Group - Universitat Pompeu Fabra</subfield>
    <subfield code="0">(orcid)0000-0002-4659-9034</subfield>
    <subfield code="a">Rong Gong</subfield>
  </datafield>
  <datafield tag="245" ind1=" " ind2=" ">
    <subfield code="a">Jingju a cappella singing dataset part1</subfield>
  </datafield>
  <datafield tag="980" ind1=" " ind2=" ">
    <subfield code="a">user-mdm-dtic-upf</subfield>
  </datafield>
  <datafield tag="980" ind1=" " ind2=" ">
    <subfield code="a">user-mir</subfield>
  </datafield>
  <datafield tag="980" ind1=" " ind2=" ">
    <subfield code="a">user-mtgupf</subfield>
  </datafield>
  <datafield tag="536" ind1=" " ind2=" ">
    <subfield code="c">267583</subfield>
    <subfield code="a">Computational models for the discovery of the world's music</subfield>
  </datafield>
  <datafield tag="540" ind1=" " ind2=" ">
    <subfield code="u">https://creativecommons.org/licenses/by-nc/4.0/legalcode</subfield>
    <subfield code="a">Creative Commons Attribution Non Commercial 4.0 International</subfield>
  </datafield>
  <datafield tag="650" ind1="1" ind2="7">
    <subfield code="a">cc-by</subfield>
    <subfield code="2">opendefinition.org</subfield>
  </datafield>
  <datafield tag="520" ind1=" " ind2=" ">
    <subfield code="a">&lt;p&gt;This is the 4th version of the dataset. The folder structure has changed since the 2nd version: the Laosheng folder has been moved directly into the .wav or textgrid&amp;nbsp;folder.&lt;/p&gt;

&lt;p&gt;&lt;strong&gt;Description:&lt;/strong&gt;&lt;/p&gt;

&lt;p&gt;This dataset is a collection of boundary annotations of a cappella singing performed by Beijing Opera (Jingju, 京剧) professional and amateur singers.&amp;nbsp;&lt;/p&gt;

&lt;ol&gt;
	&lt;li&gt;wav.zip: audio files in .wav format, mono or stereo.&lt;/li&gt;
	&lt;li&gt;wav_mono.zip: audio files in .wav&amp;nbsp;format, mono&lt;/li&gt;
	&lt;li&gt;annotation_txt.zip: line, syllable and phoneme time boundaries (second) and labels in .txt format&lt;/li&gt;
	&lt;li&gt;textgrid.zip: line, syllable and phoneme annotation in Praat .textgrid format&lt;/li&gt;
	&lt;li&gt;pycode.zip: util code for parsing the .textgrid annotation&lt;/li&gt;
	&lt;li&gt;catalogue*.csv: recording metadata; source separation recordings are not included.&lt;/li&gt;
&lt;/ol&gt;

&lt;p&gt;The boundaries (onset and offset) have been annotated in both &lt;strong&gt;Praat TextGrid (textgrid.zip)&lt;/strong&gt; and &lt;strong&gt;.txt (annotation_txt.zip)&lt;/strong&gt; formats hierarchically:&lt;/p&gt;

&lt;ol&gt;
	&lt;li&gt;Line (phrase),&lt;/li&gt;
	&lt;li&gt;syllable,&lt;/li&gt;
	&lt;li&gt;phoneme&lt;/li&gt;
&lt;/ol&gt;

&lt;p&gt;Singing units in pinyin and X-SAMPA have been annotated to a jingju&amp;nbsp;a cappella singing audio dataset.&lt;/p&gt;

&lt;p&gt;The corresponding audio files are a cappella singing aria recordings, which are stereo or mono, sampled at 44.1 kHz, and stored as .wav files. The .wav files were recorded by two institutes: files whose names end with &amp;lsquo;qm&amp;rsquo; were recorded by C4DM, Queen Mary University of London; the others, whose names end with &amp;lsquo;upf&amp;rsquo; or &amp;lsquo;lon&amp;rsquo;, were recorded by MTG-UPF. Additionally, another collection of 15 clean singing recordings is included in this dataset. They are extracted from commercial recordings which originally contain karaoke accompaniment and mixed versions.&lt;/p&gt;

&lt;p&gt;&lt;strong&gt;If you use this audio dataset in your work, please cite (1) this dataset as well as (2) the following publication:&lt;/strong&gt;&lt;/p&gt;

&lt;blockquote&gt;
&lt;p&gt;D. A. A. Black, M. Li, and M. Tian, &amp;ldquo;Automatic Identification of Emotional Cues in Chinese Opera Singing,&amp;rdquo; in 13th Int. Conf. on Music Perception and Cognition (ICMPC-2014), 2014, pp. 250&amp;ndash;255.&lt;/p&gt;
&lt;/blockquote&gt;

&lt;p&gt;&amp;nbsp;&lt;/p&gt;

&lt;p&gt;&lt;strong&gt;Details:&lt;/strong&gt;&lt;br&gt;
For the annotation format, units, parsing code and other information, please refer to &lt;a href="https://github.com/MTG/jingjuPhonemeAnnotation"&gt;https://github.com/MTG/jingjuPhonemeAnnotation&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;&lt;br&gt;
&lt;strong&gt;License:&lt;/strong&gt;&lt;br&gt;
Textgrid annotations are licensed under Creative Commons Attribution-NonCommercial&amp;nbsp;4.0 International License.&lt;/p&gt;

&lt;p&gt;Wav audio ending with &amp;lsquo;upf&amp;rsquo; or &amp;lsquo;lon&amp;rsquo; is licensed under&amp;nbsp;Creative Commons Attribution-NonCommercial&amp;nbsp;4.0 International.&lt;/p&gt;

&lt;p&gt;For the license of .wav audio ending with &amp;lsquo;qm&amp;rsquo; from C4DM Queen Mary University of London, please refer to this page &lt;a href="http://isophonics.org/SingingVoiceDataset"&gt;http://isophonics.org/SingingVoiceDataset&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;&lt;strong&gt;Contact information:&lt;/strong&gt;&lt;/p&gt;

&lt;p&gt;Rong Gong: rong&amp;lt;dot&amp;gt;gong&amp;lt;at&amp;gt;upf&amp;lt;dot&amp;gt;edu&lt;/p&gt;

&lt;p&gt;Rafael Caro Repetto: rafael&amp;lt;dot&amp;gt;caro&amp;lt;at&amp;gt;upf&amp;lt;dot&amp;gt;edu&lt;/p&gt;</subfield>
  </datafield>
  <datafield tag="773" ind1=" " ind2=" ">
    <subfield code="n">doi</subfield>
    <subfield code="i">isVersionOf</subfield>
    <subfield code="a">10.5281/zenodo.780559</subfield>
  </datafield>
  <datafield tag="024" ind1=" " ind2=" ">
    <subfield code="a">10.5281/zenodo.1244720</subfield>
    <subfield code="2">doi</subfield>
  </datafield>
  <datafield tag="980" ind1=" " ind2=" ">
    <subfield code="a">dataset</subfield>
  </datafield>
</record>
1,417
1,186
views
downloads
| | All versions | This version |
| Views | 1,417 | 24 |
| Downloads | 1,186 | 25 |
| Data volume | 619.2 GB | 3.1 GB |
| Unique views | 1,160 | 24 |
| Unique downloads | 304 | 4 |

Share

Cite as