Journal article Open Access

2018 YPIC Challenge: A case study in characterizing an unknown protein sample

Pino, Lindsay; Lin, Andy; Bittremieux, Wout


DCAT Export

<?xml version='1.0' encoding='utf-8'?>
<!--
  RDF/XML (DCAT) description of the Zenodo record https://zenodo.org/record/3551499.
  A single top-level rdf:Description carries all properties of the record:
  identifiers, three creators, title, publisher, issue dates, description,
  access rights, license and one distribution (a PDF file).

  Prefixes actually used below: rdf, rdfs, adms, dcat, dct, foaf, org, owl, skos.
  The other prefixes declared on the root (dc, dctype, duv, frapo, geo, gsp, locn,
  prov, schema, vcard, wdrs) are not referenced anywhere inside this element.
-->
<rdf:RDF xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:adms="http://www.w3.org/ns/adms#" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:dct="http://purl.org/dc/terms/" xmlns:dctype="http://purl.org/dc/dcmitype/" xmlns:dcat="http://www.w3.org/ns/dcat#" xmlns:duv="http://www.w3.org/ns/duv#" xmlns:foaf="http://xmlns.com/foaf/0.1/" xmlns:frapo="http://purl.org/cerif/frapo/" xmlns:geo="http://www.w3.org/2003/01/geo/wgs84_pos#" xmlns:gsp="http://www.opengis.net/ont/geosparql#" xmlns:locn="http://www.w3.org/ns/locn#" xmlns:org="http://www.w3.org/ns/org#" xmlns:owl="http://www.w3.org/2002/07/owl#" xmlns:prov="http://www.w3.org/ns/prov#" xmlns:rdfs="http://www.w3.org/2000/01/rdf-schema#" xmlns:schema="http://schema.org/" xmlns:skos="http://www.w3.org/2004/02/skos/core#" xmlns:vcard="http://www.w3.org/2006/vcard/ns#" xmlns:wdrs="http://www.w3.org/2007/05/powder-s#">
  <!-- Subject of every statement below: the record's landing-page URL.
       NOTE(review): no rdf:type is given for this node (e.g. a DCAT or
       bibliographic class); confirm whether consumers expect one. -->
  <rdf:Description rdf:about="https://zenodo.org/record/3551499">
    <!-- The record URL is repeated as a typed identifier and as its foaf:page. -->
    <dct:identifier rdf:datatype="http://www.w3.org/2001/XMLSchema#anyURI">https://zenodo.org/record/3551499</dct:identifier>
    <foaf:page rdf:resource="https://zenodo.org/record/3551499"/>
    <!-- Creators, in document order. Each is a foaf:Agent whose node URI is an
         ORCID URI (http scheme), with the bare ORCID as dct:identifier, the name
         in "Family, Given" form plus split given/family parts, and an anonymous
         foaf:Organization holding the affiliation as one free-text string.
         All three creators carry the same affiliation string. -->
    <dct:creator>
      <rdf:Description rdf:about="http://orcid.org/0000-0003-1857-7222">
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <dct:identifier rdf:datatype="http://www.w3.org/2001/XMLSchema#string">0000-0003-1857-7222</dct:identifier>
        <foaf:name>Pino, Lindsay</foaf:name>
        <foaf:givenName>Lindsay</foaf:givenName>
        <foaf:familyName>Pino</foaf:familyName>
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>Department of Genome Sciences, University of Washington, Seattle WA 98195, USA</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </rdf:Description>
    </dct:creator>
    <dct:creator>
      <rdf:Description rdf:about="http://orcid.org/0000-0003-0072-612X">
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <dct:identifier rdf:datatype="http://www.w3.org/2001/XMLSchema#string">0000-0003-0072-612X</dct:identifier>
        <foaf:name>Lin, Andy</foaf:name>
        <foaf:givenName>Andy</foaf:givenName>
        <foaf:familyName>Lin</foaf:familyName>
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>Department of Genome Sciences, University of Washington, Seattle WA 98195, USA</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </rdf:Description>
    </dct:creator>
    <dct:creator>
      <rdf:Description rdf:about="http://orcid.org/0000-0002-3105-1359">
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <dct:identifier rdf:datatype="http://www.w3.org/2001/XMLSchema#string">0000-0002-3105-1359</dct:identifier>
        <foaf:name>Bittremieux, Wout</foaf:name>
        <foaf:givenName>Wout</foaf:givenName>
        <foaf:familyName>Bittremieux</foaf:familyName>
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>Department of Genome Sciences, University of Washington, Seattle WA 98195, USA</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </rdf:Description>
    </dct:creator>
    <dct:title>2018 YPIC Challenge: A case study in characterizing an unknown protein sample</dct:title>
    <!-- Publisher is an anonymous foaf:Agent identified only by name. -->
    <dct:publisher>
      <foaf:Agent>
        <foaf:name>Zenodo</foaf:name>
      </foaf:Agent>
    </dct:publisher>
    <!-- dct:issued appears twice on purpose-looking grounds: once as an xsd:gYear
         and once as a full xsd:date. Readers that expect a single value must
         pick one by datatype. -->
    <dct:issued rdf:datatype="http://www.w3.org/2001/XMLSchema#gYear">2019</dct:issued>
    <dct:issued rdf:datatype="http://www.w3.org/2001/XMLSchema#date">2019-09-26</dct:issued>
    <!-- This owl:sameAs points at the subject's own URI, so it adds no new
         information; the second owl:sameAs further down links the DOI. -->
    <owl:sameAs rdf:resource="https://zenodo.org/record/3551499"/>
    <!-- ADMS form of the same record URL; the scheme agency is the literal "url". -->
    <adms:identifier>
      <adms:Identifier>
        <skos:notation rdf:datatype="http://www.w3.org/2001/XMLSchema#anyURI">https://zenodo.org/record/3551499</skos:notation>
        <adms:schemeAgency>url</adms:schemeAgency>
      </adms:Identifier>
    </adms:identifier>
    <owl:sameAs rdf:resource="https://doi.org/10.1021/acs.jproteome.9b00384"/>
    <!-- The description's text content is HTML source carried as an escaped
         string: after XML parsing it contains literal <p> tags and the HTML
         character references "&#39;" and "&copy;" (their ampersands are escaped
         here), so a consumer must HTML-decode it separately to get plain text.
         The element is kept on one line because any added whitespace would
         become part of the literal. -->
    <dct:description>&lt;p&gt;For the 2018 YPIC Challenge, contestants were invited to try to decipher two unknown English questions encoded by a synthetic protein expressed in Escherichia coli. In addition to deciphering the sentence, contestants were asked to determine the three-dimensional structure and detect any post-translation modifications left by the host organism. We present our experimental and computational strategy to characterize this sample by identifying the unknown protein sequence and detecting the presence of post-translational modifications. The sample was acquired with dynamic exclusion disabled to increase the signal-to-noise ratio of the measured molecules, after which spectral clustering was used to generate high-quality consensus spectra. De novo spectrum identification was used to determine the synthetic protein sequence, and any post-translational modifications introduced by E. coli on the synthetic protein were analyzed via spectral networking. This workflow resulted in a de novo sequence coverage of 70%, on par with sequence database searching performance. Additionally, the spectral networking analysis indicated that no systematic modifications were introduced on the synthetic protein by E. coli. The strategy presented here can be directly used to analyze samples for which no protein sequence information is available or when the identity of the sample is unknown. All software and code to perform the bioinformatics analysis is available as open source, and self-contained Jupyter notebooks are provided to fully recreate the analysis.&lt;/p&gt; &lt;p&gt;This document is the unedited Author&amp;#39;s version of a Submitted Work that was subsequently accepted for publication in the Journal of Proteome Research, copyright &amp;copy; American Chemical Society after peer review. To access the final edited and published work see https://pubs.acs.org/articlesonrequest/AOR-gV4SwwddkH9NagGMX6bP.&lt;/p&gt;</dct:description>
    <!-- Access rights are stated twice: as a reference to the EU Publications
         Office "PUBLIC" authority entry, and as an info:eu-repo openAccess
         rights statement labelled "Open Access". -->
    <dct:accessRights rdf:resource="http://publications.europa.eu/resource/authority/access-right/PUBLIC"/>
    <dct:accessRights>
      <dct:RightsStatement rdf:about="info:eu-repo/semantics/openAccess">
        <rdfs:label>Open Access</rdfs:label>
      </dct:RightsStatement>
    </dct:accessRights>
    <dct:license rdf:resource="https://creativecommons.org/licenses/by/4.0/legalcode"/>
    <!-- Single distribution. accessURL is the DOI link, while downloadURL is the
         PDF file under the Zenodo record. byteSize and mediaType are plain
         literals with no rdf:datatype or resource URI.
         NOTE(review): the DCAT vocabulary describes byteSize as a typed numeric
         literal and mediaType as a media-type resource; confirm against the
         target DCAT profile before relying on these values as typed data. -->
    <dcat:distribution>
      <dcat:Distribution>
        <dcat:accessURL rdf:resource="https://doi.org/10.1021/acs.jproteome.9b00384"/>
        <dcat:byteSize>826918</dcat:byteSize>
        <dcat:downloadURL rdf:resource="https://zenodo.org/record/3551499/files/Pino2019.pdf"/>
        <dcat:mediaType>application/pdf</dcat:mediaType>
      </dcat:Distribution>
    </dcat:distribution>
  </rdf:Description>
</rdf:RDF>
73
44
views
downloads
Views 73
Downloads 44
Data volume 36.4 MB
Unique views 71
Unique downloads 44

Share

Cite as