There is a newer version of this record available.

Software Open Access

quanteda/quanteda: CRAN v1.5.0

Kenneth Benoit; Kohei Watanabe; Haiyan Wang; Paul Nulty; Adam Obeng; Stefan Müller; Jiong Wei Lua; Aki Matsuo; Christian Mueller; Will Lowe; Pablo Barberá; Tyler Rinker; mark padgham; Christopher Gandrud; José Tomás Atria; Tom Paskhalis; nicmer; lindbrook; hofaichan; etienne-s; hotzeplotz; Thomas J. Leeper; Stas Malavin; Michael W. Kearney; Michael Chirico; Katrin Leinweber; Johannes Gruber


DCAT Export

<?xml version='1.0' encoding='utf-8'?>
<rdf:RDF xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:adms="http://www.w3.org/ns/adms#" xmlns:cnt="http://www.w3.org/2011/content#" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:dct="http://purl.org/dc/terms/" xmlns:dctype="http://purl.org/dc/dcmitype/" xmlns:dcat="http://www.w3.org/ns/dcat#" xmlns:duv="http://www.w3.org/ns/duv#" xmlns:foaf="http://xmlns.com/foaf/0.1/" xmlns:frapo="http://purl.org/cerif/frapo/" xmlns:geo="http://www.w3.org/2003/01/geo/wgs84_pos#" xmlns:gsp="http://www.opengis.net/ont/geosparql#" xmlns:locn="http://www.w3.org/ns/locn#" xmlns:org="http://www.w3.org/ns/org#" xmlns:owl="http://www.w3.org/2002/07/owl#" xmlns:prov="http://www.w3.org/ns/prov#" xmlns:rdfs="http://www.w3.org/2000/01/rdf-schema#" xmlns:schema="http://schema.org/" xmlns:skos="http://www.w3.org/2004/02/skos/core#" xmlns:vcard="http://www.w3.org/2006/vcard/ns#" xmlns:wdrs="http://www.w3.org/2007/05/powder-s#">
  <rdf:Description rdf:about="https://doi.org/10.5281/zenodo.3268686">
    <rdf:type rdf:resource="http://www.w3.org/ns/dcat#Dataset"/>
    <dct:type rdf:resource="http://purl.org/dc/dcmitype/Software"/>
    <dct:identifier rdf:datatype="http://www.w3.org/2001/XMLSchema#anyURI">https://doi.org/10.5281/zenodo.3268686</dct:identifier>
    <foaf:page rdf:resource="https://doi.org/10.5281/zenodo.3268686"/>
    <dct:creator>
      <rdf:Description>
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <foaf:name>Kenneth Benoit</foaf:name>
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>London School of Economics and Political Science</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </rdf:Description>
    </dct:creator>
    <dct:creator>
      <rdf:Description>
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <foaf:name>Kohei Watanabe</foaf:name>
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>Waseda University</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </rdf:Description>
    </dct:creator>
    <dct:creator>
      <rdf:Description>
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <foaf:name>Haiyan Wang</foaf:name>
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>Tracr</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </rdf:Description>
    </dct:creator>
    <dct:creator>
      <rdf:Description>
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <foaf:name>Paul Nulty</foaf:name>
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>University College Dublin</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </rdf:Description>
    </dct:creator>
    <dct:creator>
      <rdf:Description>
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <foaf:name>Adam Obeng</foaf:name>
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>Columbia University, London School of Economics</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </rdf:Description>
    </dct:creator>
    <dct:creator>
      <rdf:Description>
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <foaf:name>Stefan Müller</foaf:name>
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>University of Zurich</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </rdf:Description>
    </dct:creator>
    <dct:creator>
      <rdf:Description>
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <foaf:name>Jiong Wei Lua</foaf:name>
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>London School of Economics</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </rdf:Description>
    </dct:creator>
    <dct:creator>
      <rdf:Description>
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <foaf:name>Aki Matsuo</foaf:name>
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>Institute for Analytics and Data Science, University of Essex</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </rdf:Description>
    </dct:creator>
    <dct:creator>
      <rdf:Description>
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <foaf:name>Christian Mueller</foaf:name>
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>London School of Economics and Political Science</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </rdf:Description>
    </dct:creator>
    <dct:creator>
      <rdf:Description>
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <foaf:name>Will Lowe</foaf:name>
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>Princeton University</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </rdf:Description>
    </dct:creator>
    <dct:creator>
      <rdf:Description>
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <foaf:name>Pablo Barberá</foaf:name>
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>University of Southern California</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </rdf:Description>
    </dct:creator>
    <dct:creator>
      <rdf:Description>
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <foaf:name>Tyler Rinker</foaf:name>
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>Campus Labs</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </rdf:Description>
    </dct:creator>
    <dct:creator>
      <rdf:Description>
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <foaf:name>mark padgham</foaf:name>
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>@ATFutures</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </rdf:Description>
    </dct:creator>
    <dct:creator>
      <rdf:Description>
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <foaf:name>Christopher Gandrud</foaf:name>
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>@zalando</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </rdf:Description>
    </dct:creator>
    <dct:creator>
      <rdf:Description>
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <foaf:name>José Tomás Atria</foaf:name>
      </rdf:Description>
    </dct:creator>
    <dct:creator>
      <rdf:Description>
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <foaf:name>Tom Paskhalis</foaf:name>
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>London School of Economics and Political Science</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </rdf:Description>
    </dct:creator>
    <dct:creator>
      <rdf:Description>
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <foaf:name>nicmer</foaf:name>
      </rdf:Description>
    </dct:creator>
    <dct:creator>
      <rdf:Description>
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <foaf:name>lindbrook</foaf:name>
      </rdf:Description>
    </dct:creator>
    <dct:creator>
      <rdf:Description>
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <foaf:name>hofaichan</foaf:name>
      </rdf:Description>
    </dct:creator>
    <dct:creator>
      <rdf:Description>
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <foaf:name>etienne-s</foaf:name>
      </rdf:Description>
    </dct:creator>
    <dct:creator>
      <rdf:Description>
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <foaf:name>hotzeplotz</foaf:name>
      </rdf:Description>
    </dct:creator>
    <dct:creator>
      <rdf:Description>
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <foaf:name>Thomas J. Leeper</foaf:name>
      </rdf:Description>
    </dct:creator>
    <dct:creator>
      <rdf:Description>
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <foaf:name>Stas Malavin</foaf:name>
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>Soil Cryology Lab</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </rdf:Description>
    </dct:creator>
    <dct:creator>
      <rdf:Description>
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <foaf:name>Michael W. Kearney</foaf:name>
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>@MUDSA</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </rdf:Description>
    </dct:creator>
    <dct:creator>
      <rdf:Description>
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <foaf:name>Michael Chirico</foaf:name>
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>@myteksi</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </rdf:Description>
    </dct:creator>
    <dct:creator>
      <rdf:Description>
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <foaf:name>Katrin Leinweber</foaf:name>
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>@TIBHannover</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </rdf:Description>
    </dct:creator>
    <dct:creator>
      <rdf:Description>
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <foaf:name>Johannes Gruber</foaf:name>
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>University of Glasgow</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </rdf:Description>
    </dct:creator>
    <dct:title>quanteda/quanteda: CRAN v1.5.0</dct:title>
    <dct:publisher>
      <foaf:Agent>
        <foaf:name>Zenodo</foaf:name>
      </foaf:Agent>
    </dct:publisher>
    <dct:issued rdf:datatype="http://www.w3.org/2001/XMLSchema#gYear">2019</dct:issued>
    <dct:issued rdf:datatype="http://www.w3.org/2001/XMLSchema#date">2019-07-04</dct:issued>
    <owl:sameAs rdf:resource="https://zenodo.org/record/3268686"/>
    <adms:identifier>
      <adms:Identifier>
        <skos:notation rdf:datatype="http://www.w3.org/2001/XMLSchema#anyURI">https://zenodo.org/record/3268686</skos:notation>
      </adms:Identifier>
    </adms:identifier>
    <dct:relation rdf:resource="https://github.com/quanteda/quanteda/tree/v1.5.0"/>
    <dct:isVersionOf rdf:resource="https://doi.org/10.5281/zenodo.596731"/>
    <owl:versionInfo>v1.5.0</owl:versionInfo>
    <dct:description>New features &lt;ul&gt; &lt;li&gt;Add &lt;code&gt;flatten&lt;/code&gt; and &lt;code&gt;levels&lt;/code&gt; arguments to &lt;code&gt;as.list.dictionary2()&lt;/code&gt; to enable more flexible conversion of dictionary objects. (#1661)&lt;/li&gt; &lt;li&gt;In &lt;code&gt;corpus_sample()&lt;/code&gt;, the &lt;code&gt;size&lt;/code&gt; now works with the &lt;code&gt;by&lt;/code&gt; argument, to control the size of units sampled from each group.&lt;/li&gt; &lt;li&gt;Improvements to &lt;code&gt;textstat_dist()&lt;/code&gt; and &lt;code&gt;textstat_simil()&lt;/code&gt;, see below.&lt;/li&gt; &lt;li&gt;Long tokens are not discarded automatically in the call to &lt;code&gt;tokens()&lt;/code&gt;. (#1713)&lt;/li&gt; &lt;/ul&gt; Behaviour changes &lt;ul&gt; &lt;li&gt;&lt;code&gt;textstat_dist()&lt;/code&gt; and &lt;code&gt;textstat_simil()&lt;/code&gt; now return sparse symmetric matrix objects using classes from the &lt;strong&gt;Matrix&lt;/strong&gt; package. This replaces the former structure based on the &lt;code&gt;dist&lt;/code&gt; class. Computation of these classes is now also based on the fast implementation in the &lt;strong&gt;proxyC&lt;/strong&gt; package. When computing similarities, the new &lt;code&gt;min_simil&lt;/code&gt; argument allows a user to ignore certain values below a specified similarity threshold. A new coercion method &lt;code&gt;as.data.frame.textstat_simildist()&lt;/code&gt; now exists for converting these returns into a data.frame of pairwise comparisons. Existing methods such as &lt;code&gt;as.matrix()&lt;/code&gt;, &lt;code&gt;as.dist()&lt;/code&gt;, and &lt;code&gt;as.list()&lt;/code&gt; work as they did before.&lt;/li&gt; &lt;li&gt;We have removed the "faith", "chi-squared", and "kullback" methods from &lt;code&gt;textstat_dist()&lt;/code&gt; and &lt;code&gt;textstat_simil()&lt;/code&gt; because these were either not symmetric or not invariant to document or feature ordering. 
Finally, the &lt;code&gt;selection&lt;/code&gt; argument has been deprecated in favour of a new &lt;code&gt;y&lt;/code&gt; argument. &lt;/li&gt; &lt;li&gt;&lt;code&gt;textstat_readability()&lt;/code&gt; now defaults to &lt;code&gt;measure = "Flesch"&lt;/code&gt; if no measure is supplied. This makes it consistent with &lt;code&gt;textstat_lexdiv()&lt;/code&gt; that also takes a default measure ("TTR") if none is supplied. (#1715)&lt;/li&gt; &lt;li&gt;The default values for &lt;code&gt;max_nchar&lt;/code&gt; and &lt;code&gt;min_nchar&lt;/code&gt; in &lt;code&gt;tokens_select()&lt;/code&gt; are now NULL, meaning they are not applied if the user does not supply values. Fixes #1713.&lt;/li&gt; &lt;/ul&gt; Bug fixes and stability enhancements &lt;ul&gt; &lt;li&gt;&lt;code&gt;kwic.corpus()&lt;/code&gt; and &lt;code&gt;kwic.tokens()&lt;/code&gt; behaviour now aligned, meaning that dictionaries are correctly faceted by key instead of by value. (#1684)&lt;/li&gt; &lt;li&gt;Improved formatting of &lt;code&gt;tokens()&lt;/code&gt; verbose output. (#1683)&lt;/li&gt; &lt;li&gt;Subsetting and printing of subsetted kwic objects is more robust. (#1665)&lt;/li&gt; &lt;li&gt;The "Bormuth" and "DRP" measures are now fixed for &lt;code&gt;textstat_readability()&lt;/code&gt;. (#1701)&lt;/li&gt; &lt;/ul&gt;</dct:description>
    <dct:accessRights rdf:resource="http://publications.europa.eu/resource/authority/access-right/PUBLIC"/>
    <dct:accessRights>
      <dct:RightsStatement rdf:about="info:eu-repo/semantics/openAccess">
        <rdfs:label>Open Access</rdfs:label>
      </dct:RightsStatement>
    </dct:accessRights>
    <dcat:distribution>
      <dcat:Distribution>
        <dcat:accessURL rdf:resource="https://doi.org/10.5281/zenodo.3268686"/>
      </dcat:Distribution>
    </dcat:distribution>
  </rdf:Description>
</rdf:RDF>
671 views
135 downloads
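|                  | All versions | This version |
|------------------|--------------|--------------|
| Views            | 671          | 15           |
| Downloads        | 135          | 2            |
| Data volume      | 3.7 GB       | 74.1 MB      |
| Unique views     | 627          | 15           |
| Unique downloads | 52           | 2            |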

Share

Cite as