Report Open Access

Intermediary topic modelling analysis results: Mapping the tech world using text mining methods

Kristóf Gyódi; Łukasz Nawaro; Michał Paliński


DCAT Export

<?xml version='1.0' encoding='utf-8'?>
<rdf:RDF xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:adms="http://www.w3.org/ns/adms#" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:dct="http://purl.org/dc/terms/" xmlns:dctype="http://purl.org/dc/dcmitype/" xmlns:dcat="http://www.w3.org/ns/dcat#" xmlns:duv="http://www.w3.org/ns/duv#" xmlns:foaf="http://xmlns.com/foaf/0.1/" xmlns:frapo="http://purl.org/cerif/frapo/" xmlns:geo="http://www.w3.org/2003/01/geo/wgs84_pos#" xmlns:gsp="http://www.opengis.net/ont/geosparql#" xmlns:locn="http://www.w3.org/ns/locn#" xmlns:org="http://www.w3.org/ns/org#" xmlns:owl="http://www.w3.org/2002/07/owl#" xmlns:prov="http://www.w3.org/ns/prov#" xmlns:rdfs="http://www.w3.org/2000/01/rdf-schema#" xmlns:schema="http://schema.org/" xmlns:skos="http://www.w3.org/2004/02/skos/core#" xmlns:vcard="http://www.w3.org/2006/vcard/ns#" xmlns:wdrs="http://www.w3.org/2007/05/powder-s#">
  <rdf:Description rdf:about="https://doi.org/10.5281/zenodo.5796271">
    <!-- Identifier of the described resource: the DOI URL, given as an xsd:anyURI literal. -->
    <dct:identifier rdf:datatype="http://www.w3.org/2001/XMLSchema#anyURI">https://doi.org/10.5281/zenodo.5796271</dct:identifier>
    <!-- foaf:page points at the same DOI URL that is used as the subject IRI and as the identifier. -->
    <foaf:page rdf:resource="https://doi.org/10.5281/zenodo.5796271"/>
    <!-- Creator: a foaf:Agent whose node IRI is an ORCID URL; the bare ORCID iD is repeated as an
         xsd:string identifier. The affiliation is a blank-node foaf:Organization that carries only
         a name (no IRI or identifier). -->
    <dct:creator>
      <rdf:Description rdf:about="http://orcid.org/0000-0003-2999-8444">
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <dct:identifier rdf:datatype="http://www.w3.org/2001/XMLSchema#string">0000-0003-2999-8444</dct:identifier>
        <foaf:name>Kristóf Gyódi</foaf:name>
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>University of Warsaw</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </rdf:Description>
    </dct:creator>
    <!-- Creator: a foaf:Agent whose node IRI is an ORCID URL; the bare ORCID iD is repeated as an
         xsd:string identifier. The affiliation is a blank-node foaf:Organization that carries only
         a name, so it is a separate node from any other organization node with the same name. -->
    <dct:creator>
      <rdf:Description rdf:about="http://orcid.org/0000-0003-1995-4894">
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <dct:identifier rdf:datatype="http://www.w3.org/2001/XMLSchema#string">0000-0003-1995-4894</dct:identifier>
        <foaf:name>Łukasz Nawaro</foaf:name>
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>University of Warsaw</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </rdf:Description>
    </dct:creator>
    <!-- Creator: a foaf:Agent whose node IRI is an ORCID URL; the bare ORCID iD is repeated as an
         xsd:string identifier. The affiliation is a blank-node foaf:Organization that carries only
         a name (no IRI or identifier). -->
    <dct:creator>
      <rdf:Description rdf:about="http://orcid.org/0000-0002-0075-3585">
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <dct:identifier rdf:datatype="http://www.w3.org/2001/XMLSchema#string">0000-0002-0075-3585</dct:identifier>
        <foaf:name>Michał Paliński</foaf:name>
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>University of Warsaw</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </rdf:Description>
    </dct:creator>
    <!-- Title of the described resource, as a plain literal with no language tag. -->
    <dct:title>Intermediary topic modelling analysis results: Mapping the tech world using text mining methods</dct:title>
    <!-- Publisher is a blank-node foaf:Agent identified only by its name. -->
    <dct:publisher>
      <foaf:Agent>
        <foaf:name>Zenodo</foaf:name>
      </foaf:Agent>
    </dct:publisher>
    <!-- Year-only issue date (xsd:gYear); a second dct:issued with a full xsd:date value appears
         further down in this description. -->
    <dct:issued rdf:datatype="http://www.w3.org/2001/XMLSchema#gYear">2021</dct:issued>
    <!-- One dcat:keyword per term, so that each keyword is its own literal instead of a single
         comma-joined string that every consumer would have to split. -->
    <dcat:keyword>Human-centric</dcat:keyword>
    <dcat:keyword>future</dcat:keyword>
    <dcat:keyword>technology</dcat:keyword>
    <dcat:keyword>data-driven</dcat:keyword>
    <dcat:keyword>policy</dcat:keyword>
    <dcat:keyword>collective intelligence</dcat:keyword>
    <dcat:keyword>news</dcat:keyword>
    <!-- Links this record to a grant by its info:eu-repo grantAgreement IRI; a foaf:Project node
         with the same IRI is described at the end of this document. -->
    <frapo:isFundedBy rdf:resource="info:eu-repo/grantAgreement/EC/H2020/825652/"/>
    <!-- Funder as a blank-node foaf:Organization with a name and a string identifier.
         NOTE(review): the identifier has the shape of a DOI (presumably a funder registry ID); confirm. -->
    <schema:funder>
      <foaf:Organization>
        <dct:identifier rdf:datatype="http://www.w3.org/2001/XMLSchema#string">10.13039/100010661</dct:identifier>
        <foaf:name>European Commission</foaf:name>
      </foaf:Organization>
    </schema:funder>
    <!-- Full issue date (xsd:date); this is in addition to the year-only dct:issued (xsd:gYear)
         value given earlier in this description. -->
    <dct:issued rdf:datatype="http://www.w3.org/2001/XMLSchema#date">2021-12-21</dct:issued>
    <!-- Asserts that the Zenodo record URL denotes the same resource as the DOI subject IRI. -->
    <owl:sameAs rdf:resource="https://zenodo.org/record/5796271"/>
    <!-- Secondary identifier as a blank-node adms:Identifier: the Zenodo record URL is the
         skos:notation (typed xsd:anyURI) and the scheme agency is the plain literal "url". -->
    <adms:identifier>
      <adms:Identifier>
        <skos:notation rdf:datatype="http://www.w3.org/2001/XMLSchema#anyURI">https://zenodo.org/record/5796271</skos:notation>
        <adms:schemeAgency>url</adms:schemeAgency>
      </adms:Identifier>
    </adms:identifier>
    <!-- Declares this record a version of another DOI; the target ends in 5796270, whereas this
         record's own DOI ends in 5796271. -->
    <dct:isVersionOf rdf:resource="https://doi.org/10.5281/zenodo.5796270"/>
    <!-- Declares this record part of the resource at the zenodo.org communities URL "ngi_forward". -->
    <dct:isPartOf rdf:resource="https://zenodo.org/communities/ngi_forward"/>
    <!-- Abstract stored as entity-escaped HTML paragraph markup: after XML parsing the literal
         value is an HTML string, not child elements. -->
    <dct:description>&lt;p&gt;This study presents an innovative methodology for analysing technology news using various text mining methods. News articles provide a rich source of information to track promising emerging technologies, relevant social challenges or policy issues. Our goal is to support the Next Generation Internet initiative by providing data-science tools to map and analyse the developments of the tech world.&lt;/p&gt; &lt;p&gt;Based on more than 200 000 articles from major media outlets, we are going to identify widely discussed topics, focusing on emerging technologies and policy issues and dive deeper in selected areas and highlight key focal points of recent developments.&lt;/p&gt; &lt;p&gt;To meet these goals, a number of machine learning techniques are combined. The major steps can be summarised as follows:&lt;/p&gt; &lt;p&gt;● 17 general umbrella topics are explored&lt;/p&gt; &lt;p&gt;● 5 topics are selected for further analysis&lt;/p&gt; &lt;p&gt;● Deep dives are presented with 2D interactive maps&lt;/p&gt; &lt;p&gt;More specifically, the topics selected for the deep dives are:&lt;/p&gt; &lt;p&gt;1. AI and Robots&lt;/p&gt; &lt;p&gt;2. Policy (sums up 3 relevant areas)&lt;/p&gt; &lt;p&gt;3. Media&lt;/p&gt; &lt;p&gt;4. Business&lt;/p&gt; &lt;p&gt;5. Cybersecurity&lt;/p&gt; &lt;p&gt;With the Policy topic grouping together 3 areas: Social media crisis, Privacy and 5G.&lt;/p&gt;</dct:description>
    <!-- Access rights are stated twice. First form: a publications.europa.eu access-right
         authority IRI whose last path segment is PUBLIC. -->
    <dct:accessRights rdf:resource="http://publications.europa.eu/resource/authority/access-right/PUBLIC"/>
    <!-- Second form: a dct:RightsStatement node with the info:eu-repo openAccess IRI and a
         human-readable label. -->
    <dct:accessRights>
      <dct:RightsStatement rdf:about="info:eu-repo/semantics/openAccess">
        <rdfs:label>Open Access</rdfs:label>
      </dct:RightsStatement>
    </dct:accessRights>
    <!-- Licence given as the IRI of the Creative Commons BY 4.0 legal code page. -->
    <dct:license rdf:resource="https://creativecommons.org/licenses/by/4.0/legalcode"/>
    <!-- The single distribution of this record: one PDF file.
         accessURL is the DOI; downloadURL is the direct link to the file on zenodo.org.
         The spaces in the file name are percent-encoded (%20) because rdf:resource must hold a
         valid IRI reference, and a raw space is not allowed in an IRI. -->
    <dcat:distribution>
      <dcat:Distribution>
        <dcat:accessURL rdf:resource="https://doi.org/10.5281/zenodo.5796271"/>
        <dcat:byteSize>975366</dcat:byteSize>
        <dcat:downloadURL rdf:resource="https://zenodo.org/record/5796271/files/D1.5_Mapping%20the%20tech%20world%20using%20text%20mining%20methods.pdf"/>
        <dcat:mediaType>application/pdf</dcat:mediaType>
      </dcat:Distribution>
    </dcat:distribution>
  </rdf:Description>
  <!-- Grant node, using the same info:eu-repo grantAgreement IRI that the record references via
       frapo:isFundedBy. It carries the identifier 825652 (also the last segment of the IRI), a
       title, and the awarding body as a blank-node foaf:Organization with a name and identifier. -->
  <foaf:Project rdf:about="info:eu-repo/grantAgreement/EC/H2020/825652/">
    <dct:identifier rdf:datatype="http://www.w3.org/2001/XMLSchema#string">825652</dct:identifier>
    <dct:title>NGI FORWARD</dct:title>
    <frapo:isAwardedBy>
      <foaf:Organization>
        <dct:identifier rdf:datatype="http://www.w3.org/2001/XMLSchema#string">10.13039/100010661</dct:identifier>
        <foaf:name>European Commission</foaf:name>
      </foaf:Organization>
    </frapo:isAwardedBy>
  </foaf:Project>
</rdf:RDF>
66 views
26 downloads
                   All versions   This version
Views              66             66
Downloads          26             26
Data volume        25.4 MB        25.4 MB
Unique views       57             57
Unique downloads   23             23

Share

Cite as