Dataset Open Access

A web tracking data set of online browsing behavior of 2,148 users

Kulshrestha, Juhi; Oliveira, Marcos; Karacalik, Orkut; Bonnay, Denis; Wagner, Claudia


DCAT Export

<?xml version='1.0' encoding='utf-8'?>
<rdf:RDF xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:adms="http://www.w3.org/ns/adms#" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:dct="http://purl.org/dc/terms/" xmlns:dctype="http://purl.org/dc/dcmitype/" xmlns:dcat="http://www.w3.org/ns/dcat#" xmlns:duv="http://www.w3.org/ns/duv#" xmlns:foaf="http://xmlns.com/foaf/0.1/" xmlns:frapo="http://purl.org/cerif/frapo/" xmlns:geo="http://www.w3.org/2003/01/geo/wgs84_pos#" xmlns:gsp="http://www.opengis.net/ont/geosparql#" xmlns:locn="http://www.w3.org/ns/locn#" xmlns:org="http://www.w3.org/ns/org#" xmlns:owl="http://www.w3.org/2002/07/owl#" xmlns:prov="http://www.w3.org/ns/prov#" xmlns:rdfs="http://www.w3.org/2000/01/rdf-schema#" xmlns:schema="http://schema.org/" xmlns:skos="http://www.w3.org/2004/02/skos/core#" xmlns:vcard="http://www.w3.org/2006/vcard/ns#" xmlns:wdrs="http://www.w3.org/2007/05/powder-s#">
  <rdf:Description rdf:about="https://doi.org/10.5281/zenodo.4757574">
    <!-- Identity of the record: typed as a DCAT dataset and a DCMI Dataset; the DOI URL serves as subject, identifier and landing page. -->
    <rdf:type rdf:resource="http://www.w3.org/ns/dcat#Dataset"/>
    <dct:type rdf:resource="http://purl.org/dc/dcmitype/Dataset"/>
    <dct:identifier rdf:datatype="http://www.w3.org/2001/XMLSchema#anyURI">https://doi.org/10.5281/zenodo.4757574</dct:identifier>
    <foaf:page rdf:resource="https://doi.org/10.5281/zenodo.4757574"/>
    <!-- Creator identified by an ORCID URI; the bare ORCID iD is repeated as a string identifier. -->
    <dct:creator>
      <rdf:Description rdf:about="http://orcid.org/0000-0002-4375-4641">
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <dct:identifier rdf:datatype="http://www.w3.org/2001/XMLSchema#string">0000-0002-4375-4641</dct:identifier>
        <foaf:name>Kulshrestha, Juhi</foaf:name>
        <foaf:givenName>Juhi</foaf:givenName>
        <foaf:familyName>Kulshrestha</foaf:familyName>
        <!-- Affiliation is an anonymous organization node carrying only a name. -->
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>GESIS - Leibniz Institute for the Social Sciences, Germany</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </rdf:Description>
    </dct:creator>
    <!-- Creator identified by an ORCID URI; the bare ORCID iD is repeated as a string identifier. -->
    <dct:creator>
      <rdf:Description rdf:about="http://orcid.org/0000-0003-3407-5361">
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <dct:identifier rdf:datatype="http://www.w3.org/2001/XMLSchema#string">0000-0003-3407-5361</dct:identifier>
        <foaf:name>Oliveira, Marcos</foaf:name>
        <foaf:givenName>Marcos</foaf:givenName>
        <foaf:familyName>Oliveira</foaf:familyName>
        <!-- Affiliation is an anonymous organization node carrying only a name. -->
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>GESIS - Leibniz Institute for the Social Sciences, Germany</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </rdf:Description>
    </dct:creator>
    <!-- Creator described as a blank node: no rdf:about and no identifier is given for this person. -->
    <dct:creator>
      <rdf:Description>
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <foaf:name>Karacalik, Orkut</foaf:name>
        <foaf:givenName>Orkut</foaf:givenName>
        <foaf:familyName>Karacalik</foaf:familyName>
        <!-- Affiliation is an anonymous organization node carrying only a name. -->
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>GESIS - Leibniz Institute for the Social Sciences, Germany</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </rdf:Description>
    </dct:creator>
    <!-- Creator described as a blank node: no rdf:about and no identifier is given for this person. -->
    <dct:creator>
      <rdf:Description>
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <foaf:name>Bonnay, Denis</foaf:name>
        <foaf:givenName>Denis</foaf:givenName>
        <foaf:familyName>Bonnay</foaf:familyName>
        <!-- Affiliation is an anonymous organization node carrying only a name. -->
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>Université Paris Nanterre, France</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </rdf:Description>
    </dct:creator>
    <!-- Creator described as a blank node: no rdf:about and no identifier is given for this person. -->
    <dct:creator>
      <rdf:Description>
        <rdf:type rdf:resource="http://xmlns.com/foaf/0.1/Agent"/>
        <foaf:name>Wagner, Claudia</foaf:name>
        <foaf:givenName>Claudia</foaf:givenName>
        <foaf:familyName>Wagner</foaf:familyName>
        <!-- Affiliation is an anonymous organization node carrying only a name. -->
        <org:memberOf>
          <foaf:Organization>
            <foaf:name>GESIS - Leibniz Institute for the Social Sciences, Germany</foaf:name>
          </foaf:Organization>
        </org:memberOf>
      </rdf:Description>
    </dct:creator>
    <!-- Descriptive metadata: title, publisher, issue dates, keywords and the equivalent Zenodo record URL. -->
    <dct:title>A web tracking data set of online browsing behavior of 2,148 users</dct:title>
    <!-- Publisher is an anonymous agent carrying only a name. -->
    <dct:publisher>
      <foaf:Agent>
        <foaf:name>Zenodo</foaf:name>
      </foaf:Agent>
    </dct:publisher>
    <!-- dct:issued appears twice in this record: here as a gYear, and further down as a full xsd:date. -->
    <dct:issued rdf:datatype="http://www.w3.org/2001/XMLSchema#gYear">2020</dct:issued>
    <dcat:keyword>online behavior</dcat:keyword>
    <dcat:keyword>web browsing behavior</dcat:keyword>
    <dcat:keyword>web tracking</dcat:keyword>
    <dcat:keyword>panel data</dcat:keyword>
    <dcat:keyword>demographics</dcat:keyword>
    <!-- Second dct:issued value, with day precision. -->
    <dct:issued rdf:datatype="http://www.w3.org/2001/XMLSchema#date">2020-12-30</dct:issued>
    <!-- The Zenodo record URL is declared to denote the same resource as the DOI subject. -->
    <owl:sameAs rdf:resource="https://zenodo.org/record/4757574"/>
    <!-- Alternate identifier: the Zenodo record URL as an ADMS identifier, with "url" recorded in adms:schemeAgency. -->
    <adms:identifier>
      <adms:Identifier>
        <skos:notation rdf:datatype="http://www.w3.org/2001/XMLSchema#anyURI">https://zenodo.org/record/4757574</skos:notation>
        <adms:schemeAgency>url</adms:schemeAgency>
      </adms:Identifier>
    </adms:identifier>
    <!-- Versioning: this record is a version of DOI 10.5281/zenodo.4383163 and is labelled "v1". -->
    <dct:isVersionOf rdf:resource="https://doi.org/10.5281/zenodo.4383163"/>
    <owl:versionInfo>v1</owl:versionInfo>
    <!-- The description literal is an HTML fragment stored as escaped text: its tags and character references are escaped, so an XML parser yields HTML source rather than child elements. -->
    <dct:description>&lt;p&gt;This anonymized data set consists of one month&amp;#39;s (October 2018) web tracking data of 2,148 German users. For each user, the data contains the anonymized URL of the webpage the user visited, the domain of the webpage, category of the domain, which provides 41 distinct categories. In total, these 2,148 users made 9,151,243 URL visits, spanning 49,918 unique domains. For each user in our data set, we have self-reported information (collected via a survey) about their gender and age.&lt;/p&gt; &lt;p&gt;We acknowledge the support of Respondi AG, which provided the web tracking and survey data&amp;nbsp;free of charge for research purposes, with special thanks to Fran&amp;ccedil;ois Erner and Luc Kalaora at Respondi for their insights and help with data extraction.&lt;/p&gt; &lt;p&gt;The&amp;nbsp;data set is analyzed in the following paper:&amp;nbsp;&lt;/p&gt; &lt;ul&gt; &lt;li&gt;Kulshrestha, J., Oliveira, M., Karacalik, O., Bonnay, D., Wagner, C. &amp;quot;&lt;em&gt;Web Routineness and Limits of Predictability: Investigating Demographic and Behavioral Differences Using Web Tracking Data&lt;/em&gt;&lt;strong&gt;.&lt;/strong&gt;&amp;quot; Proceedings of the International AAAI Conference on Web and Social Media. 2021.&amp;nbsp;&lt;a href="https://arxiv.org/abs/2012.15112"&gt;https://arxiv.org/abs/2012.15112&lt;/a&gt;.&amp;nbsp;&lt;/li&gt; &lt;/ul&gt; &lt;p&gt;The code used to analyze the data is also available at&amp;nbsp;&lt;a href="https://github.com/gesiscss/web_tracking"&gt;https://github.com/gesiscss/web_tracking&lt;/a&gt;.&lt;/p&gt; &lt;p&gt;&lt;strong&gt;If you use data or code from this repository, please cite the paper above and the Zenodo link.&lt;/strong&gt;&lt;/p&gt; &lt;p&gt;&amp;nbsp;&lt;/p&gt;</dct:description>
    <!-- Access rights are stated twice: as the EU Publications Office PUBLIC authority term and as the info:eu-repo openAccess rights statement. -->
    <dct:accessRights rdf:resource="http://publications.europa.eu/resource/authority/access-right/PUBLIC"/>
    <dct:accessRights>
      <dct:RightsStatement rdf:about="info:eu-repo/semantics/openAccess">
        <rdfs:label>Open Access</rdfs:label>
      </dct:RightsStatement>
    </dct:accessRights>
    <!-- Distribution carrying the licence (CC BY-NC 4.0 legal code URL); its access URL is the dataset DOI and no file is attached to it. -->
    <dcat:distribution>
      <dcat:Distribution>
        <dct:license rdf:resource="https://creativecommons.org/licenses/by-nc/4.0/legalcode"/>
        <dcat:accessURL rdf:resource="https://doi.org/10.5281/zenodo.4757574"/>
      </dcat:Distribution>
    </dcat:distribution>
    <!-- File distribution: README.txt. accessURL and downloadURL are IRI references (rdf:resource) rather than plain literals, as DCAT defines both with a resource range; byteSize is typed so consumers read it as a number. -->
    <dcat:distribution>
      <dcat:Distribution>
        <dcat:accessURL rdf:resource="https://doi.org/10.5281/zenodo.4757574"/>
        <dcat:byteSize rdf:datatype="http://www.w3.org/2001/XMLSchema#nonNegativeInteger">1323</dcat:byteSize>
        <dcat:downloadURL rdf:resource="https://zenodo.org/record/4757574/files/README.txt"/>
        <dcat:mediaType>text/plain</dcat:mediaType>
      </dcat:Distribution>
    </dcat:distribution>
    <!-- File distribution: web_tracking_code.zip. accessURL and downloadURL are IRI references (rdf:resource) rather than plain literals, as DCAT defines both with a resource range; byteSize is typed so consumers read it as a number. -->
    <dcat:distribution>
      <dcat:Distribution>
        <dcat:accessURL rdf:resource="https://doi.org/10.5281/zenodo.4757574"/>
        <dcat:byteSize rdf:datatype="http://www.w3.org/2001/XMLSchema#nonNegativeInteger">23818399</dcat:byteSize>
        <dcat:downloadURL rdf:resource="https://zenodo.org/record/4757574/files/web_tracking_code.zip"/>
        <dcat:mediaType>application/zip</dcat:mediaType>
      </dcat:Distribution>
    </dcat:distribution>
    <!-- File distribution: web_tracking_data.tar.gz. accessURL and downloadURL are IRI references (rdf:resource) rather than plain literals, as DCAT defines both with a resource range; byteSize is typed so consumers read it as a number. -->
    <dcat:distribution>
      <dcat:Distribution>
        <dcat:accessURL rdf:resource="https://doi.org/10.5281/zenodo.4757574"/>
        <dcat:byteSize rdf:datatype="http://www.w3.org/2001/XMLSchema#nonNegativeInteger">194055856</dcat:byteSize>
        <dcat:downloadURL rdf:resource="https://zenodo.org/record/4757574/files/web_tracking_data.tar.gz"/>
        <!-- NOTE(review): the file name ends in .tar.gz but the media type names only the tar container; confirm whether the gzip layer should also be declared (e.g. via dcat:compressFormat). -->
        <dcat:mediaType>application/x-tar</dcat:mediaType>
      </dcat:Distribution>
    </dcat:distribution>
  </rdf:Description>
</rdf:RDF>
224 views
58 downloads
Statistic | All versions | This version
Views | 224 | 112
Downloads | 58 | 27
Data volume | 3.1 GB | 3.1 GB
Unique views | 165 | 90
Unique downloads | 37 | 13

Share

Cite as