Zenodo.org will be unavailable for 2 hours on September 29th from 06:00-08:00 UTC. See announcement.

Conference paper Open Access

Elastic Embedded Background Linking for News Articles with Keywords, Entities and Events

Cabrera-Diego, Luis Adrián; Boros, Emanuela; Doucet, Antoine


DataCite XML Export

<?xml version="1.0" encoding="UTF-8"?>
<!--
  DataCite metadata record for DOI 10.5281/zenodo.6334523
  (conference paper published on Zenodo).

  The schemaLocation hint references the kernel-4.4 XSD because the
  resourceTypeGeneral value "ConferencePaper" used below is not part of the
  kernel-4.1 controlled list. The namespace URI itself is unchanged.
-->
<resource xmlns="http://datacite.org/schema/kernel-4"
          xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
          xsi:schemaLocation="http://datacite.org/schema/kernel-4 http://schema.datacite.org/meta/kernel-4.4/metadata.xsd">
  <identifier identifierType="DOI">10.5281/zenodo.6334523</identifier>
  <!-- Authors, in the order given on the record. -->
  <creators>
    <creator>
      <creatorName>Cabrera-Diego, Luis Adrián</creatorName>
      <givenName>Luis Adrián</givenName>
      <familyName>Cabrera-Diego</familyName>
      <affiliation>University of La Rochelle</affiliation>
    </creator>
    <creator>
      <creatorName>Boros, Emanuela</creatorName>
      <givenName>Emanuela</givenName>
      <familyName>Boros</familyName>
      <affiliation>University of La Rochelle</affiliation>
    </creator>
    <creator>
      <creatorName>Doucet, Antoine</creatorName>
      <givenName>Antoine</givenName>
      <familyName>Doucet</familyName>
      <affiliation>University of La Rochelle</affiliation>
    </creator>
  </creators>
  <titles>
    <title>Elastic Embedded Background Linking for News Articles with Keywords, Entities and Events</title>
  </titles>
  <publisher>Zenodo</publisher>
  <publicationYear>2022</publicationYear>
  <!-- One subject element per keyword so each term is individually addressable. -->
  <subjects>
    <subject>Information system</subject>
    <subject>Language models</subject>
    <subject>Rank aggregation</subject>
  </subjects>
  <dates>
    <date dateType="Issued">2022-03-07</date>
  </dates>
  <language>en</language>
  <resourceType resourceTypeGeneral="ConferencePaper"/>
  <alternateIdentifiers>
    <alternateIdentifier alternateIdentifierType="url">https://zenodo.org/record/6334523</alternateIdentifier>
  </alternateIdentifiers>
  <!-- Links to the all-versions DOI and to the hosting Zenodo community. -->
  <relatedIdentifiers>
    <relatedIdentifier relatedIdentifierType="DOI" relationType="IsVersionOf">10.5281/zenodo.6334522</relatedIdentifier>
    <relatedIdentifier relatedIdentifierType="URL" relationType="IsPartOf">https://zenodo.org/communities/newseye</relatedIdentifier>
  </relatedIdentifiers>
  <rightsList>
    <rights rightsURI="https://creativecommons.org/licenses/by/4.0/legalcode">Creative Commons Attribution 4.0 International</rights>
    <rights rightsURI="info:eu-repo/semantics/openAccess">Open Access</rights>
  </rightsList>
  <!-- The abstract is kept exactly as exported, including the escaped HTML paragraph wrapper. -->
  <descriptions>
    <description descriptionType="Abstract">&lt;p&gt;In this paper, we present a collection of five flexible background linking models created for the News Track in TREC 2021 that generate ranked lists of articles to provide contextual information. The collection is based on the use of sentence embeddings indexes, created with Sentence BERT and Open Distro for ElasticSearch. For each model, we explore additional tools, from keywords extraction using YAKE, to entity and event detection, while passing through a linear combination. The associated code is available online as open-source software.&lt;/p&gt;</description>
  </descriptions>
  <fundingReferences>
    <fundingReference>
      <funderName>European Commission</funderName>
      <funderIdentifier funderIdentifierType="Crossref Funder ID">10.13039/100010661</funderIdentifier>
      <awardNumber awardURI="info:eu-repo/grantAgreement/EC/H2020/770299/">770299</awardNumber>
      <awardTitle>NewsEye: A Digital Investigator for Historical Newspapers</awardTitle>
    </fundingReference>
  </fundingReferences>
</resource>
141 views
71 downloads
Statistic | All versions | This version
Views | 141 | 141
Downloads | 71 | 71
Data volume | 24.3 MB | 24.3 MB
Unique views | 130 | 130
Unique downloads | 67 | 67

Share

Cite as